aaif-goose · DOsinga · May 18, 2026 · May 15, 2026
diff --git a/crates/goose/src/providers/declarative/saladcloud.json b/crates/goose/src/providers/declarative/saladcloud.json
@@ -0,0 +1,48 @@
+{
+  "name": "saladcloud",
+  "engine": "openai",
+  "display_name": "SaladCloud AI Gateway",
+  "description": "OpenAI-compatible access to SaladCloud-hosted open-source models, including Qwen and Gemma",
+  "api_key_env": "SALAD_CLOUD_API_KEY",
+  "base_url": "https://ai.salad.cloud/v1/chat/completions",
+  "models": [
+    {
+      "name": "qwen3.6-35b-a3b",
+      "context_limit": 262144,
+      "input_token_cost": 0.00000009,
+      "output_token_cost": 0.0000006,
+      "currency": "USD"
+    },
+    {
+      "name": "qwen3.6-27b",
+      "context_limit": 262144,
+      "input_token_cost": 0.0000003,
+      "output_token_cost": 0.0000012,
+      "currency": "USD"
+    },
+    {
+      "name": "qwen3.5-9b",
+      "context_limit": 262144,
+      "input_token_cost": 0.00000006,
+      "output_token_cost": 0.00000009,
+      "currency": "USD"
+    },
+    {
+      "name": "gemma-4-26b-a4b-instruct",
+      "context_limit": 262144,
+      "input_token_cost": 0.00000004,
+      "output_token_cost": 0.0000002,
+      "currency": "USD"
+    }
+  ],
+  "supports_streaming": true,
+  "dynamic_models": true,
+  "skip_canonical_filtering": true,
+  "model_doc_link": "https://docs.salad.com/ai-gateway/explanation/overview",
+  "setup_steps": [
+    "Register at https://portal.salad.com and enable access to the AI Gateway.",
+    "Copy your API key from https://portal.salad.com/api-key and paste it above as SALAD_CLOUD_API_KEY.",
+    "Select a supported model such as qwen3.6-35b-a3b."
+  ],
+  "fast_model": "qwen3.5-9b"
+}
diff --git a/documentation/docs/getting-started/providers.md b/documentation/docs/getting-started/providers.md
@@ -46,6 +46,7 @@ goose is compatible with a wide range of LLM providers, allowing you to choose a
 | [OVHcloud AI](https://www.ovhcloud.com/en/public-cloud/ai-endpoints/)       | Provides access to open-source models including Qwen, Llama, Mistral, and DeepSeek through AI Endpoints service.                                                       | `OVHCLOUD_API_KEY`                                                                                                                                                                  |
 | [Ramalama](https://ramalama.ai/)                                            | Local model using native [OCI](https://opencontainers.org/) container runtimes, [CNCF](https://www.cncf.io/) tools, and supporting models as OCI artifacts. Ramalama API is a compatible alternative to Ollama and can be used with the goose Ollama provider. Supports Qwen, Llama, DeepSeek, and other open-source models. **Because this provider runs locally, you must first [download and run a model](#local-llms).**  | `OLLAMA_HOST`                                                                                                                                                                       |
 | [Routstr](https://routstr.com/)                                             | OpenAI-compatible aggregator that fronts dozens of upstream providers (Anthropic, OpenAI, Google, DeepSeek, Llama, …) behind a single API. Authenticate with an `sk-...` bearer issued by your Routstr instance — payment is handled outside goose.                                                                                                                                                                       | `ROUTSTR_API_KEY`, `ROUTSTR_HOST` (optional, default `https://api.routstr.com`)                                                                                                     |
+| [SaladCloud AI Gateway](https://salad.com/)                                 | OpenAI-compatible access to SaladCloud-hosted open-source models, including Qwen, Gemma, and others.                                                                                                          | `SALAD_CLOUD_API_KEY`                                                                                                                                                              |
 | [Snowflake](https://docs.snowflake.com/user-guide/snowflake-cortex/aisql#choosing-a-model) | Access the latest models using Snowflake Cortex services, including Claude models. **Requires a Snowflake account and programmatic access token (PAT)**.                                                     | `SNOWFLAKE_HOST`, `SNOWFLAKE_TOKEN`                                                                                                                                                                 |
 | [VMware Tanzu Platform](https://techdocs.broadcom.com/us/en/vmware-tanzu/platform/ai-services/10-3/ai/index.html) | Enterprise-managed LLM access through AI Services on VMware Tanzu Platform. Models are fetched dynamically from the endpoint. | `TANZU_AI_API_KEY`, `TANZU_AI_ENDPOINT` |
 | [Tetrate Agent Router Service](https://router.tetrate.ai)                   | Unified API gateway for AI models including Claude, Gemini, GPT, open-weight models, and others. Supports PKCE authentication flow for secure API key generation.                                                                                | `TETRATE_API_KEY`, `TETRATE_HOST` (optional)                                                                                                                                        |