mirror of
https://github.com/block/goose.git
synced 2026-05-19 16:27:54 +00:00
Add documentation for new provider SaladCloud AI Gateway (#9253)
This commit is contained in:
parent
688b6d706e
commit
809a82ea53
2 changed files with 49 additions and 0 deletions
48
crates/goose/src/providers/declarative/saladcloud.json
Normal file
48
crates/goose/src/providers/declarative/saladcloud.json
Normal file
|
|
@ -0,0 +1,48 @@
|
|||
{
|
||||
"name": "saladcloud",
|
||||
"engine": "openai",
|
||||
"display_name": "SaladCloud AI Gateway",
|
||||
"description": "OpenAI-compatible access to SaladCloud-hosted open-source models, including Qwen and Gemma",
|
||||
"api_key_env": "SALAD_CLOUD_API_KEY",
|
||||
"base_url": "https://ai.salad.cloud/v1/chat/completions",
|
||||
"models": [
|
||||
{
|
||||
"name": "qwen3.6-35b-a3b",
|
||||
"context_limit": 262144,
|
||||
"input_token_cost": 0.00000009,
|
||||
"output_token_cost": 0.0000006,
|
||||
"currency": "USD"
|
||||
},
|
||||
{
|
||||
"name": "qwen3.6-27b",
|
||||
"context_limit": 262144,
|
||||
"input_token_cost": 0.0000003,
|
||||
"output_token_cost": 0.0000012,
|
||||
"currency": "USD"
|
||||
},
|
||||
{
|
||||
"name": "qwen3.5-9b",
|
||||
"context_limit": 262144,
|
||||
"input_token_cost": 0.00000006,
|
||||
"output_token_cost": 0.00000009,
|
||||
"currency": "USD"
|
||||
},
|
||||
{
|
||||
"name": "gemma-4-26b-a4b-instruct",
|
||||
"context_limit": 262144,
|
||||
"input_token_cost": 0.00000004,
|
||||
"output_token_cost": 0.0000002,
|
||||
"currency": "USD"
|
||||
}
|
||||
],
|
||||
"supports_streaming": true,
|
||||
"dynamic_models": true,
|
||||
"skip_canonical_filtering": true,
|
||||
"model_doc_link": "https://docs.salad.com/ai-gateway/explanation/overview",
|
||||
"setup_steps": [
|
||||
"Register at https://portal.salad.com and enable access to the AI Gateway.",
|
||||
"Copy your API key from https://portal.salad.com/api-key and paste it above as SALAD_CLOUD_API_KEY.",
|
||||
"Select a supported model such as qwen3.6-35b-a3b."
|
||||
],
|
||||
"fast_model": "qwen3.5-9b"
|
||||
}
|
||||
|
|
@ -47,6 +47,7 @@ goose is compatible with a wide range of LLM providers, allowing you to choose a
|
|||
| [OVHcloud AI](https://www.ovhcloud.com/en/public-cloud/ai-endpoints/) | Provides access to open-source models including Qwen, Llama, Mistral, and DeepSeek through AI Endpoints service. | `OVHCLOUD_API_KEY` |
|
||||
| [Ramalama](https://ramalama.ai/) | Local model using native [OCI](https://opencontainers.org/) container runtimes, [CNCF](https://www.cncf.io/) tools, and supporting models as OCI artifacts. Ramalama API is a compatible alternative to Ollama and can be used with the goose Ollama provider. Supports Qwen, Llama, DeepSeek, and other open-source models. **Because this provider runs locally, you must first [download and run a model](#local-llms).** | `OLLAMA_HOST` |
|
||||
| [Routstr](https://routstr.com/) | OpenAI-compatible aggregator that fronts dozens of upstream providers (Anthropic, OpenAI, Google, DeepSeek, Llama, …) behind a single API. Authenticate with an `sk-...` bearer issued by your Routstr instance — payment is handled outside goose. | `ROUTSTR_API_KEY`, `ROUTSTR_HOST` (optional, default `https://api.routstr.com`) |
|
||||
| [SaladCloud AI Gateway](https://salad.com/) | OpenAI-compatible access to SaladCloud-hosted open-source models, including Qwen, Gemma, and others. | `SALAD_CLOUD_API_KEY` |
|
||||
| [Snowflake](https://docs.snowflake.com/user-guide/snowflake-cortex/aisql#choosing-a-model) | Access the latest models using Snowflake Cortex services, including Claude models. **Requires a Snowflake account and programmatic access token (PAT)**. | `SNOWFLAKE_HOST`, `SNOWFLAKE_TOKEN` |
|
||||
| [VMware Tanzu Platform](https://techdocs.broadcom.com/us/en/vmware-tanzu/platform/ai-services/10-3/ai/index.html) | Enterprise-managed LLM access through AI Services on VMware Tanzu Platform. Models are fetched dynamically from the endpoint. | `TANZU_AI_API_KEY`, `TANZU_AI_ENDPOINT` |
|
||||
| [Tetrate Agent Router Service](https://router.tetrate.ai) | Unified API gateway for AI models including Claude, Gemini, GPT, open-weight models, and others. Supports PKCE authentication flow for secure API key generation. | `TETRATE_API_KEY`, `TETRATE_HOST` (optional) |
|
||||
|
|
|
|||
Loading…
Add table
Add a link
Reference in a new issue