diff --git a/Cargo.lock b/Cargo.lock index 3824589312e4..c4b75e7f5efb 100644 --- a/Cargo.lock +++ b/Cargo.lock @@ -4365,7 +4365,7 @@ dependencies = [ [[package]] name = "goose" -version = "1.34.1" +version = "1.34.2" dependencies = [ "agent-client-protocol", "agent-client-protocol-schema", @@ -4492,7 +4492,7 @@ dependencies = [ [[package]] name = "goose-acp-macros" -version = "1.34.1" +version = "1.34.2" dependencies = [ "quote", "syn 2.0.117", @@ -4500,7 +4500,7 @@ dependencies = [ [[package]] name = "goose-cli" -version = "1.34.1" +version = "1.34.2" dependencies = [ "anstream", "anyhow", @@ -4552,7 +4552,7 @@ dependencies = [ [[package]] name = "goose-mcp" -version = "1.34.1" +version = "1.34.2" dependencies = [ "anyhow", "base64 0.22.1", @@ -4582,7 +4582,7 @@ dependencies = [ [[package]] name = "goose-sdk" -version = "1.34.1" +version = "1.34.2" dependencies = [ "agent-client-protocol", "agent-client-protocol-schema", @@ -4595,7 +4595,7 @@ dependencies = [ [[package]] name = "goose-server" -version = "1.34.1" +version = "1.34.2" dependencies = [ "anyhow", "aws-lc-rs", @@ -4643,7 +4643,7 @@ dependencies = [ [[package]] name = "goose-test" -version = "1.34.1" +version = "1.34.2" dependencies = [ "clap", "serde_json", @@ -4651,7 +4651,7 @@ dependencies = [ [[package]] name = "goose-test-support" -version = "1.34.1" +version = "1.34.2" dependencies = [ "axum", "env-lock", diff --git a/Cargo.toml b/Cargo.toml index 12bef637904c..fab837a02ad6 100644 --- a/Cargo.toml +++ b/Cargo.toml @@ -9,7 +9,7 @@ resolver = "2" [workspace.package] edition = "2021" -version = "1.34.1" +version = "1.34.2" rust-version = "1.91.1" authors = ["AAIF "] license = "Apache-2.0" diff --git a/crates/goose/src/providers/canonical/data/canonical_models.json b/crates/goose/src/providers/canonical/data/canonical_models.json index dad61fd29090..5221c44057c4 100644 --- a/crates/goose/src/providers/canonical/data/canonical_models.json +++ b/crates/goose/src/providers/canonical/data/canonical_models.json @@ -167,7 +167,7 @@ }, { "id": "302ai/claude-3.5-haiku", - "name": "claude-3-5-haiku-20241022", + "name": "claude-3-5-haiku-latest", "family": "claude-haiku", "attachment": true, "reasoning": false, @@ -505,7 +505,7 @@ }, { "id": "302ai/claude-sonnet-4.5", - "name": "claude-sonnet-4-5-20250929", + "name": "claude-sonnet-4-5", "family": "claude-sonnet", "attachment": true, "reasoning": true, @@ -13282,7 +13282,7 @@ }, { "id": "anthropic/claude-3.5-haiku", - "name": "Claude Haiku 3.5", + "name": "Claude Haiku 3.5 (latest)", "family": "claude-haiku", "attachment": true, "reasoning": false, @@ -13315,15 +13315,15 @@ }, { "id": "anthropic/claude-3.5-sonnet", - "name": "Claude Sonnet 3.5 v2", + "name": "Claude Sonnet 3.5", "family": "claude-sonnet", "attachment": true, "reasoning": false, "tool_call": true, "temperature": true, "knowledge": "2024-04-30", - "release_date": "2024-10-22", - "last_updated": "2024-10-22", + "release_date": "2024-06-20", + "last_updated": "2024-06-20", "modalities": { "input": [ "text", @@ -13480,7 +13480,7 @@ }, { "id": "anthropic/claude-opus-4.1", - "name": "Claude Opus 4.1 (latest)", + "name": "Claude Opus 4.1", "family": "claude-opus", "attachment": true, "reasoning": true, @@ -13678,7 +13678,7 @@ }, { "id": "anthropic/claude-sonnet-4.5", - "name": "Claude Sonnet 4.5", + "name": "Claude Sonnet 4.5 (latest)", "family": "claude-sonnet", "attachment": true, "reasoning": true, @@ -13742,6 +13742,148 @@ "output": 64000 } }, + { + "id": "atomic-chat/Meta-Llama-3_1-8B-Instruct-GGUF", + "name": "Meta Llama 3.1 8B Instruct (GGUF)", + "family": "llama", + "attachment": false, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2024-07-23", + "last_updated": "2024-07-23", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 131072, + "output": 4096 + } + }, + { + "id": "atomic-chat/Qwen3_5-9B-MLX-4bit", + "name": "Qwen 3.5 9B (MLX 4-bit)", + "family": "qwen", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2026-03-05", + "last_updated": "2026-04-04", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 32768, + "output": 8192 + } + }, + { + "id": "atomic-chat/Qwen3_5-9B-Q4_K_M", + "name": "Qwen 3.5 9B (Q4_K_M)", + "family": "qwen", + "attachment": true, + "reasoning": false, + "tool_call": true, + "temperature": true, + "release_date": "2026-03-05", + "last_updated": "2026-04-04", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 32768, + "output": 8192 + } + }, + { + "id": "atomic-chat/gemma-4-E4B-it-IQ4_XS", + "name": "Gemma 4 E4B Instruct (IQ4_XS)", + "family": "gemma", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "release_date": "2026-04-02", + "last_updated": "2026-04-02", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 32768, + "output": 8192 + } + }, + { + "id": "atomic-chat/gemma-4-E4B-it-MLX-4bit", + "name": "Gemma 4 E4B Instruct (MLX 4-bit)", + "family": "gemma", + "attachment": false, + "reasoning": false, + "tool_call": false, + "temperature": true, + "release_date": "2026-04-02", + "last_updated": "2026-04-02", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.0, + "output": 0.0 + }, + "limit": { + "context": 32768, + "output": 8192 + } + }, { "id": "auriko/claude-opus-4.6", "name": "Claude Opus 4.6", @@ -14758,15 +14900,15 @@ }, { "id": "azure-cognitive-services/gpt-3.5-turbo", - "name": "GPT-3.5 Turbo 0301", + "name": "GPT-3.5 Turbo 0125", "family": "gpt", "attachment": false, "reasoning": false, "tool_call": false, "temperature": true, "knowledge": "2021-08", - "release_date": "2023-03-01", - "last_updated": "2023-03-01", + "release_date": "2024-01-25", + "last_updated": "2024-01-25", "modalities": { "input": [ "text" @@ -14777,12 +14919,12 @@ }, "open_weights": false, "cost": { - "input": 1.5, - "output": 2.0 + "input": 0.5, + "output": 1.5 }, "limit": { - "context": 4096, - "output": 4096 + "context": 16384, + "output": 16384 } }, { @@ -16874,10 +17016,10 @@ }, { "id": "azure-cognitive-services/phi-4", - "name": "Phi-4", + "name": "Phi-4-reasoning", "family": "phi", "attachment": false, - "reasoning": false, + "reasoning": true, "tool_call": false, "temperature": true, "knowledge": "2023-10", @@ -16897,16 +17039,16 @@ "output": 0.5 }, "limit": { - "context": 128000, + "context": 32000, "output": 4096 } }, { "id": "azure-cognitive-services/phi-4-mini", - "name": "Phi-4-mini", + "name": "Phi-4-mini-reasoning", "family": "phi", "attachment": false, - "reasoning": false, + "reasoning": true, "tool_call": true, "temperature": true, "knowledge": "2023-10", @@ -19943,10 +20085,10 @@ }, { "id": "azure/phi-4", - "name": "Phi-4-reasoning", + "name": "Phi-4", "family": "phi", "attachment": false, - "reasoning": true, + "reasoning": false, "tool_call": false, "temperature": true, "knowledge": "2023-10", @@ -19966,16 +20108,16 @@ "output": 0.5 }, "limit": { - "context": 32000, + "context": 128000, "output": 4096 } }, { "id": "azure/phi-4-mini", - "name": "Phi-4-mini-reasoning", + "name": "Phi-4-mini", "family": "phi", "attachment": false, - "reasoning": true, + "reasoning": false, "tool_call": true, "temperature": true, "knowledge": "2023-10", @@ -35347,7 +35489,7 @@ }, { "id": "github-models/microsoft/phi-4", - "name": "Phi-4-Reasoning", + "name": "Phi-4", "family": "phi", "attachment": false, "reasoning": true, @@ -35370,7 +35512,7 @@ "output": 0.0 }, "limit": { - "context": 128000, + "context": 16000, "output": 4096 } }, @@ -36497,6 +36639,244 @@ "output": 64000 } }, + { + "id": "gmicloud/anthropic/claude-opus-4.6", + "name": "Claude Opus 4.6", + "family": "claude-opus", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-05-31", + "release_date": "2026-02-05", + "last_updated": "2026-03-13", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 5.0, + "output": 25.0, + "cache_read": 0.5 + }, + "limit": { + "context": 409600, + "output": 128000 + } + }, + { + "id": "gmicloud/anthropic/claude-opus-4.7", + "name": "Claude Opus 4.7", + "family": "claude-opus", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": false, + "knowledge": "2026-01-31", + "release_date": "2026-04-16", + "last_updated": "2026-04-16", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 4.5, + "output": 22.5, + "cache_read": 0.45 + }, + "limit": { + "context": 409600, + "output": 128000 + } + }, + { + "id": "gmicloud/anthropic/claude-sonnet-4.6", + "name": "Claude Sonnet 4.6", + "family": "claude-sonnet", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-08-31", + "release_date": "2026-02-17", + "last_updated": "2026-03-13", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 3.0, + "output": 15.0, + "cache_read": 0.3 + }, + "limit": { + "context": 409600, + "output": 64000 + } + }, + { + "id": "gmicloud/deepseek-ai/DeepSeek-V4-Flash", + "name": "DeepSeek V4 Flash", + "family": "deepseek-flash", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-05", + "release_date": "2026-04-24", + "last_updated": "2026-04-24", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.112, + "output": 0.224, + "cache_read": 0.022 + }, + "limit": { + "context": 1048575, + "output": 384000 + } + }, + { + "id": "gmicloud/deepseek-ai/DeepSeek-V4-Pro", + "name": "DeepSeek V4 Pro", + "family": "deepseek-thinking", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-05", + "release_date": "2026-04-24", + "last_updated": "2026-04-24", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 1.392, + "output": 2.784, + "cache_read": 0.116 + }, + "limit": { + "context": 1048576, + "output": 384000 + } + }, + { + "id": "gmicloud/moonshotai/Kimi-K2.6", + "name": "Kimi K2.6", + "family": "kimi-k2.6", + "attachment": true, + "reasoning": true, + "tool_call": true, + "temperature": true, + "knowledge": "2025-01", + "release_date": "2026-04-21", + "last_updated": "2026-04-21", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.855, + "output": 3.6, + "cache_read": 0.144 + }, + "limit": { + "context": 65536, + "output": 65536 + } + }, + { + "id": "gmicloud/zai-org/GLM-5-FP8", + "name": "GLM-5", + "family": "glm", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2026-02-11", + "last_updated": "2026-02-11", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": true, + "cost": { + "input": 0.6, + "output": 1.92, + "cache_read": 0.12 + }, + "limit": { + "context": 202752, + "output": 131072 + } + }, + { + "id": "gmicloud/zai-org/GLM-5.1-FP8", + "name": "GLM-5.1", + "family": "glm", + "attachment": false, + "reasoning": true, + "tool_call": true, + "temperature": true, + "release_date": "2026-03-27", + "last_updated": "2026-03-27", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "open_weights": false, + "cost": { + "input": 0.98, + "output": 3.08, + "cache_read": 0.182 + }, + "limit": { + "context": 202752, + "output": 131072 + } + }, { "id": "google-vertex-anthropic/claude-3.5-haiku", "name": "Claude Haiku 3.5", @@ -40041,15 +40421,15 @@ }, { "id": "groq/moonshotai/kimi-k2-instruct", - "name": "Kimi K2 Instruct", + "name": "Kimi K2 Instruct 0905", "family": "kimi", "attachment": false, "reasoning": false, "tool_call": true, "temperature": true, "knowledge": "2024-10", - "release_date": "2025-07-14", - "last_updated": "2025-07-14", + "release_date": "2025-09-05", + "last_updated": "2025-09-05", "modalities": { "input": [ "text" @@ -40064,7 +40444,7 @@ "output": 3.0 }, "limit": { - "context": 131072, + "context": 262144, "output": 16384 } }, @@ -40590,7 +40970,7 @@ }, { "id": "helicone/claude-opus-4.1", - "name": "Anthropic: Claude Opus 4.1", + "name": "Anthropic: Claude Opus 4.1 (20250805)", "family": "claude-opus", "attachment": false, "reasoning": true, @@ -41908,15 +42288,15 @@ }, { "id": "helicone/kimi-k2", - "name": "Kimi K2 (07/11)", + "name": "Kimi K2 (09/05)", "family": "kimi", "attachment": false, "reasoning": false, "tool_call": true, "temperature": true, - "knowledge": "2025-01", - "release_date": "2025-01-01", - "last_updated": "2025-01-01", + "knowledge": "2025-09", + "release_date": "2025-09-05", + "last_updated": "2025-09-05", "modalities": { "input": [ "text" @@ -41927,11 +42307,12 @@ }, "open_weights": false, "cost": { - "input": 0.5700000000000001, - "output": 2.3 + "input": 0.5, + "output": 2.0, + "cache_read": 0.39999999999999997 }, "limit": { - "context": 131072, + "context": 262144, "output": 16384 } }, @@ -42772,10 +43153,10 @@ }, { "id": "helicone/sonar", - "name": "Perplexity Sonar", - "family": "sonar", + "name": "Perplexity Sonar Reasoning", + "family": "sonar-reasoning", "attachment": false, - "reasoning": false, + "reasoning": true, "tool_call": false, "temperature": true, "knowledge": "2025-01", @@ -42792,7 +43173,7 @@ "open_weights": false, "cost": { "input": 1.0, - "output": 1.0 + "output": 5.0 }, "limit": { "context": 127000, @@ -51473,13 +51854,13 @@ }, { "id": "kilo/openai/gpt-4", - "name": "OpenAI: GPT-4", + "name": "OpenAI: GPT-4 (older v0314)", "attachment": false, "reasoning": false, "tool_call": true, "temperature": true, - "release_date": "2023-03-14", - "last_updated": "2024-04-09", + "release_date": "2023-05-28", + "last_updated": "2026-03-15", "modalities": { "input": [ "text" @@ -51672,12 +52053,12 @@ }, { "id": "kilo/openai/gpt-4o", - "name": "OpenAI: GPT-4o (2024-08-06)", + "name": "OpenAI: GPT-4o (2024-11-20)", "attachment": true, "reasoning": false, "tool_call": true, "temperature": true, - "release_date": "2024-08-06", + "release_date": "2024-11-20", "last_updated": "2026-03-15", "modalities": { "input": [ @@ -53511,13 +53892,13 @@ }, { "id": "kilo/qwen/qwen-plus", - "name": "Qwen: Qwen-Plus", + "name": "Qwen: Qwen Plus 0728", "attachment": false, "reasoning": false, "tool_call": true, "temperature": true, - "release_date": "2024-01-25", - "last_updated": "2025-09-11", + "release_date": "2025-09-09", + "last_updated": "2026-03-15", "modalities": { "input": [ "text" @@ -53526,11 +53907,10 @@ "text" ] }, - "open_weights": false, + "open_weights": true, "cost": { - "input": 0.4, - "output": 1.2, - "cache_read": 0.08 + "input": 0.26, + "output": 0.78 }, "limit": { "context": 1000000, @@ -53708,13 +54088,13 @@ }, { "id": "kilo/qwen/qwen3-235b-a22b", - "name": "Qwen: Qwen3 235B A22B", + "name": "Qwen: Qwen3 235B A22B Instruct 2507", "attachment": false, "reasoning": true, "tool_call": true, "temperature": true, - "release_date": "2024-12-01", - "last_updated": "2026-03-15", + "release_date": "2025-04", + "last_updated": "2026-01", "modalities": { "input": [ "text" @@ -53725,13 +54105,12 @@ }, "open_weights": true, "cost": { - "input": 0.455, - "output": 1.82, - "cache_read": 0.15 + "input": 0.071, + "output": 0.1 }, "limit": { - "context": 131072, - "output": 8192 + "context": 262144, + "output": 52429 } }, { @@ -56922,7 +57301,7 @@ }, { "id": "llmgateway/claude-sonnet-4.5", - "name": "Claude Sonnet 4.5", + "name": "Claude Sonnet 4.5 (latest)", "family": "claude-sonnet", "attachment": true, "reasoning": true, @@ -64129,15 +64508,15 @@ }, { "id": "mistralai/mistral-small", - "name": "Mistral Small 3.2", + "name": "Mistral Small 4", "family": "mistral-small", - "attachment": false, - "reasoning": false, + "attachment": true, + "reasoning": true, "tool_call": true, "temperature": true, - "knowledge": "2025-03", - "release_date": "2025-06-20", - "last_updated": "2025-06-20", + "knowledge": "2025-06", + "release_date": "2026-03-16", + "last_updated": "2026-03-16", "modalities": { "input": [ "text", @@ -64149,12 +64528,12 @@ }, "open_weights": true, "cost": { - "input": 0.1, - "output": 0.3 + "input": 0.15, + "output": 0.6 }, "limit": { - "context": 128000, - "output": 16384 + "context": 256000, + "output": 256000 } }, { @@ -70210,16 +70589,17 @@ }, { "id": "nano-gpt/claude-3.5-sonnet", - "name": "Claude 3.5 Sonnet", + "name": "Claude 3.5 Sonnet Old", "attachment": true, "reasoning": false, "tool_call": true, - "release_date": "2025-08-26", - "last_updated": "2025-08-26", + "release_date": "2024-06-20", + "last_updated": "2024-06-20", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" @@ -73434,12 +73814,12 @@ }, { "id": "nano-gpt/glm-4-air", - "name": "GLM 4 Air 0111", + "name": "GLM-4 Air", "attachment": false, "reasoning": false, "tool_call": false, - "release_date": "2025-01-11", - "last_updated": "2025-01-11", + "release_date": "2024-06-05", + "last_updated": "2024-06-05", "modalities": { "input": [ "text" @@ -73450,8 +73830,8 @@ }, "open_weights": false, "cost": { - "input": 0.1394, - "output": 0.1394 + "input": 0.2006, + "output": 0.2006 }, "limit": { "context": 128000, @@ -73538,12 +73918,12 @@ }, { "id": "nano-gpt/glm-4-plus", - "name": "GLM 4 Plus 0111", + "name": "GLM-4 Plus", "attachment": false, "reasoning": false, "tool_call": false, - "release_date": "2025-02-19", - "last_updated": "2025-02-19", + "release_date": "2024-08-01", + "last_updated": "2024-08-01", "modalities": { "input": [ "text" @@ -73554,8 +73934,8 @@ }, "open_weights": false, "cost": { - "input": 9.996, - "output": 9.996 + "input": 7.497, + "output": 7.497 }, "limit": { "context": 128000, @@ -76135,13 +76515,13 @@ }, { "id": "nano-gpt/openai/gpt-4o", - "name": "GPT-4o (2024-08-06)", + "name": "GPT-4o (2024-11-20)", "family": "gpt", "attachment": true, "reasoning": false, "tool_call": false, - "release_date": "2024-08-06", - "last_updated": "2024-08-06", + "release_date": "2024-11-20", + "last_updated": "2024-11-20", "modalities": { "input": [ "text", @@ -76153,8 +76533,8 @@ }, "open_weights": false, "cost": { - "input": 2.499, - "output": 9.996 + "input": 2.5, + "output": 10.0 }, "limit": { "context": 128000, @@ -76414,18 +76794,16 @@ }, { "id": "nano-gpt/openai/gpt-5.1", - "name": "GPT 5.1", + "name": "GPT-5.1 (2025-11-13)", "family": "gpt", - "attachment": true, - "reasoning": true, - "tool_call": true, + "attachment": false, + "reasoning": false, + "tool_call": false, "release_date": "2025-11-13", "last_updated": "2025-11-13", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" @@ -76437,8 +76815,8 @@ "output": 10.0 }, "limit": { - "context": 400000, - "output": 128000 + "context": 1000000, + "output": 32768 } }, { @@ -78581,11 +78959,11 @@ }, { "id": "nano-gpt/x-ai/grok-4.1-fast", - "name": "Grok 4.1 Fast", + "name": "Grok 4.1 Fast Reasoning", "family": "grok", "attachment": true, "reasoning": true, - "tool_call": true, + "tool_call": false, "release_date": "2025-11-20", "last_updated": "2025-11-20", "modalities": { @@ -85525,14 +85903,14 @@ }, { "id": "nvidia/moonshotai/kimi-k2-instruct", - "name": "Kimi K2 Instruct", + "name": "Kimi K2 0905", "family": "kimi", "attachment": false, - "reasoning": true, + "reasoning": false, "tool_call": true, "temperature": true, - "knowledge": "2024-01", - "release_date": "2025-01-01", + "knowledge": "2024-10", + "release_date": "2025-09-05", "last_updated": "2025-09-05", "modalities": { "input": [ @@ -85542,14 +85920,14 @@ "text" ] }, - "open_weights": false, + "open_weights": true, "cost": { "input": 0.0, "output": 0.0 }, "limit": { - "context": 128000, - "output": 8192 + "context": 262144, + "output": 262144 } }, { @@ -88101,15 +88479,15 @@ }, { "id": "openai/gpt-4o", - "name": "GPT-4o (2024-08-06)", + "name": "GPT-4o (2024-11-20)", "family": "gpt", "attachment": true, "reasoning": false, "tool_call": true, "temperature": true, "knowledge": "2023-09", - "release_date": "2024-08-06", - "last_updated": "2024-08-06", + "release_date": "2024-11-20", + "last_updated": "2024-11-20", "modalities": { "input": [ "text", @@ -91608,16 +91986,18 @@ "id": "opencode/qwen3.6-plus-free", "name": "Qwen3.6 Plus Free", "family": "qwen-free", - "attachment": false, + "attachment": true, "reasoning": true, "tool_call": true, "temperature": true, - "knowledge": "2024-12", - "release_date": "2026-03-30", - "last_updated": "2026-03-30", + "knowledge": "2025-04", + "release_date": "2026-04-02", + "last_updated": "2026-04-02", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" @@ -91630,8 +92010,8 @@ "cache_read": 0.0 }, "limit": { - "context": 1048576, - "output": 64000 + "context": 262144, + "output": 65536 } }, { @@ -104536,16 +104916,19 @@ }, { "id": "qiniu-ai/x-ai/grok-4.1-fast", - "name": "x-AI/Grok-4.1-Fast", - "attachment": false, + "name": "X-Ai/Grok 4.1 Fast Reasoning", + "attachment": true, "reasoning": true, "tool_call": true, "temperature": true, - "release_date": "2025-11-20", - "last_updated": "2025-11-20", + "release_date": "2025-12-19", + "last_updated": "2025-12-19", "modalities": { "input": [ - "text" + "text", + "image", + "audio", + "video" ], "output": [ "text" @@ -104554,7 +104937,7 @@ "open_weights": false, "cost": {}, "limit": { - "context": 2000000, + "context": 20000000, "output": 2000000 } }, @@ -122099,19 +122482,18 @@ }, { "id": "vercel/perplexity/sonar", - "name": "Sonar", - "family": "sonar", - "attachment": true, - "reasoning": false, - "tool_call": true, + "name": "Sonar Reasoning", + "family": "sonar-reasoning", + "attachment": false, + "reasoning": true, + "tool_call": false, "temperature": true, - "knowledge": "2025-02", + "knowledge": "2025-09", "release_date": "2025-02-19", "last_updated": "2025-02-19", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" @@ -122120,7 +122502,7 @@ "open_weights": false, "cost": { "input": 1.0, - "output": 1.0 + "output": 5.0 }, "limit": { "context": 127000, @@ -124862,7 +125244,7 @@ }, { "id": "x-ai/grok-2-vision", - "name": "Grok 2 Vision", + "name": "Grok 2 Vision (1212)", "family": "grok", "attachment": true, "reasoning": false, @@ -124870,7 +125252,7 @@ "temperature": true, "knowledge": "2024-08", "release_date": "2024-08-20", - "last_updated": "2024-08-20", + "last_updated": "2024-12-12", "modalities": { "input": [ "text", @@ -124923,7 +125305,7 @@ }, { "id": "x-ai/grok-3-fast", - "name": "Grok 3 Fast", + "name": "Grok 3 Fast Latest", "family": "grok", "attachment": false, "reasoning": false, @@ -124953,7 +125335,7 @@ }, { "id": "x-ai/grok-3-mini", - "name": "Grok 3 Mini Latest", + "name": "Grok 3 Mini", "family": "grok", "attachment": false, "reasoning": true, @@ -124983,7 +125365,7 @@ }, { "id": "x-ai/grok-3-mini-fast", - "name": "Grok 3 Mini Fast", + "name": "Grok 3 Mini Fast Latest", "family": "grok", "attachment": false, "reasoning": true, diff --git a/crates/goose/src/providers/canonical/data/provider_metadata.json b/crates/goose/src/providers/canonical/data/provider_metadata.json index ef58aa071399..8b0a6078abe8 100644 --- a/crates/goose/src/providers/canonical/data/provider_metadata.json +++ b/crates/goose/src/providers/canonical/data/provider_metadata.json @@ -1,36 +1,36 @@ [ { - "id": "helicone", - "display_name": "Helicone", + "id": "302ai", + "display_name": "302.AI", "npm": "@ai-sdk/openai-compatible", - "api": "https://ai-gateway.helicone.ai/v1", - "doc": "https://helicone.ai/models", + "api": "https://api.302.ai/v1", + "doc": "https://doc.302.ai", "env": [ - "HELICONE_API_KEY" + "302AI_API_KEY" ], - "model_count": 90 + "model_count": 97 }, { - "id": "auriko", - "display_name": "Auriko", + "id": "alibaba", + "display_name": "Alibaba", "npm": "@ai-sdk/openai-compatible", - "api": "https://api.auriko.ai/v1", - "doc": "https://docs.auriko.ai", + "api": "https://dashscope-intl.aliyuncs.com/compatible-mode/v1", + "doc": "https://www.alibabacloud.com/help/en/model-studio/models", "env": [ - "AURIKO_API_KEY" + "DASHSCOPE_API_KEY" ], - "model_count": 15 + "model_count": 48 }, { - "id": "firepass", - "display_name": "Fireworks (Firepass)", + "id": "scaleway", + "display_name": "Scaleway", "npm": "@ai-sdk/openai-compatible", - "api": "https://api.fireworks.ai/inference/v1/", - "doc": "https://docs.fireworks.ai/firepass", + "api": "https://api.scaleway.ai/v1", + "doc": "https://www.scaleway.com/en/docs/generative-apis/", "env": [ - "FIREPASS_API_KEY" + "SCALEWAY_API_KEY" ], - "model_count": 1 + "model_count": 16 }, { "id": "nano-gpt", @@ -44,26 +44,37 @@ "model_count": 525 }, { - "id": "io-net", - "display_name": "IO.NET", + "id": "abacus", + "display_name": "Abacus", "npm": "@ai-sdk/openai-compatible", - "api": "https://api.intelligence.io.solutions/api/v1", - "doc": "https://io.net/docs/guides/intelligence/io-intelligence", + "api": "https://routellm.abacus.ai/v1", + "doc": "https://abacus.ai/help/api", "env": [ - "IOINTELLIGENCE_API_KEY" + "ABACUS_API_KEY" ], - "model_count": 17 + "model_count": 65 }, { - "id": "inception", - "display_name": "Inception", + "id": "perplexity-agent", + "display_name": "Perplexity Agent", + "npm": "@ai-sdk/openai", + "api": "https://api.perplexity.ai/v1", + "doc": "https://docs.perplexity.ai/docs/agent-api/models", + "env": [ + "PERPLEXITY_API_KEY" + ], + "model_count": 18 + }, + { + "id": "siliconflow-cn", + "display_name": "SiliconFlow (China)", "npm": "@ai-sdk/openai-compatible", - "api": "https://api.inceptionlabs.ai/v1/", - "doc": "https://platform.inceptionlabs.ai/docs", + "api": "https://api.siliconflow.cn/v1", + "doc": "https://cloud.siliconflow.com/models", "env": [ - "INCEPTION_API_KEY" + "SILICONFLOW_CN_API_KEY" ], - "model_count": 2 + "model_count": 81 }, { "id": "submodel", @@ -77,81 +88,59 @@ "model_count": 9 }, { - "id": "requesty", - "display_name": "Requesty", - "npm": "@ai-sdk/openai-compatible", - "api": "https://router.requesty.ai/v1", - "doc": "https://requesty.ai/solution/llm-routing/models", - "env": [ - "REQUESTY_API_KEY" - ], - "model_count": 38 - }, - { - "id": "zai", - "display_name": "Z.AI", - "npm": "@ai-sdk/openai-compatible", - "api": "https://api.z.ai/api/paas/v4", - "doc": "https://docs.z.ai/guides/overview/pricing", - "env": [ - "ZHIPU_API_KEY" - ], - "model_count": 13 - }, - { - "id": "zai-coding-plan", - "display_name": "Z.AI Coding Plan", - "npm": "@ai-sdk/openai-compatible", - "api": "https://api.z.ai/api/coding/paas/v4", - "doc": "https://docs.z.ai/devpack/overview", + "id": "minimax-coding-plan", + "display_name": "MiniMax Token Plan (minimax.io)", + "npm": "@ai-sdk/anthropic", + "api": "https://api.minimax.io/anthropic/v1", + "doc": "https://platform.minimax.io/docs/token-plan/intro", "env": [ - "ZHIPU_API_KEY" + "MINIMAX_API_KEY" ], - "model_count": 5 + "model_count": 6 }, { - "id": "clarifai", - "display_name": "Clarifai", + "id": "claudinio", + "display_name": "Claudinio", "npm": "@ai-sdk/openai-compatible", - "api": "https://api.clarifai.com/v2/ext/openai/v1", - "doc": "https://docs.clarifai.com/compute/inference/", + "api": "https://api.claudin.io/v1", + "doc": "https://claudin.io", "env": [ - "CLARIFAI_PAT" + "CLAUDINIO_API_KEY" ], - "model_count": 12 + "model_count": 1 }, { - "id": "moark", - "display_name": "Moark", + "id": "deepseek", + "display_name": "DeepSeek", "npm": "@ai-sdk/openai-compatible", - "api": "https://moark.com/v1", - "doc": "https://moark.com/docs/openapi/v1#tag/%E6%96%87%E6%9C%AC%E7%94%9F%E6%88%90", + "api": "https://api.deepseek.com", + "doc": "https://api-docs.deepseek.com/quick_start/pricing", "env": [ - "MOARK_API_KEY" + "DEEPSEEK_API_KEY" ], - "model_count": 2 + "model_count": 4 }, { - "id": "frogbot", - "display_name": "FrogBot", + "id": "meta-llama", + "display_name": "Llama", "npm": "@ai-sdk/openai-compatible", - "api": "https://app.frogbot.ai/api/v1", - "doc": "https://docs.frogbot.ai", + "api": "https://api.llama.com/compat/v1/", + "doc": "https://llama.developer.meta.com/docs/models", "env": [ - "FROGBOT_API_KEY" + "LLAMA_API_KEY" ], - "model_count": 26 + "model_count": 7 }, { - "id": "wandb", - "display_name": "Weights & Biases", + "id": "fireworks-ai", + "display_name": "Fireworks AI", "npm": "@ai-sdk/openai-compatible", - "api": "https://api.inference.wandb.ai/v1", - "doc": "https://docs.wandb.ai/guides/integrations/inference/", + "api": "https://api.fireworks.ai/inference/v1/", + "doc": "https://fireworks.ai/docs/", "env": [ - "WANDB_API_KEY" + "FIREWORKS_API_KEY" ], - "model_count": 18 + "model_count": 19 }, { "id": "ambient", @@ -165,226 +154,203 @@ "model_count": 2 }, { - "id": "the-grid-ai", - "display_name": "The Grid AI", - "npm": "@ai-sdk/openai-compatible", - "api": "https://api.thegrid.ai/v1", - "doc": "https://thegrid.ai/docs", + "id": "kimi-for-coding", + "display_name": "Kimi For Coding", + "npm": "@ai-sdk/anthropic", + "api": "https://api.kimi.com/coding/v1", + "doc": "https://www.kimi.com/coding/docs/en/third-party-agents.html", "env": [ - "THEGRIDAI_API_KEY" + "KIMI_API_KEY" ], "model_count": 3 }, { - "id": "fastrouter", - "display_name": "FastRouter", + "id": "moark", + "display_name": "Moark", "npm": "@ai-sdk/openai-compatible", - "api": "https://go.fastrouter.ai/api/v1", - "doc": "https://fastrouter.ai/models", + "api": "https://moark.com/v1", + "doc": "https://moark.com/docs/openapi/v1#tag/%E6%96%87%E6%9C%AC%E7%94%9F%E6%88%90", "env": [ - "FASTROUTER_API_KEY" + "MOARK_API_KEY" ], - "model_count": 15 + "model_count": 2 }, { - "id": "tencent-coding-plan", - "display_name": "Tencent Coding Plan (China)", + "id": "opencode-go", + "display_name": "OpenCode Go", "npm": "@ai-sdk/openai-compatible", - "api": "https://api.lkeap.cloud.tencent.com/coding/v3", - "doc": "https://cloud.tencent.com/document/product/1772/128947", + "api": "https://opencode.ai/zen/go/v1", + "doc": "https://opencode.ai/docs/zen", "env": [ - "TENCENT_CODING_PLAN_API_KEY" + "OPENCODE_API_KEY" ], - "model_count": 8 + "model_count": 14 }, { - "id": "cortecs", - "display_name": "Cortecs", + "id": "databricks", + "display_name": "Databricks", "npm": "@ai-sdk/openai-compatible", - "api": "https://api.cortecs.ai/v1", - "doc": "https://api.cortecs.ai/v1/models", + "api": "https://${DATABRICKS_HOST}/ai-gateway/mlflow/v1", + "doc": "https://docs.databricks.com/aws/en/machine-learning/foundation-models/", "env": [ - "CORTECS_API_KEY" + "DATABRICKS_HOST", + "DATABRICKS_TOKEN" ], - "model_count": 49 + "model_count": 25 }, { - "id": "baseten", - "display_name": "Baseten", + "id": "io-net", + "display_name": "IO.NET", "npm": "@ai-sdk/openai-compatible", - "api": "https://inference.baseten.co/v1", - "doc": "https://docs.baseten.co/development/model-apis/overview", + "api": "https://api.intelligence.io.solutions/api/v1", + "doc": "https://io.net/docs/guides/intelligence/io-intelligence", "env": [ - "BASETEN_API_KEY" + "IOINTELLIGENCE_API_KEY" ], - "model_count": 14 + "model_count": 17 }, { - "id": "meta-llama", - "display_name": "Llama", + "id": "alibaba-cn", + "display_name": "Alibaba (China)", "npm": "@ai-sdk/openai-compatible", - "api": "https://api.llama.com/compat/v1/", - "doc": "https://llama.developer.meta.com/docs/models", + "api": "https://dashscope.aliyuncs.com/compatible-mode/v1", + "doc": "https://www.alibabacloud.com/help/en/model-studio/models", "env": [ - "LLAMA_API_KEY" + "DASHSCOPE_API_KEY" ], - "model_count": 7 + "model_count": 80 }, { - "id": "novita-ai", - "display_name": "NovitaAI", + "id": "firepass", + "display_name": "Fireworks (Firepass)", "npm": "@ai-sdk/openai-compatible", - "api": "https://api.novita.ai/openai", - "doc": "https://novita.ai/docs/guides/introduction", + "api": "https://api.fireworks.ai/inference/v1/", + "doc": "https://docs.fireworks.ai/firepass", "env": [ - "NOVITA_API_KEY" + "FIREPASS_API_KEY" ], - "model_count": 99 + "model_count": 1 }, { - "id": "digitalocean", - "display_name": "DigitalOcean", - "npm": "@ai-sdk/openai-compatible", - "api": "https://inference.do-ai.run/v1", - "doc": "https://docs.digitalocean.com/products/gradient-ai-platform/details/models/", + "id": "minimax-cn-coding-plan", + "display_name": "MiniMax Token Plan (minimaxi.com)", + "npm": "@ai-sdk/anthropic", + "api": "https://api.minimaxi.com/anthropic/v1", + "doc": "https://platform.minimaxi.com/docs/token-plan/intro", "env": [ - "DIGITALOCEAN_ACCESS_TOKEN" + "MINIMAX_API_KEY" ], - "model_count": 76 + "model_count": 6 }, { - "id": "moonshotai", - "display_name": "Moonshot AI", + "id": "jiekou", + "display_name": "Jiekou.AI", "npm": "@ai-sdk/openai-compatible", - "api": "https://api.moonshot.ai/v1", - "doc": "https://platform.moonshot.ai/docs/api/chat", + "api": "https://api.jiekou.ai/openai", + "doc": "https://docs.jiekou.ai/docs/support/quickstart?utm_source=github_models.dev", "env": [ - "MOONSHOT_API_KEY" + "JIEKOU_API_KEY" ], - "model_count": 7 + "model_count": 61 }, { - "id": "kilo", - "display_name": "Kilo Gateway", + "id": "bailing", + "display_name": "Bailing", "npm": "@ai-sdk/openai-compatible", - "api": "https://api.kilo.ai/api/gateway", - "doc": "https://kilo.ai", + "api": "https://api.tbox.cn/api/llm/v1/chat/completions", + "doc": "https://alipaytbox.yuque.com/sxs0ba/ling/intro", "env": [ - "KILO_API_KEY" + "BAILING_API_TOKEN" ], - "model_count": 357 + "model_count": 2 }, { - "id": "cloudflare-workers-ai", - "display_name": "Cloudflare Workers AI", + "id": "iflowcn", + "display_name": "iFlow", "npm": "@ai-sdk/openai-compatible", - "api": "https://api.cloudflare.com/client/v4/accounts/${CLOUDFLARE_ACCOUNT_ID}/ai/v1", - "doc": "https://developers.cloudflare.com/workers-ai/models/", + "api": "https://apis.iflow.cn/v1", + "doc": "https://platform.iflow.cn/en/docs", "env": [ - "CLOUDFLARE_ACCOUNT_ID", - "CLOUDFLARE_API_KEY" + "IFLOW_API_KEY" ], - "model_count": 8 + "model_count": 14 }, { - "id": "lmstudio", - "display_name": "LMStudio", + "id": "huggingface", + "display_name": "Hugging Face", "npm": "@ai-sdk/openai-compatible", - "api": "http://127.0.0.1:1234/v1", - "doc": "https://lmstudio.ai/models", + "api": "https://router.huggingface.co/v1", + "doc": "https://huggingface.co/docs/inference-providers", "env": [ - "LMSTUDIO_API_KEY" + "HF_TOKEN" ], - "model_count": 3 + "model_count": 24 }, { - "id": "xiaomi-token-plan-cn", - "display_name": "Xiaomi Token Plan (China)", + "id": "zenmux", + "display_name": "ZenMux", "npm": "@ai-sdk/openai-compatible", - "api": "https://token-plan-cn.xiaomimimo.com/v1", - "doc": "https://platform.xiaomimimo.com/#/docs", + "api": "https://zenmux.ai/api/v1", + "doc": "https://docs.zenmux.ai", "env": [ - "XIAOMI_API_KEY" + "ZENMUX_API_KEY" ], - "model_count": 6 + "model_count": 96 }, { - "id": "morph", - "display_name": "Morph", + "id": "upstage", + "display_name": "Upstage", "npm": "@ai-sdk/openai-compatible", - "api": "https://api.morphllm.com/v1", - "doc": "https://docs.morphllm.com/api-reference/introduction", + "api": "https://api.upstage.ai/v1/solar", + "doc": "https://developers.upstage.ai/docs/apis/chat", "env": [ - "MORPH_API_KEY" + "UPSTAGE_API_KEY" ], "model_count": 3 }, { - "id": "nearai", - "display_name": "NEAR AI Cloud", - "npm": "@ai-sdk/openai-compatible", - "api": "https://cloud-api.near.ai/v1", - "doc": "https://docs.near.ai/", - "env": [ - "NEARAI_API_KEY" - ], - "model_count": 33 - }, - { - "id": "abacus", - "display_name": "Abacus", + "id": "novita-ai", + "display_name": "NovitaAI", "npm": "@ai-sdk/openai-compatible", - "api": "https://routellm.abacus.ai/v1", - "doc": "https://abacus.ai/help/api", + "api": "https://api.novita.ai/openai", + "doc": "https://novita.ai/docs/guides/introduction", "env": [ - "ABACUS_API_KEY" + "NOVITA_API_KEY" ], - "model_count": 65 + "model_count": 99 }, { - "id": "privatemode-ai", - "display_name": "Privatemode AI", + "id": "xiaomi-token-plan-cn", + "display_name": "Xiaomi Token Plan (China)", "npm": "@ai-sdk/openai-compatible", - "api": "http://localhost:8080/v1", - "doc": "https://docs.privatemode.ai/api/overview", - "env": [ - "PRIVATEMODE_API_KEY", - "PRIVATEMODE_ENDPOINT" - ], - "model_count": 5 - }, - { - "id": "minimax-cn-coding-plan", - "display_name": "MiniMax Coding Plan (minimaxi.com)", - "npm": "@ai-sdk/anthropic", - "api": "https://api.minimaxi.com/anthropic/v1", - "doc": "https://platform.minimaxi.com/docs/coding-plan/intro", + "api": "https://token-plan-cn.xiaomimimo.com/v1", + "doc": "https://platform.xiaomimimo.com/#/docs", "env": [ - "MINIMAX_API_KEY" + "XIAOMI_API_KEY" ], "model_count": 6 }, { - "id": "xiaomi-token-plan-ams", - "display_name": "Xiaomi Token Plan (Europe)", + "id": "wandb", + "display_name": "Weights & Biases", "npm": "@ai-sdk/openai-compatible", - "api": "https://token-plan-ams.xiaomimimo.com/v1", - "doc": "https://platform.xiaomimimo.com/#/docs", + "api": "https://api.inference.wandb.ai/v1", + "doc": "https://docs.wandb.ai/guides/integrations/inference/", "env": [ - "XIAOMI_API_KEY" + "WANDB_API_KEY" ], - "model_count": 6 + "model_count": 18 }, { - "id": "cloudferro-sherlock", - "display_name": "CloudFerro Sherlock", + "id": "chutes", + "display_name": "Chutes", "npm": "@ai-sdk/openai-compatible", - "api": "https://api-sherlock.cloudferro.com/openai/v1/", - "doc": "https://docs.sherlock.cloudferro.com/", + "api": "https://llm.chutes.ai/v1", + "doc": "https://llm.chutes.ai/v1/models", "env": [ - "CLOUDFERRO_SHERLOCK_API_KEY" + "CHUTES_API_KEY" ], - "model_count": 5 + "model_count": 39 }, { "id": "dinference", @@ -409,225 +375,246 @@ "model_count": 13 }, { - "id": "vultr", - "display_name": "Vultr", + "id": "qiniu-ai", + "display_name": "Qiniu", "npm": "@ai-sdk/openai-compatible", - "api": "https://api.vultrinference.com/v1", - "doc": "https://api.vultrinference.com/", + "api": "https://api.qnaigc.com/v1", + "doc": "https://developer.qiniu.com/aitokenapi", "env": [ - "VULTR_API_KEY" + "QINIU_API_KEY" ], - "model_count": 5 + "model_count": 91 }, { - "id": "kuae-cloud-coding-plan", - "display_name": "KUAE Cloud Coding Plan", + "id": "kilo", + "display_name": "Kilo Gateway", "npm": "@ai-sdk/openai-compatible", - "api": "https://coding-plan-endpoint.kuaecloud.net/v1", - "doc": "https://docs.mthreads.com/kuaecloud/kuaecloud-doc-online/coding_plan/", + "api": "https://api.kilo.ai/api/gateway", + "doc": "https://kilo.ai", "env": [ - "KUAE_API_KEY" + "KILO_API_KEY" ], - "model_count": 1 + "model_count": 357 }, { - "id": "modelscope", - "display_name": "ModelScope", + "id": "auriko", + "display_name": "Auriko", "npm": "@ai-sdk/openai-compatible", - "api": "https://api-inference.modelscope.cn/v1", - "doc": "https://modelscope.cn/docs/model-service/API-Inference/intro", + "api": "https://api.auriko.ai/v1", + "doc": "https://docs.auriko.ai", "env": [ - "MODELSCOPE_API_KEY" + "AURIKO_API_KEY" ], - "model_count": 7 + "model_count": 15 }, { - "id": "kimi-for-coding", - "display_name": "Kimi For Coding", - "npm": "@ai-sdk/anthropic", - "api": "https://api.kimi.com/coding/v1", - "doc": "https://www.kimi.com/coding/docs/en/third-party-agents.html", + "id": "morph", + "display_name": "Morph", + "npm": "@ai-sdk/openai-compatible", + "api": "https://api.morphllm.com/v1", + "doc": "https://docs.morphllm.com/api-reference/introduction", "env": [ - "KIMI_API_KEY" + "MORPH_API_KEY" ], "model_count": 3 }, { - "id": "lucidquery", - "display_name": "LucidQuery AI", + "id": "github-copilot", + "display_name": "GitHub Copilot", "npm": "@ai-sdk/openai-compatible", - "api": "https://lucidquery.com/api/v1", - "doc": "https://lucidquery.com/api/docs", + "api": "https://api.githubcopilot.com", + "doc": "https://docs.github.com/en/copilot", "env": [ - "LUCIDQUERY_API_KEY" + "GITHUB_TOKEN" ], - "model_count": 2 + "model_count": 27 }, { - "id": "neuralwatt", - "display_name": "Neuralwatt", + "id": "mixlayer", + "display_name": "Mixlayer", "npm": "@ai-sdk/openai-compatible", - "api": "https://api.neuralwatt.com/v1", - "doc": "https://portal.neuralwatt.com/docs", + "api": "https://models.mixlayer.ai/v1", + "doc": "https://docs.mixlayer.com", "env": [ - "NEURALWATT_API_KEY" + "MIXLAYER_API_KEY" ], - "model_count": 14 + "model_count": 5 }, { - "id": "jiekou", - "display_name": "Jiekou.AI", + "id": "xiaomi-token-plan-sgp", + "display_name": "Xiaomi Token Plan (Singapore)", "npm": "@ai-sdk/openai-compatible", - "api": "https://api.jiekou.ai/openai", - "doc": "https://docs.jiekou.ai/docs/support/quickstart?utm_source=github_models.dev", + "api": "https://token-plan-sgp.xiaomimimo.com/v1", + "doc": "https://platform.xiaomimimo.com/#/docs", "env": [ - "JIEKOU_API_KEY" + "XIAOMI_API_KEY" ], - "model_count": 61 + "model_count": 6 }, { - "id": "ovhcloud", - "display_name": "OVHcloud AI Endpoints", + "id": "zai", + "display_name": "Z.AI", "npm": "@ai-sdk/openai-compatible", - "api": "https://oai.endpoints.kepler.ai.cloud.ovh.net/v1", - "doc": "https://www.ovhcloud.com/en/public-cloud/ai-endpoints/catalog//", + "api": "https://api.z.ai/api/paas/v4", + "doc": "https://docs.z.ai/guides/overview/pricing", "env": [ - "OVHCLOUD_API_KEY" + "ZHIPU_API_KEY" ], - "model_count": 11 + "model_count": 13 }, { - "id": "friendli", - "display_name": "Friendli", + "id": "opencode", + "display_name": "OpenCode Zen", "npm": "@ai-sdk/openai-compatible", - "api": "https://api.friendli.ai/serverless/v1", - "doc": "https://friendli.ai/docs/guides/serverless_endpoints/introduction", + "api": "https://opencode.ai/zen/v1", + "doc": "https://opencode.ai/docs/zen", "env": [ - "FRIENDLI_TOKEN" + "OPENCODE_API_KEY" ], - "model_count": 6 + "model_count": 60 }, { - "id": "regolo-ai", - "display_name": "Regolo AI", + "id": "stepfun", + "display_name": "StepFun", "npm": "@ai-sdk/openai-compatible", - "api": "https://api.regolo.ai/v1", - "doc": "https://docs.regolo.ai/", + "api": "https://api.stepfun.com/v1", + "doc": "https://platform.stepfun.com/docs/zh/overview/concept", "env": [ - "REGOLO_API_KEY" + "STEPFUN_API_KEY" ], - "model_count": 13 + "model_count": 4 }, { - "id": "claudinio", - "display_name": "Claudinio", + "id": "nebius", + "display_name": "Nebius Token Factory", "npm": "@ai-sdk/openai-compatible", - "api": "https://api.claudin.io/v1", - "doc": "https://claudin.io", + "api": "https://api.tokenfactory.nebius.com/v1", + "doc": "https://docs.tokenfactory.nebius.com/", "env": [ - "CLAUDINIO_API_KEY" + "NEBIUS_API_KEY" ], - "model_count": 1 + "model_count": 31 }, { - "id": "opencode-go", - "display_name": "OpenCode Go", + "id": "poe", + "display_name": "Poe", "npm": "@ai-sdk/openai-compatible", - "api": "https://opencode.ai/zen/go/v1", - "doc": "https://opencode.ai/docs/zen", + "api": "https://api.poe.com/v1", + "doc": "https://creator.poe.com/docs/external-applications/openai-compatible-api", "env": [ - "OPENCODE_API_KEY" + "POE_API_KEY" ], - "model_count": 14 + "model_count": 135 }, { - "id": "llmgateway", - "display_name": "LLM Gateway", + "id": "helicone", + "display_name": "Helicone", "npm": "@ai-sdk/openai-compatible", - "api": "https://api.llmgateway.io/v1", - "doc": "https://llmgateway.io/docs", + "api": "https://ai-gateway.helicone.ai/v1", + "doc": "https://helicone.ai/models", "env": [ - "LLMGATEWAY_API_KEY" + "HELICONE_API_KEY" ], - "model_count": 196 + "model_count": 90 }, { - "id": "poe", - "display_name": "Poe", + "id": "ollama-cloud", + "display_name": "Ollama Cloud", "npm": "@ai-sdk/openai-compatible", - "api": "https://api.poe.com/v1", - "doc": "https://creator.poe.com/docs/external-applications/openai-compatible-api", + "api": "https://ollama.com/v1", + "doc": "https://docs.ollama.com/cloud", "env": [ - "POE_API_KEY" + "OLLAMA_API_KEY" ], - "model_count": 135 + "model_count": 39 }, { - "id": "minimax", - "display_name": "MiniMax (minimax.io)", - "npm": "@ai-sdk/anthropic", - "api": "https://api.minimax.io/anthropic/v1", - "doc": "https://platform.minimax.io/docs/guides/quickstart", + "id": "zai-coding-plan", + "display_name": "Z.AI Coding Plan", + "npm": "@ai-sdk/openai-compatible", + "api": "https://api.z.ai/api/coding/paas/v4", + "doc": "https://docs.z.ai/devpack/overview", "env": [ - "MINIMAX_API_KEY" + "ZHIPU_API_KEY" ], - "model_count": 6 + "model_count": 5 }, { - "id": "xiaomi-token-plan-sgp", - "display_name": "Xiaomi Token Plan (Singapore)", + "id": "the-grid-ai", + "display_name": "The Grid AI", "npm": "@ai-sdk/openai-compatible", - "api": "https://token-plan-sgp.xiaomimimo.com/v1", - "doc": "https://platform.xiaomimimo.com/#/docs", + "api": "https://api.thegrid.ai/v1", + "doc": "https://thegrid.ai/docs", "env": [ - "XIAOMI_API_KEY" + "THEGRIDAI_API_KEY" ], - "model_count": 6 + "model_count": 3 }, { - "id": "siliconflow", - "display_name": "SiliconFlow", + "id": "baseten", + "display_name": "Baseten", "npm": "@ai-sdk/openai-compatible", - "api": "https://api.siliconflow.com/v1", - "doc": "https://cloud.siliconflow.com/models", + "api": "https://inference.baseten.co/v1", + "doc": "https://docs.baseten.co/development/model-apis/overview", "env": [ - "SILICONFLOW_API_KEY" + "BASETEN_API_KEY" ], - "model_count": 76 + "model_count": 14 }, { - "id": "ollama-cloud", - "display_name": "Ollama Cloud", + "id": "frogbot", + "display_name": "FrogBot", "npm": "@ai-sdk/openai-compatible", - "api": "https://ollama.com/v1", - "doc": "https://docs.ollama.com/cloud", + "api": "https://app.frogbot.ai/api/v1", + "doc": "https://docs.frogbot.ai", "env": [ - "OLLAMA_API_KEY" + "FROGBOT_API_KEY" ], - "model_count": 39 + "model_count": 26 }, { - "id": "databricks", - "display_name": "Databricks", + "id": "zhipuai-coding-plan", + "display_name": "Zhipu AI Coding Plan", "npm": "@ai-sdk/openai-compatible", - "api": "https://${DATABRICKS_HOST}/ai-gateway/mlflow/v1", - "doc": "https://docs.databricks.com/aws/en/machine-learning/foundation-models/", + "api": "https://open.bigmodel.cn/api/coding/paas/v4", + "doc": "https://docs.bigmodel.cn/cn/coding-plan/overview", "env": [ - "DATABRICKS_HOST", - "DATABRICKS_TOKEN" + "ZHIPU_API_KEY" ], - "model_count": 25 + "model_count": 5 }, { - "id": "berget", - "display_name": "Berget.AI", + "id": "alibaba-coding-plan", + "display_name": "Alibaba Coding Plan", "npm": "@ai-sdk/openai-compatible", - "api": "https://api.berget.ai/v1", - "doc": "https://api.berget.ai", + "api": "https://coding-intl.dashscope.aliyuncs.com/v1", + "doc": "https://www.alibabacloud.com/help/en/model-studio/coding-plan", "env": [ - "BERGET_API_KEY" + "ALIBABA_CODING_PLAN_API_KEY" ], - "model_count": 6 + "model_count": 9 + }, + { + "id": "lmstudio", + "display_name": "LMStudio", + "npm": "@ai-sdk/openai-compatible", + "api": "http://127.0.0.1:1234/v1", + "doc": "https://lmstudio.ai/models", + "env": [ + "LMSTUDIO_API_KEY" + ], + "model_count": 3 + }, + { + "id": "lucidquery", + "display_name": "LucidQuery AI", + "npm": "@ai-sdk/openai-compatible", + "api": "https://lucidquery.com/api/v1", + "doc": "https://lucidquery.com/api/docs", + "env": [ + "LUCIDQUERY_API_KEY" + ], + "model_count": 2 }, { "id": "moonshotai-cn", @@ -641,235 +628,280 @@ "model_count": 7 }, { - "id": "alibaba-coding-plan-cn", - "display_name": "Alibaba Coding Plan (China)", + "id": "gmicloud", + "display_name": "GMI Cloud", "npm": "@ai-sdk/openai-compatible", - "api": "https://coding.dashscope.aliyuncs.com/v1", - "doc": "https://help.aliyun.com/zh/model-studio/coding-plan", + "api": "https://api.gmi-serving.com/v1", + "doc": "https://docs.gmicloud.ai/inference-engine/api-reference/llm-api-reference", "env": [ - "ALIBABA_CODING_PLAN_API_KEY" + "GMICLOUD_API_KEY" ], - "model_count": 9 + "model_count": 8 }, { - "id": "minimax-cn", - "display_name": "MiniMax (minimaxi.com)", - "npm": "@ai-sdk/anthropic", - "api": "https://api.minimaxi.com/anthropic/v1", - "doc": "https://platform.minimaxi.com/docs/guides/quickstart", + "id": "abliteration-ai", + "display_name": "abliteration.ai", + "npm": "@ai-sdk/openai-compatible", + "api": "https://api.abliteration.ai/v1", + "doc": "https://docs.abliteration.ai/models", "env": [ - "MINIMAX_API_KEY" + "ABLIT_KEY" ], - "model_count": 6 + "model_count": 1 }, { - "id": "chutes", - "display_name": "Chutes", + "id": "wafer.ai", + "display_name": "Wafer", "npm": "@ai-sdk/openai-compatible", - "api": "https://llm.chutes.ai/v1", - "doc": "https://llm.chutes.ai/v1/models", + "api": "https://pass.wafer.ai/v1", + "doc": "https://docs.wafer.ai/wafer-pass", "env": [ - "CHUTES_API_KEY" + "WAFER_API_KEY" ], - "model_count": 39 + "model_count": 2 }, { - "id": "siliconflow-cn", - "display_name": "SiliconFlow (China)", + "id": "xpersona", + "display_name": "Xpersona", "npm": "@ai-sdk/openai-compatible", - "api": "https://api.siliconflow.cn/v1", - "doc": "https://cloud.siliconflow.com/models", + "api": "https://xpersona.co/v1", + "doc": "https://xpersona.co/docs", "env": [ - "SILICONFLOW_CN_API_KEY" + "XPERSONA_API_KEY" ], - "model_count": 81 + "model_count": 1 }, { - "id": "nvidia", - "display_name": "Nvidia", + "id": "cloudferro-sherlock", + "display_name": "CloudFerro Sherlock", "npm": "@ai-sdk/openai-compatible", - "api": "https://integrate.api.nvidia.com/v1", - "doc": "https://docs.api.nvidia.com/nim/", + "api": "https://api-sherlock.cloudferro.com/openai/v1/", + "doc": "https://docs.sherlock.cloudferro.com/", "env": [ - "NVIDIA_API_KEY" + "CLOUDFERRO_SHERLOCK_API_KEY" ], - "model_count": 92 + "model_count": 5 }, { - "id": "zhipuai-coding-plan", - "display_name": "Zhipu AI Coding Plan", + "id": "kuae-cloud-coding-plan", + "display_name": "KUAE Cloud Coding Plan", "npm": "@ai-sdk/openai-compatible", - "api": "https://open.bigmodel.cn/api/coding/paas/v4", - "doc": "https://docs.bigmodel.cn/cn/coding-plan/overview", + "api": "https://coding-plan-endpoint.kuaecloud.net/v1", + "doc": "https://docs.mthreads.com/kuaecloud/kuaecloud-doc-online/coding_plan/", "env": [ - "ZHIPU_API_KEY" + "KUAE_API_KEY" ], - "model_count": 5 + "model_count": 1 }, { - "id": "github-models", - "display_name": "GitHub Models", + "id": "meganova", + "display_name": "Meganova", "npm": "@ai-sdk/openai-compatible", - "api": "https://models.github.ai/inference", - "doc": "https://docs.github.com/en/github-models", + "api": "https://api.meganova.ai/v1", + "doc": "https://docs.meganova.ai", "env": [ - "GITHUB_TOKEN" + "MEGANOVA_API_KEY" ], - "model_count": 55 + "model_count": 19 }, { - "id": "qiniu-ai", - "display_name": "Qiniu", + "id": "evroc", + "display_name": "evroc", "npm": "@ai-sdk/openai-compatible", - "api": "https://api.qnaigc.com/v1", - "doc": "https://developer.qiniu.com/aitokenapi", + "api": "https://models.think.evroc.com/v1", + "doc": "https://docs.evroc.com/products/think/overview.html", "env": [ - "QINIU_API_KEY" + "EVROC_API_KEY" ], - "model_count": 91 + "model_count": 13 }, { - "id": "scaleway", - "display_name": "Scaleway", + "id": "nearai", + "display_name": "NEAR AI Cloud", "npm": "@ai-sdk/openai-compatible", - "api": "https://api.scaleway.ai/v1", - "doc": "https://www.scaleway.com/en/docs/generative-apis/", + "api": "https://cloud-api.near.ai/v1", + "doc": "https://docs.near.ai/", "env": [ - "SCALEWAY_API_KEY" + "NEARAI_API_KEY" ], - "model_count": 16 + "model_count": 33 }, { - "id": "opencode", - "display_name": "OpenCode Zen", + "id": "synthetic", + "display_name": "Synthetic", "npm": "@ai-sdk/openai-compatible", - "api": "https://opencode.ai/zen/v1", - "doc": "https://opencode.ai/docs/zen", + "api": "https://api.synthetic.new/openai/v1", + "doc": "https://synthetic.new/pricing", "env": [ - "OPENCODE_API_KEY" + "SYNTHETIC_API_KEY" ], - "model_count": 60 + "model_count": 33 }, { - "id": "mixlayer", - "display_name": "Mixlayer", + "id": "nvidia", + "display_name": "Nvidia", "npm": "@ai-sdk/openai-compatible", - "api": "https://models.mixlayer.ai/v1", - "doc": "https://docs.mixlayer.com", + "api": "https://integrate.api.nvidia.com/v1", + "doc": "https://docs.api.nvidia.com/nim/", "env": [ - "MIXLAYER_API_KEY" + "NVIDIA_API_KEY" ], - "model_count": 5 + "model_count": 92 }, { - "id": "zenmux", - "display_name": "ZenMux", + "id": "inference", + "display_name": "Inference", "npm": "@ai-sdk/openai-compatible", - "api": "https://zenmux.ai/api/v1", - "doc": "https://docs.zenmux.ai", + "api": "https://inference.net/v1", + "doc": "https://inference.net/models", "env": [ - "ZENMUX_API_KEY" + "INFERENCE_API_KEY" ], - "model_count": 96 + "model_count": 9 }, { - "id": "perplexity-agent", - "display_name": "Perplexity Agent", - "npm": "@ai-sdk/openai", - "api": "https://api.perplexity.ai/v1", - "doc": "https://docs.perplexity.ai/docs/agent-api/models", + "id": "inception", + "display_name": "Inception", + "npm": "@ai-sdk/openai-compatible", + "api": "https://api.inceptionlabs.ai/v1/", + "doc": "https://platform.inceptionlabs.ai/docs", "env": [ - "PERPLEXITY_API_KEY" + "INCEPTION_API_KEY" ], - "model_count": 18 + "model_count": 2 }, { - "id": "alibaba-coding-plan", - "display_name": "Alibaba Coding Plan", + "id": "requesty", + "display_name": "Requesty", "npm": "@ai-sdk/openai-compatible", - "api": "https://coding-intl.dashscope.aliyuncs.com/v1", - "doc": "https://www.alibabacloud.com/help/en/model-studio/coding-plan", + "api": "https://router.requesty.ai/v1", + "doc": "https://requesty.ai/solution/llm-routing/models", + "env": [ + "REQUESTY_API_KEY" + ], + "model_count": 38 + }, + { + "id": "digitalocean", + "display_name": "DigitalOcean", + "npm": "@ai-sdk/openai-compatible", + "api": "https://inference.do-ai.run/v1", + "doc": "https://docs.digitalocean.com/products/gradient-ai-platform/details/models/", + "env": [ + "DIGITALOCEAN_ACCESS_TOKEN" + ], + "model_count": 76 + }, + { + "id": "vultr", + "display_name": "Vultr", + "npm": "@ai-sdk/openai-compatible", + "api": "https://api.vultrinference.com/v1", + "doc": "https://api.vultrinference.com/", + "env": [ + "VULTR_API_KEY" + ], + "model_count": 5 + }, + { + "id": "alibaba-coding-plan-cn", + "display_name": "Alibaba Coding Plan (China)", + "npm": "@ai-sdk/openai-compatible", + "api": "https://coding.dashscope.aliyuncs.com/v1", + "doc": "https://help.aliyun.com/zh/model-studio/coding-plan", "env": [ "ALIBABA_CODING_PLAN_API_KEY" ], "model_count": 9 }, { - "id": "meganova", - "display_name": "Meganova", + "id": "ovhcloud", + "display_name": "OVHcloud AI Endpoints", "npm": "@ai-sdk/openai-compatible", - "api": "https://api.meganova.ai/v1", - "doc": "https://docs.meganova.ai", + "api": "https://oai.endpoints.kepler.ai.cloud.ovh.net/v1", + "doc": "https://www.ovhcloud.com/en/public-cloud/ai-endpoints/catalog//", "env": [ - "MEGANOVA_API_KEY" + "OVHCLOUD_API_KEY" ], - "model_count": 19 + "model_count": 11 }, { - "id": "synthetic", - "display_name": "Synthetic", + "id": "friendli", + "display_name": "Friendli", "npm": "@ai-sdk/openai-compatible", - "api": "https://api.synthetic.new/openai/v1", - "doc": "https://synthetic.new/pricing", + "api": "https://api.friendli.ai/serverless/v1", + "doc": "https://friendli.ai/docs/guides/serverless_endpoints/introduction", "env": [ - "SYNTHETIC_API_KEY" + "FRIENDLI_TOKEN" ], - "model_count": 33 + "model_count": 6 }, { - "id": "minimax-coding-plan", - "display_name": "MiniMax Coding Plan (minimax.io)", - "npm": "@ai-sdk/anthropic", - "api": "https://api.minimax.io/anthropic/v1", - "doc": "https://platform.minimax.io/docs/coding-plan/intro", + "id": "cortecs", + "display_name": "Cortecs", + "npm": "@ai-sdk/openai-compatible", + "api": "https://api.cortecs.ai/v1", + "doc": "https://api.cortecs.ai/v1/models", "env": [ - "MINIMAX_API_KEY" + "CORTECS_API_KEY" ], - "model_count": 6 + "model_count": 49 }, { - "id": "upstage", - "display_name": "Upstage", + "id": "siliconflow", + "display_name": "SiliconFlow", "npm": "@ai-sdk/openai-compatible", - "api": "https://api.upstage.ai/v1/solar", - "doc": "https://developers.upstage.ai/docs/apis/chat", + "api": "https://api.siliconflow.com/v1", + "doc": "https://cloud.siliconflow.com/models", "env": [ - "UPSTAGE_API_KEY" + "SILICONFLOW_API_KEY" ], - "model_count": 3 + "model_count": 76 }, { - "id": "abliteration-ai", - "display_name": "abliteration.ai", + "id": "minimax", + "display_name": "MiniMax (minimax.io)", + "npm": "@ai-sdk/anthropic", + "api": "https://api.minimax.io/anthropic/v1", + "doc": "https://platform.minimax.io/docs/guides/quickstart", + "env": [ + "MINIMAX_API_KEY" + ], + "model_count": 6 + }, + { + "id": "llmgateway", + "display_name": "LLM Gateway", "npm": "@ai-sdk/openai-compatible", - "api": "https://api.abliteration.ai/v1", - "doc": "https://docs.abliteration.ai/models", + "api": "https://api.llmgateway.io/v1", + "doc": "https://llmgateway.io/docs", "env": [ - "ABLIT_KEY" + "LLMGATEWAY_API_KEY" ], - "model_count": 1 + "model_count": 196 }, { - "id": "deepseek", - "display_name": "DeepSeek", + "id": "cloudflare-workers-ai", + "display_name": "Cloudflare Workers AI", "npm": "@ai-sdk/openai-compatible", - "api": "https://api.deepseek.com", - "doc": "https://api-docs.deepseek.com/quick_start/pricing", + "api": "https://api.cloudflare.com/client/v4/accounts/${CLOUDFLARE_ACCOUNT_ID}/ai/v1", + "doc": "https://developers.cloudflare.com/workers-ai/models/", "env": [ - "DEEPSEEK_API_KEY" + "CLOUDFLARE_ACCOUNT_ID", + "CLOUDFLARE_API_KEY" ], - "model_count": 4 + "model_count": 8 }, { - "id": "iflowcn", - "display_name": "iFlow", + "id": "fastrouter", + "display_name": "FastRouter", "npm": "@ai-sdk/openai-compatible", - "api": "https://apis.iflow.cn/v1", - "doc": "https://platform.iflow.cn/en/docs", + "api": "https://go.fastrouter.ai/api/v1", + "doc": "https://fastrouter.ai/models", "env": [ - "IFLOW_API_KEY" + "FASTROUTER_API_KEY" ], - "model_count": 14 + "model_count": 15 }, { "id": "stackit", @@ -883,92 +915,82 @@ "model_count": 8 }, { - "id": "wafer.ai", - "display_name": "Wafer", - "npm": "@ai-sdk/openai-compatible", - "api": "https://pass.wafer.ai/v1", - "doc": "https://docs.wafer.ai/wafer-pass", - "env": [ - "WAFER_API_KEY" - ], - "model_count": 2 - }, - { - "id": "evroc", - "display_name": "evroc", + "id": "tencent-coding-plan", + "display_name": "Tencent Coding Plan (China)", "npm": "@ai-sdk/openai-compatible", - "api": "https://models.think.evroc.com/v1", - "doc": "https://docs.evroc.com/products/think/overview.html", + "api": "https://api.lkeap.cloud.tencent.com/coding/v3", + "doc": "https://cloud.tencent.com/document/product/1772/128947", "env": [ - "EVROC_API_KEY" + "TENCENT_CODING_PLAN_API_KEY" ], - "model_count": 13 + "model_count": 8 }, { - "id": "nova", - "display_name": "Nova", + "id": "privatemode-ai", + "display_name": "Privatemode AI", "npm": "@ai-sdk/openai-compatible", - "api": "https://api.nova.amazon.com/v1", - "doc": "https://nova.amazon.com/dev/documentation", + "api": "http://localhost:8080/v1", + "doc": "https://docs.privatemode.ai/api/overview", "env": [ - "NOVA_API_KEY" + "PRIVATEMODE_API_KEY", + "PRIVATEMODE_ENDPOINT" ], - "model_count": 2 + "model_count": 5 }, { - "id": "fireworks-ai", - "display_name": "Fireworks AI", + "id": "drun", + "display_name": "D.Run (China)", "npm": "@ai-sdk/openai-compatible", - "api": "https://api.fireworks.ai/inference/v1/", - "doc": "https://fireworks.ai/docs/", + "api": "https://chat.d.run/v1", + "doc": "https://www.d.run", "env": [ - "FIREWORKS_API_KEY" + "DRUN_API_KEY" ], - "model_count": 19 + "model_count": 3 }, { - "id": "alibaba", - "display_name": "Alibaba", + "id": "moonshotai", + "display_name": "Moonshot AI", "npm": "@ai-sdk/openai-compatible", - "api": "https://dashscope-intl.aliyuncs.com/compatible-mode/v1", - "doc": "https://www.alibabacloud.com/help/en/model-studio/models", + "api": "https://api.moonshot.ai/v1", + "doc": "https://platform.moonshot.ai/docs/api/chat", "env": [ - "DASHSCOPE_API_KEY" + "MOONSHOT_API_KEY" ], - "model_count": 48 + "model_count": 7 }, { - "id": "302ai", - "display_name": "302.AI", + "id": "berget", + "display_name": "Berget.AI", "npm": "@ai-sdk/openai-compatible", - "api": "https://api.302.ai/v1", - "doc": "https://doc.302.ai", + "api": "https://api.berget.ai/v1", + "doc": "https://api.berget.ai", "env": [ - "302AI_API_KEY" + "BERGET_API_KEY" ], - "model_count": 97 + "model_count": 6 }, { - "id": "xpersona", - "display_name": "Xpersona", + "id": "github-models", + "display_name": "GitHub Models", "npm": "@ai-sdk/openai-compatible", - "api": "https://xpersona.co/v1", - "doc": "https://xpersona.co/docs", + "api": "https://models.github.ai/inference", + "doc": "https://docs.github.com/en/github-models", "env": [ - "XPERSONA_API_KEY" + "GITHUB_TOKEN" ], - "model_count": 1 + "model_count": 55 }, { - "id": "stepfun", - "display_name": "StepFun", + "id": "neuralwatt", + "display_name": "Neuralwatt", "npm": "@ai-sdk/openai-compatible", - "api": "https://api.stepfun.com/v1", - "doc": "https://platform.stepfun.com/docs/zh/overview/concept", + "api": "https://api.neuralwatt.com/v1", + "doc": "https://portal.neuralwatt.com/docs", "env": [ - "STEPFUN_API_KEY" + "NEURALWATT_API_KEY" ], - "model_count": 4 + "model_count": 14 }, { "id": "sarvam", @@ -981,28 +1003,6 @@ ], "model_count": 2 }, - { - "id": "zhipuai", - "display_name": "Zhipu AI", - "npm": "@ai-sdk/openai-compatible", - "api": "https://open.bigmodel.cn/api/paas/v4", - "doc": "https://docs.z.ai/guides/overview/pricing", - "env": [ - "ZHIPU_API_KEY" - ], - "model_count": 12 - }, - { - "id": "bailing", - "display_name": "Bailing", - "npm": "@ai-sdk/openai-compatible", - "api": "https://api.tbox.cn/api/llm/v1/chat/completions", - "doc": "https://alipaytbox.yuque.com/sxs0ba/ling/intro", - "env": [ - "BAILING_API_TOKEN" - ], - "model_count": 2 - }, { "id": "qihang-ai", "display_name": "QiHang", @@ -1014,39 +1014,6 @@ ], "model_count": 9 }, - { - "id": "alibaba-cn", - "display_name": "Alibaba (China)", - "npm": "@ai-sdk/openai-compatible", - "api": "https://dashscope.aliyuncs.com/compatible-mode/v1", - "doc": "https://www.alibabacloud.com/help/en/model-studio/models", - "env": [ - "DASHSCOPE_API_KEY" - ], - "model_count": 80 - }, - { - "id": "drun", - "display_name": "D.Run (China)", - "npm": "@ai-sdk/openai-compatible", - "api": "https://chat.d.run/v1", - "doc": "https://www.d.run", - "env": [ - "DRUN_API_KEY" - ], - "model_count": 3 - }, - { - "id": "huggingface", - "display_name": "Hugging Face", - "npm": "@ai-sdk/openai-compatible", - "api": "https://router.huggingface.co/v1", - "doc": "https://huggingface.co/docs/inference-providers", - "env": [ - "HF_TOKEN" - ], - "model_count": 24 - }, { "id": "tencent-tokenhub", "display_name": "Tencent TokenHub", @@ -1059,15 +1026,15 @@ "model_count": 1 }, { - "id": "nebius", - "display_name": "Nebius Token Factory", + "id": "modelscope", + "display_name": "ModelScope", "npm": "@ai-sdk/openai-compatible", - "api": "https://api.tokenfactory.nebius.com/v1", - "doc": "https://docs.tokenfactory.nebius.com/", + "api": "https://api-inference.modelscope.cn/v1", + "doc": "https://modelscope.cn/docs/model-service/API-Inference/intro", "env": [ - "NEBIUS_API_KEY" + "MODELSCOPE_API_KEY" ], - "model_count": 31 + "model_count": 7 }, { "id": "hpc-ai", @@ -1092,25 +1059,80 @@ "model_count": 5 }, { - "id": "github-copilot", - "display_name": "GitHub Copilot", + "id": "clarifai", + "display_name": "Clarifai", "npm": "@ai-sdk/openai-compatible", - "api": "https://api.githubcopilot.com", - "doc": "https://docs.github.com/en/copilot", + "api": "https://api.clarifai.com/v2/ext/openai/v1", + "doc": "https://docs.clarifai.com/compute/inference/", "env": [ - "GITHUB_TOKEN" + "CLARIFAI_PAT" ], - "model_count": 27 + "model_count": 12 }, { - "id": "inference", - "display_name": "Inference", + "id": "minimax-cn", + "display_name": "MiniMax (minimaxi.com)", + "npm": "@ai-sdk/anthropic", + "api": "https://api.minimaxi.com/anthropic/v1", + "doc": "https://platform.minimaxi.com/docs/guides/quickstart", + "env": [ + "MINIMAX_API_KEY" + ], + "model_count": 6 + }, + { + "id": "regolo-ai", + "display_name": "Regolo AI", "npm": "@ai-sdk/openai-compatible", - "api": "https://inference.net/v1", - "doc": "https://inference.net/models", + "api": "https://api.regolo.ai/v1", + "doc": "https://docs.regolo.ai/", "env": [ - "INFERENCE_API_KEY" + "REGOLO_API_KEY" ], - "model_count": 9 + "model_count": 13 + }, + { + "id": "xiaomi-token-plan-ams", + "display_name": "Xiaomi Token Plan (Europe)", + "npm": "@ai-sdk/openai-compatible", + "api": "https://token-plan-ams.xiaomimimo.com/v1", + "doc": "https://platform.xiaomimimo.com/#/docs", + "env": [ + "XIAOMI_API_KEY" + ], + "model_count": 6 + }, + { + "id": "zhipuai", + "display_name": "Zhipu AI", + "npm": "@ai-sdk/openai-compatible", + "api": "https://open.bigmodel.cn/api/paas/v4", + "doc": "https://docs.z.ai/guides/overview/pricing", + "env": [ + "ZHIPU_API_KEY" + ], + "model_count": 12 + }, + { + "id": "nova", + "display_name": "Nova", + "npm": "@ai-sdk/openai-compatible", + "api": "https://api.nova.amazon.com/v1", + "doc": "https://nova.amazon.com/dev/documentation", + "env": [ + "NOVA_API_KEY" + ], + "model_count": 2 + }, + { + "id": "atomic-chat", + "display_name": "Atomic Chat", + "npm": "@ai-sdk/openai-compatible", + "api": "http://127.0.0.1:1337/v1", + "doc": "https://atomic.chat", + "env": [ + "ATOMIC_CHAT_API_KEY" + ], + "model_count": 5 } ] \ No newline at end of file diff --git a/ui/desktop/openapi.json b/ui/desktop/openapi.json index 81cf91e2a554..ed287df3ef02 100644 --- a/ui/desktop/openapi.json +++ b/ui/desktop/openapi.json @@ -10,7 +10,7 @@ "license": { "name": "Apache-2.0" }, - "version": "1.34.1" + "version": "1.34.2" }, "paths": { "/action-required/tool-confirmation": { diff --git a/ui/desktop/package.json b/ui/desktop/package.json index 646348914d38..751ef8984428 100644 --- a/ui/desktop/package.json +++ b/ui/desktop/package.json @@ -1,7 +1,7 @@ { "name": "goose-app", "productName": "Goose", - "version": "1.34.1", + "version": "1.34.2", "description": "Goose App", "engines": { "node": "^24.10.0",