audit model field values against official docs

This commit is contained in:
2026-04-24 12:20:24 +08:00
parent ca99ea272f
commit c57cd4723d
114 changed files with 6550 additions and 368 deletions

View File

@@ -10,7 +10,10 @@
"enabled": false,
"status": "unconfigured",
"accessMode": "coding-plan",
"services": ["chat", "reasoning"],
"services": [
"chat",
"reasoning"
],
"codingPlan": {
"quotas": {},
"usageTracking": {
@@ -22,22 +25,45 @@
{
"modelName": "qwen3-coder-plus",
"displayName": "Qwen3 Coder Plus (Coding)",
"serviceType": ["chat"],
"description": "阿里云百炼 Coding PlanQwen3 编程增强版",
"contextWindow": 131072,
"maxOutputTokens": 16384,
"capabilities": ["chat", "reasoning", "code", "tool_use"],
"source": "preset"
"serviceType": [
"chat"
],
"description": "阿里云百炼 Coding PlanQwen3 编程增强版100万上下文",
"contextWindow": 1000000,
"maxOutputTokens": 65536,
"capabilities": [
"chat",
"reasoning",
"code",
"tool_use"
],
"source": "preset",
"inputPrice": 1,
"outputPrice": 5,
"defaultTemperature": 0.7
},
{
"modelName": "qwen3-max",
"modelName": "qwen3-max-2026-01-23",
"displayName": "Qwen3 Max (Coding)",
"serviceType": ["chat"],
"description": "阿里云百炼 Coding PlanQwen3 Max 旗舰模型",
"contextWindow": 131072,
"maxOutputTokens": 16384,
"capabilities": ["chat", "reasoning", "code", "multilingual", "tool_use", "long_context", "vision"],
"source": "preset"
"serviceType": [
"chat"
],
"description": "阿里云百炼 Coding PlanQwen3 Max 旗舰模型262K 上下文",
"contextWindow": 262144,
"maxOutputTokens": 65536,
"capabilities": [
"chat",
"reasoning",
"code",
"multilingual",
"tool_use",
"long_context",
"vision"
],
"source": "preset",
"inputPrice": 1.2,
"outputPrice": 6,
"defaultTemperature": 0.7
}
]
}

View File

@@ -27,6 +27,7 @@
"contextWindow": 128000,
"maxOutputTokens": 8192,
"capabilities": ["chat", "reasoning", "code", "multilingual"],
"defaultTemperature": 1,
"source": "preset"
}
]

View File

@@ -25,6 +25,9 @@
"serviceType": ["chat"],
"description": "快手 KwaiKAT Coding Plan编程辅助模型",
"capabilities": ["chat", "code"],
"contextWindow": 128000,
"maxOutputTokens": 8192,
"defaultTemperature": 1,
"source": "preset"
}
]

View File

@@ -2,7 +2,7 @@
"id": "provider-minimax-coding-001",
"provider": "minimax",
"brandGroup": "minimax",
"label": "MiniMax Coding Plan",
"label": "MiniMax Token Plan",
"baseUrl": "https://api.minimaxi.com/v1",
"apiFormat": "openai-completions",
"apiKeyRef": "",
@@ -10,25 +10,108 @@
"enabled": false,
"status": "unconfigured",
"accessMode": "coding-plan",
"services": ["chat", "reasoning"],
"services": [
"chat",
"reasoning",
"fast"
],
"codingPlan": {
"quotas": {},
"quotas": {
"textWindow": "5h",
"standard": {
"starterRequestsPer5h": 1500,
"plusRequestsPer5h": 4500,
"maxRequestsPer5h": 15000
},
"highspeed": {
"plusHighspeedRequestsPer5h": 4500,
"maxHighspeedRequestsPer5h": 15000,
"ultraHighspeedRequestsPer5h": 30000
}
},
"usageTracking": {
"method": "rest-api",
"endpoint": "https://api.minimaxi.com/v1/coding/usage",
"consoleUrl": "https://platform.minimaxi.com/"
"endpoint": "https://www.minimax.io/v1/token_plan/remains",
"consoleUrl": "https://www.minimax.io/user-center/token-plan"
}
},
"models": [
{
"modelName": "MiniMax-M1",
"displayName": "MiniMax-M1 (Coding)",
"serviceType": ["chat"],
"description": "MiniMax Coding PlanM1 旗舰模型",
"contextWindow": 1000000,
"modelName": "MiniMax-M2.7",
"displayName": "MiniMax-M2.7 (Token Plan)",
"serviceType": [
"chat"
],
"description": "MiniMax Token Plan 默认文本模型M2.7204,800 上下文,约 60 TPS 输出",
"contextWindow": 204800,
"maxOutputTokens": 131072,
"capabilities": ["chat", "reasoning", "code", "long_context"],
"source": "preset"
"capabilities": [
"chat",
"reasoning",
"code",
"tool_use",
"long_context"
],
"source": "preset",
"inputPrice": 0.3,
"outputPrice": 1.2,
"defaultTemperature": 1,
"defaultTopP": 1,
"extra": {
"billing": "token_plan_request_quota",
"cacheReadPrice": 0.06,
"cacheWritePrice": 0.375,
"outputSpeedTps": 60
}
},
{
"modelName": "MiniMax-M2.7-highspeed",
"displayName": "MiniMax-M2.7 高速版 (Token Plan)",
"serviceType": [
"fast"
],
"description": "MiniMax Token Plan 高速订阅支持模型M2.7-highspeed效果与 M2.7 一致但输出更快",
"contextWindow": 204800,
"maxOutputTokens": 131072,
"capabilities": [
"chat",
"reasoning",
"code",
"tool_use",
"long_context",
"fast"
],
"source": "preset",
"inputPrice": 0.6,
"outputPrice": 2.4,
"defaultTemperature": 1,
"defaultTopP": 1,
"extra": {
"billing": "token_plan_highspeed_request_quota",
"cacheReadPrice": 0.06,
"cacheWritePrice": 0.375,
"outputSpeedTps": 100
}
},
{
"modelName": "MiniMax-M2.5",
"displayName": "MiniMax-M2.5 (Coding)",
"serviceType": [
"chat"
],
"description": "MiniMax Coding PlanM2.5 模型204.8K 上下文",
"contextWindow": 204800,
"maxOutputTokens": 32768,
"capabilities": [
"chat",
"reasoning",
"code",
"long_context"
],
"source": "preset",
"inputPrice": 0.3,
"outputPrice": 1.2,
"defaultTemperature": 1
}
]
}

View File

@@ -10,24 +10,76 @@
"enabled": false,
"status": "unconfigured",
"accessMode": "coding-plan",
"services": ["chat", "reasoning"],
"services": [
"chat",
"reasoning"
],
"codingPlan": {
"quotas": {},
"quotas": {
"window": "5h",
"approxApiCallsPerWindow": "300-1200",
"maxConcurrency": 30
},
"usageTracking": {
"method": "none",
"consoleUrl": "https://platform.moonshot.cn/"
"consoleUrl": "https://www.kimi.com/code/console"
}
},
"models": [
{
"modelName": "kimi-k2",
"displayName": "Kimi K2 (Coding)",
"serviceType": ["chat"],
"description": "Kimi Code 套餐,万亿参数 MoE 模型128K 上下文",
"contextWindow": 128000,
"maxOutputTokens": 8192,
"capabilities": ["chat", "reasoning", "code", "tool_use", "agent", "long_context", "vision"],
"source": "preset"
"modelName": "kimi-for-coding",
"displayName": "Kimi for Coding",
"serviceType": [
"chat"
],
"description": "Kimi Code 会员权益模型,官方第三方 Coding Agent 推荐模型 IDKimi Code 平台按会员额度计费",
"contextWindow": 262144,
"maxOutputTokens": 32768,
"capabilities": [
"chat",
"reasoning",
"code",
"tool_use",
"agent",
"long_context",
"vision",
"video_understanding"
],
"source": "preset",
"defaultTemperature": 1,
"defaultTopP": 0.95,
"extra": {
"billing": "kimi_membership_quota",
"baseUrlNote": "Kimi Code API Key must use https://api.kimi.com/coding/v1",
"recommendedFor": [
"Kimi Code CLI",
"Claude Code",
"Roo Code"
]
}
},
{
"modelName": "kimi-k2.5",
"displayName": "Kimi K2.5 (Coding)",
"serviceType": [
"chat"
],
"description": "Kimi Code 套餐Kimi K2.5 模型256K 上下文",
"contextWindow": 256000,
"maxOutputTokens": 32768,
"capabilities": [
"chat",
"reasoning",
"code",
"tool_use",
"agent",
"long_context",
"vision"
],
"source": "preset",
"inputPrice": 0.58,
"outputPrice": 3.02,
"defaultTemperature": 1
}
]
}

View File

@@ -25,6 +25,9 @@
"serviceType": ["chat"],
"description": "摩尔线程 Coding Plan国产 GPU 推理",
"capabilities": ["chat", "code"],
"contextWindow": 128000,
"maxOutputTokens": 8192,
"defaultTemperature": 1,
"source": "preset"
}
]

View File

@@ -31,6 +31,9 @@
"serviceType": ["chat"],
"description": "自动路由最优编程模型Doubao-Seed-Code / GLM-4.7 / DeepSeek-V3.2 / Kimi-K2 等)",
"capabilities": ["code", "reasoning", "chat"],
"contextWindow": 256000,
"maxOutputTokens": 32000,
"defaultTemperature": 1,
"source": "preset"
}
]

View File

@@ -10,7 +10,10 @@
"enabled": false,
"status": "unconfigured",
"accessMode": "coding-plan",
"services": ["chat", "reasoning"],
"services": [
"chat",
"reasoning"
],
"codingPlan": {
"quotas": {},
"usageTracking": {
@@ -19,25 +22,117 @@
}
},
"models": [
{
"modelName": "glm-5.1",
"displayName": "GLM-5.1 (Coding)",
"serviceType": [
"chat"
],
"description": "GLM Coding Plan 全量套餐支持的 GLM-5.1面向复杂推理和大型工程任务204,800 上下文131,072 最大输出",
"contextWindow": 204800,
"maxOutputTokens": 131072,
"capabilities": [
"chat",
"reasoning",
"code",
"deep_thinking",
"long_context",
"tool_use",
"agent",
"math",
"multilingual"
],
"source": "preset",
"defaultTemperature": 1,
"defaultTopP": 0.95,
"extra": {
"quotaMultiplier": {
"peakHoursUtc8": "14:00-18:00",
"peak": 3,
"offPeak": 2,
"promotionalOffPeak": 1,
"promotionalOffPeakEndsAt": "2026-04-30"
}
}
},
{
"modelName": "glm-5-turbo",
"displayName": "GLM-5-Turbo (Coding)",
"serviceType": [
"chat"
],
"description": "GLM Coding Plan 支持的 GLM-5-Turbo面向 OpenClaw 等长链路任务优化204,800 上下文131,072 最大输出",
"contextWindow": 204800,
"maxOutputTokens": 131072,
"capabilities": [
"chat",
"reasoning",
"code",
"deep_thinking",
"long_context",
"tool_use",
"agent"
],
"source": "preset",
"defaultTemperature": 1,
"defaultTopP": 0.95,
"extra": {
"quotaMultiplier": {
"peakHoursUtc8": "14:00-18:00",
"peak": 3,
"offPeak": 2,
"promotionalOffPeak": 1,
"promotionalOffPeakEndsAt": "2026-04-30"
}
}
},
{
"modelName": "glm-5",
"displayName": "GLM-5 (Coding)",
"serviceType": ["chat"],
"description": "智谱 GLM-5 Coding Plan 版本745B MoE编程能力登顶",
"contextWindow": 192000,
"serviceType": [
"chat"
],
"description": "智谱 GLM-5 Coding Plan 版本202,752 token 上下文,编程能力登顶",
"contextWindow": 200000,
"maxOutputTokens": 128000,
"capabilities": ["chat", "reasoning", "code", "deep_thinking", "long_context", "tool_use", "agent", "math", "multilingual"],
"source": "preset"
"capabilities": [
"chat",
"reasoning",
"code",
"deep_thinking",
"long_context",
"tool_use",
"agent",
"math",
"multilingual"
],
"source": "preset",
"inputPrice": 0.58,
"outputPrice": 2.6,
"defaultTemperature": 0.95
},
{
"modelName": "glm-4.7",
"displayName": "GLM-4.7 (Coding)",
"serviceType": ["chat"],
"description": "智谱 GLM-4.7 Coding Plan 版本200K 上下文",
"serviceType": [
"chat"
],
"description": "智谱 GLM-4.7 Coding Plan 版本202,752 token 上下文",
"contextWindow": 200000,
"maxOutputTokens": 128000,
"capabilities": ["chat", "reasoning", "code", "deep_thinking", "long_context", "tool_use", "multilingual"],
"source": "preset"
"capabilities": [
"chat",
"reasoning",
"code",
"deep_thinking",
"long_context",
"tool_use",
"multilingual"
],
"source": "preset",
"inputPrice": 0.2911,
"outputPrice": 1.1645,
"defaultTemperature": 0.95
}
]
}

View File

@@ -17,10 +17,12 @@
{
"modelName": "claude-opus-4-6",
"displayName": "Claude Opus 4.6",
"serviceType": ["chat"],
"description": "Anthropic 最新旗舰 Opus 模型,最强能力",
"serviceType": [
"chat"
],
"description": "Anthropic Opus 4.61M 上下文,适合复杂代理和编码任务",
"contextWindow": 200000,
"maxOutputTokens": 32768,
"maxOutputTokens": 128000,
"capabilities": [
"chat",
"reasoning",
@@ -36,7 +38,9 @@
{
"modelName": "claude-opus-4-5",
"displayName": "Claude Opus 4.5",
"serviceType": ["chat"],
"serviceType": [
"chat"
],
"description": "Anthropic Opus 4.5,顶级推理能力",
"contextWindow": 200000,
"maxOutputTokens": 32768,
@@ -55,7 +59,9 @@
{
"modelName": "claude-sonnet-4-5",
"displayName": "Claude Sonnet 4.5",
"serviceType": ["chat"],
"serviceType": [
"chat"
],
"description": "Anthropic Sonnet 4.5,高性能性价比",
"contextWindow": 200000,
"maxOutputTokens": 64000,
@@ -74,7 +80,9 @@
{
"modelName": "claude-sonnet-4",
"displayName": "Claude Sonnet 4",
"serviceType": ["chat"],
"serviceType": [
"chat"
],
"description": "Anthropic Sonnet 4 旗舰模型",
"contextWindow": 200000,
"maxOutputTokens": 64000,
@@ -93,7 +101,9 @@
{
"modelName": "claude-sonnet-4-5-computer",
"displayName": "Claude Sonnet 4.5 Computer Use",
"serviceType": ["computer_use"],
"serviceType": [
"computer_use"
],
"description": "Anthropic 最佳 Computer Use 模型",
"contextWindow": 200000,
"maxOutputTokens": 64000,

View File

@@ -18,8 +18,8 @@
"displayName": "百川 M3-Plus",
"serviceType": ["chat"],
"description": "百川智能M3-Plus医疗增强模型235B参数幻觉率仅2.6%API价格较前代下降70%",
"contextWindow": 192000,
"maxOutputTokens": 8192,
"contextWindow": 32000,
"maxOutputTokens": 32000,
"capabilities": [
"chat",
"reasoning",
@@ -40,8 +40,8 @@
"displayName": "百川 M3",
"serviceType": ["chat"],
"description": "百川智能M3新一代开源医疗增强模型235B参数",
"contextWindow": 192000,
"maxOutputTokens": 8192,
"contextWindow": 32000,
"maxOutputTokens": 32000,
"capabilities": [
"chat",
"reasoning",
@@ -61,8 +61,8 @@
"displayName": "百川 M2-Plus",
"serviceType": ["chat"],
"description": "百川智能M2-Plus旗舰模型最强推理和创作能力",
"contextWindow": 128000,
"maxOutputTokens": 8192,
"contextWindow": 32000,
"maxOutputTokens": 32000,
"capabilities": [
"chat",
"reasoning",
@@ -81,8 +81,8 @@
"displayName": "百川 M2",
"serviceType": ["chat"],
"description": "百川智能M2模型高性能通用模型",
"contextWindow": 128000,
"maxOutputTokens": 8192,
"contextWindow": 32000,
"maxOutputTokens": 32000,
"capabilities": [
"chat",
"reasoning",

View File

@@ -9,14 +9,20 @@
"enabled": false,
"status": "unconfigured",
"priceCurrency": "CNY",
"services": ["chat", "reasoning"],
"services": [
"chat",
"reasoning"
],
"models": [
{
"modelName": "ernie-5.0-thinking-latest",
"displayName": "文心 ERNIE 5.0",
"serviceType": ["chat", "reasoning"],
"serviceType": [
"chat",
"reasoning"
],
"description": "百度最新旗舰模型支持深度推理、多模态和工具调用119K输入/64K输出",
"contextWindow": 131072,
"contextWindow": 128000,
"maxOutputTokens": 65536,
"capabilities": [
"chat",
@@ -34,10 +40,12 @@
{
"modelName": "ernie-4.5-turbo-128k-latest",
"displayName": "文心 ERNIE 4.5 Turbo",
"serviceType": ["chat"],
"description": "百度高性价比长上下文模型128K 窗口,适合日常对话和文档处理",
"serviceType": [
"chat"
],
"description": "百度高性价比长上下文模型128K 窗口,最大输出 12,288 token",
"contextWindow": 131072,
"maxOutputTokens": 8192,
"maxOutputTokens": 12288,
"capabilities": [
"chat",
"code",

View File

@@ -15,9 +15,9 @@
"modelName": "command-a-03-2025",
"displayName": "Command A",
"serviceType": ["chat"],
"description": "Cohere 旗舰对话模型262K 上下文,擅长 RAG 和工具调用",
"contextWindow": 262144,
"maxOutputTokens": 8192,
"description": "Cohere 旗舰对话模型256K 上下文,擅长 RAG 和工具调用",
"contextWindow": 256000,
"maxOutputTokens": 8000,
"capabilities": [
"chat",
"reasoning",
@@ -37,8 +37,8 @@
"modelName": "embed-v4.0",
"displayName": "Embed V4",
"serviceType": ["embedding"],
"description": "Cohere 最新 Embedding 模型131K 上下文,多语言支持",
"contextWindow": 131072,
"description": "Cohere 最新 Embedding 模型128K 上下文,多语言支持",
"contextWindow": 128000,
"maxOutputTokens": 0,
"capabilities": [
"text_embedding",
@@ -46,14 +46,15 @@
],
"inputPrice": 0.12,
"outputPrice": 0,
"defaultTemperature": 1,
"extra": {}
},
{
"modelName": "rerank-v3.5",
"displayName": "Rerank V3.5",
"serviceType": ["rerank"],
"description": "Cohere 语义重排序模型,用于检索结果精排",
"contextWindow": 0,
"description": "Cohere 语义重排序模型,用于检索结果精排,默认单文档截断 4096 token",
"contextWindow": 4096,
"maxOutputTokens": 0,
"capabilities": [
"rerank",
@@ -61,6 +62,7 @@
],
"inputPrice": 2.00,
"outputPrice": 0,
"defaultTemperature": 1,
"extra": {}
}
]

View File

@@ -26,10 +26,12 @@
{
"modelName": "qwen3.5-plus",
"displayName": "阿里云 Qwen3.5-Plus",
"serviceType": ["chat"],
"description": "通义千问3.5旗舰模型,支持文本/图像/视频输入效果媲美Qwen3 Max性价比更优",
"contextWindow": 262144,
"maxOutputTokens": 16384,
"serviceType": [
"chat"
],
"description": "通义千问3.5旗舰模型,支持文本/图像/视频输入100万上下文默认开启思考模式",
"contextWindow": 1000000,
"maxOutputTokens": 65536,
"capabilities": [
"chat",
"reasoning",
@@ -44,14 +46,35 @@
"outputPrice": 4.8,
"defaultTemperature": 0.7,
"defaultTopP": 0.8,
"extra": {}
"extra": {
"pricingTiers": [
{
"maxInputTokens": 128000,
"inputPrice": 0.8,
"outputPrice": 4.8
},
{
"maxInputTokens": 256000,
"inputPrice": 2,
"outputPrice": 12
},
{
"maxInputTokens": 1000000,
"inputPrice": 4,
"outputPrice": 24
}
],
"thinkingMaxTokens": 81920
}
},
{
"modelName": "qwen-max",
"displayName": "阿里云 qwen-max",
"serviceType": ["chat"],
"description": "通义千问Max千亿参数旗舰模型最强性能",
"contextWindow": 131072,
"serviceType": [
"chat"
],
"description": "通义千问Max千亿参数旗舰模型32K 上下文",
"contextWindow": 32768,
"maxOutputTokens": 8192,
"capabilities": [
"chat",
@@ -69,10 +92,12 @@
{
"modelName": "qwen-plus",
"displayName": "阿里云 qwen-plus",
"serviceType": ["chat"],
"description": "通义千问Plus支持思考模式128K 上下文",
"contextWindow": 131072,
"maxOutputTokens": 8192,
"serviceType": [
"chat"
],
"description": "通义千问Plus支持思考模式100万上下文",
"contextWindow": 1000000,
"maxOutputTokens": 32768,
"capabilities": [
"chat",
"reasoning",
@@ -83,34 +108,64 @@
"outputPrice": 2,
"defaultTemperature": 0.6,
"defaultTopP": 0.8,
"extra": {}
"extra": {
"pricingTiers": [
{
"maxInputTokens": 128000,
"inputPrice": 0.8,
"outputPrice": 2,
"thinkingOutputPrice": 8
},
{
"maxInputTokens": 256000,
"inputPrice": 2.4,
"outputPrice": 20,
"thinkingOutputPrice": 24
},
{
"maxInputTokens": 1000000,
"inputPrice": 4.8,
"outputPrice": 48,
"thinkingOutputPrice": 64
}
],
"thinkingMaxTokens": 81920
}
},
{
"modelName": "qwen-turbo",
"displayName": "阿里云 qwen-turbo",
"serviceType": ["chat"],
"description": "通义千问Turbo支持100万上下文高性价比",
"serviceType": [
"chat"
],
"description": "通义千问Turbo非思考模式支持100万上下文思考模式支持131K上下文",
"contextWindow": 1000000,
"maxOutputTokens": 8192,
"maxOutputTokens": 16384,
"capabilities": [
"chat",
"code",
"long_context",
"fast"
],
"inputPrice": 0.3,
"outputPrice": 0.6,
"inputPrice": 0.367,
"outputPrice": 1.468,
"defaultTemperature": 0.7,
"defaultTopP": 0.8,
"extra": {}
"extra": {
"thinkingContextWindow": 131072,
"thinkingOutputPrice": 3.67,
"thinkingMaxTokens": 38912
}
},
{
"modelName": "qwen-long",
"displayName": "阿里云 qwen-long",
"serviceType": ["chat"],
"serviceType": [
"chat"
],
"description": "通义千问Long支持1000万上下文适合超长文档处理降价97%",
"contextWindow": 10000000,
"maxOutputTokens": 8192,
"maxOutputTokens": 32768,
"capabilities": [
"chat",
"ultra_long_context",
@@ -125,7 +180,9 @@
{
"modelName": "qwen3-max",
"displayName": "阿里云 Qwen3-Max",
"serviceType": ["chat"],
"serviceType": [
"chat"
],
"description": "通义千问3代旗舰模型262K 上下文,支持思考模式",
"contextWindow": 262144,
"maxOutputTokens": 65536,
@@ -148,10 +205,12 @@
{
"modelName": "qwen3-vl-plus",
"displayName": "阿里云 Qwen3-VL-Plus",
"serviceType": ["vision"],
"serviceType": [
"vision"
],
"description": "通义千问3代视觉模型Plus版支持图像理解",
"contextWindow": 131072,
"maxOutputTokens": 8192,
"contextWindow": 262144,
"maxOutputTokens": 32768,
"capabilities": [
"chat",
"vision",
@@ -161,15 +220,18 @@
],
"inputPrice": 1.5,
"outputPrice": 6,
"defaultTemperature": 0.7,
"extra": {}
},
{
"modelName": "qwen3-vl-flash",
"displayName": "阿里云 Qwen3-VL-Flash",
"serviceType": ["vision"],
"serviceType": [
"vision"
],
"description": "通义千问3代视觉模型Flash版高性价比",
"contextWindow": 131072,
"maxOutputTokens": 8192,
"contextWindow": 262144,
"maxOutputTokens": 32768,
"capabilities": [
"chat",
"vision",
@@ -178,57 +240,78 @@
],
"inputPrice": 0.8,
"outputPrice": 3,
"defaultTemperature": 0.7,
"extra": {}
},
{
"modelName": "text-embedding-v3",
"displayName": "text-embedding-v3",
"serviceType": ["embedding"],
"serviceType": [
"embedding"
],
"description": "阿里云文本向量化",
"contextWindow": 8192,
"capabilities": [
"text_embedding",
"semantic_search",
"chinese_optimized"
],
"inputPrice": 0.7,
"maxOutputTokens": 0,
"defaultTemperature": 1,
"extra": {}
},
{
"modelName": "text-embedding-v4",
"displayName": "阿里云 text-embedding-v4",
"serviceType": ["embedding"],
"serviceType": [
"embedding"
],
"description": "阿里云百炼文本向量模型v4支持多维度与多语种",
"contextWindow": 8192,
"capabilities": [
"text_embedding",
"semantic_search",
"rag"
],
"inputPrice": 0.5,
"maxOutputTokens": 0,
"defaultTemperature": 1,
"extra": {}
},
{
"modelName": "qwen3-rerank",
"displayName": "Qwen3-Rerank",
"serviceType": ["rerank"],
"serviceType": [
"rerank"
],
"description": "检索重排序,支持 100+ 语种",
"contextWindow": 120000,
"maxOutputTokens": 0,
"capabilities": [
"rerank",
"semantic_reranking",
"multilingual"
],
"inputPrice": 1,
"defaultTemperature": 1,
"extra": {}
},
{
"modelName": "cosyvoice-v2",
"displayName": "CosyVoice V2",
"serviceType": ["tts"],
"serviceType": [
"tts"
],
"description": "通义语音合成,支持中英文",
"contextWindow": 0,
"maxOutputTokens": 0,
"capabilities": [
"tts",
"multilingual",
"chinese_optimized"
],
"defaultTemperature": 1,
"extra": {
"voices": [
"longxiaochun",
@@ -246,12 +329,17 @@
{
"modelName": "paraformer-v2",
"displayName": "Paraformer V2",
"serviceType": ["asr"],
"serviceType": [
"asr"
],
"description": "通义语音识别",
"contextWindow": 0,
"maxOutputTokens": 0,
"capabilities": [
"asr",
"chinese_optimized"
],
"defaultTemperature": 1,
"extra": {
"maxAudioLength": 3600,
"supportedInputFormats": [
@@ -266,12 +354,17 @@
{
"modelName": "wanx-v2",
"displayName": "通义万相 V2",
"serviceType": ["image_gen"],
"serviceType": [
"image_gen"
],
"description": "通义万相文生图",
"contextWindow": 0,
"maxOutputTokens": 0,
"capabilities": [
"image_generation",
"chinese_optimized"
],
"defaultTemperature": 1,
"extra": {
"supportedImageSizes": [
"1024x1024",
@@ -289,12 +382,17 @@
{
"modelName": "wanx-video",
"displayName": "通义万相视频",
"serviceType": ["video_gen"],
"serviceType": [
"video_gen"
],
"description": "通义万相文生视频",
"contextWindow": 0,
"maxOutputTokens": 0,
"capabilities": [
"video_generation",
"chinese_optimized"
],
"defaultTemperature": 1,
"extra": {
"maxVideoDuration": 10,
"supportedResolutions": [
@@ -306,13 +404,18 @@
{
"modelName": "cosyvoice-clone",
"displayName": "CosyVoice 声音复刻",
"serviceType": ["voice_clone"],
"serviceType": [
"voice_clone"
],
"description": "通义声音复刻,少量样本即可克隆",
"contextWindow": 0,
"maxOutputTokens": 0,
"capabilities": [
"voice_clone",
"chinese_optimized",
"few_shot"
],
"defaultTemperature": 1,
"extra": {
"maxCloneSamples": 5,
"minCloneDuration": 3
@@ -321,9 +424,12 @@
{
"modelName": "qwen-omni-turbo",
"displayName": "Qwen-Omni-Turbo",
"serviceType": ["omni"],
"serviceType": [
"omni"
],
"description": "通义全能模型,支持音视频文本多模态",
"contextWindow": 32768,
"maxOutputTokens": 2048,
"capabilities": [
"chat",
"vision",
@@ -332,19 +438,24 @@
"multimodal",
"tool_use"
],
"defaultTemperature": 0.7,
"extra": {}
},
{
"modelName": "qwen3-max-trans",
"displayName": "Qwen3-Max翻译",
"serviceType": ["translation"],
"serviceType": [
"translation"
],
"description": "通义千问翻译,中英日韩等多语种互译",
"contextWindow": 131072,
"maxOutputTokens": 8192,
"capabilities": [
"translation",
"multilingual",
"chinese_optimized"
],
"defaultTemperature": 0.7,
"extra": {}
}
]

View File

@@ -17,10 +17,12 @@
{
"modelName": "deepseek-chat",
"displayName": "DeepSeek V3.2",
"serviceType": ["chat"],
"description": "高性价比通用对话模型64K 上下文",
"contextWindow": 64000,
"maxOutputTokens": 8000,
"serviceType": [
"chat"
],
"description": "高性价比通用对话模型128K 上下文",
"contextWindow": 128000,
"maxOutputTokens": 8192,
"capabilities": [
"chat",
"code",
@@ -36,10 +38,12 @@
{
"modelName": "deepseek-reasoner",
"displayName": "DeepSeek R1",
"serviceType": ["reasoning"],
"description": "DeepSeek R1 推理模型64K 上下文,深度推理能力,思维链最长 32K",
"contextWindow": 64000,
"maxOutputTokens": 8192,
"serviceType": [
"reasoning"
],
"description": "DeepSeek V3.2 思考模式128K 上下文,思维链默认 32K最大输出 64K",
"contextWindow": 128000,
"maxOutputTokens": 65536,
"capabilities": [
"chat",
"reasoning",

View File

@@ -19,8 +19,8 @@
"modelName": "gemini-2.5-pro",
"displayName": "Gemini 2.5 Pro",
"serviceType": ["chat"],
"description": "Google 最新旗舰模型100万上下文,多模态",
"contextWindow": 1000000,
"description": "Google 最新旗舰模型1,048,576 token 上下文,多模态",
"contextWindow": 1048576,
"maxOutputTokens": 65536,
"capabilities": [
"chat",
@@ -40,8 +40,8 @@
"modelName": "gemini-2.5-flash",
"displayName": "Gemini 2.5 Flash",
"serviceType": ["chat"],
"description": "Google 高性价比模型100万上下文,速度快",
"contextWindow": 1000000,
"description": "Google 高性价比模型1,048,576 token 上下文,速度快",
"contextWindow": 1048576,
"maxOutputTokens": 65536,
"capabilities": [
"chat",
@@ -63,11 +63,14 @@
"displayName": "Text Embedding 005",
"serviceType": ["embedding"],
"description": "Google 文本嵌入模型768维度",
"contextWindow": 2048,
"maxOutputTokens": 0,
"capabilities": [
"text_embedding",
"semantic_search"
],
"inputPrice": 0.10,
"defaultTemperature": 1,
"extra": {}
}
]

View File

@@ -23,7 +23,7 @@
"chat"
],
"description": "MiniMax M2.7 高速版低延迟吞吐优化200K 上下文",
"contextWindow": 200000,
"contextWindow": 204800,
"maxOutputTokens": 8192,
"capabilities": [
"chat",
@@ -41,9 +41,9 @@
"serviceType": [
"chat"
],
"description": "智谱 GLM-5.1 新一代旗舰模型编程与推理能力断档领先204K 上下文",
"contextWindow": 204800,
"maxOutputTokens": 131072,
"description": "智谱 GLM-5.1 新一代旗舰模型编程与推理能力断档领先200K 上下文",
"contextWindow": 200000,
"maxOutputTokens": 128000,
"capabilities": [
"chat",
"reasoning",
@@ -63,9 +63,9 @@
"serviceType": [
"chat"
],
"description": "智谱 GLM-5 大语言模型",
"contextWindow": 128000,
"maxOutputTokens": 8192,
"description": "智谱 GLM-5 大语言模型200K 上下文",
"contextWindow": 200000,
"maxOutputTokens": 128000,
"capabilities": [
"chat",
"reasoning",
@@ -83,8 +83,8 @@
"chat"
],
"description": "智谱 GLM-5-Turbo 大语言模型,更快的推理速度",
"contextWindow": 128000,
"maxOutputTokens": 8192,
"contextWindow": 200000,
"maxOutputTokens": 128000,
"capabilities": [
"chat",
"reasoning",
@@ -122,7 +122,7 @@
],
"description": "月之暗面 Kimi K2.6 Code Preview万亿参数 MoE 架构32B 激活256K 上下文,代码与智能体能力增强",
"contextWindow": 256000,
"maxOutputTokens": 16384,
"maxOutputTokens": 32768,
"capabilities": [
"chat",
"reasoning",
@@ -144,8 +144,8 @@
"chat"
],
"description": "月之暗面 Kimi-2.5 大语言模型",
"contextWindow": 128000,
"maxOutputTokens": 8192,
"contextWindow": 256000,
"maxOutputTokens": 32768,
"capabilities": [
"chat",
"reasoning",
@@ -167,7 +167,7 @@
"chat"
],
"description": "MiniMax M2.5 大语言模型",
"contextWindow": 128000,
"contextWindow": 204800,
"maxOutputTokens": 8192,
"capabilities": [
"chat",
@@ -211,8 +211,8 @@
"chat"
],
"description": "阿里通义千问 Qwen3.5 Plus",
"contextWindow": 128000,
"maxOutputTokens": 8192,
"contextWindow": 1000000,
"maxOutputTokens": 65536,
"capabilities": [
"chat",
"reasoning",
@@ -276,8 +276,8 @@
"chat"
],
"description": "阿里通义千问 Qwen3 Max (2026-01-23)",
"contextWindow": 128000,
"maxOutputTokens": 8192,
"contextWindow": 262144,
"maxOutputTokens": 32768,
"capabilities": [
"chat",
"reasoning",
@@ -299,8 +299,8 @@
"chat"
],
"description": "字节跳动豆包 Seed 2.0 Code Preview (260215)",
"contextWindow": 128000,
"maxOutputTokens": 8192,
"contextWindow": 256000,
"maxOutputTokens": 128000,
"capabilities": [
"chat",
"reasoning",

View File

@@ -18,12 +18,15 @@
"displayName": "可灵 V2.5 Turbo",
"serviceType": ["video_gen"],
"description": "可灵最新视频生成模型,高性价比",
"contextWindow": 0,
"maxOutputTokens": 0,
"capabilities": [
"video_generation",
"chinese_optimized",
"high_quality",
"fast"
],
"defaultTemperature": 1,
"extra": {
"maxVideoDuration": 10,
"supportedResolutions": [
@@ -38,11 +41,14 @@
"displayName": "可灵 V2.5 Turbo Pro",
"serviceType": ["video_gen"],
"description": "可灵高品质视频生成",
"contextWindow": 0,
"maxOutputTokens": 0,
"capabilities": [
"video_generation",
"chinese_optimized",
"ultra_quality"
],
"defaultTemperature": 1,
"extra": {
"maxVideoDuration": 10,
"supportedResolutions": [
@@ -57,11 +63,14 @@
"displayName": "可灵 V2",
"serviceType": ["video_gen"],
"description": "可灵文生视频旗舰模型",
"contextWindow": 0,
"maxOutputTokens": 0,
"capabilities": [
"video_generation",
"chinese_optimized",
"high_quality"
],
"defaultTemperature": 1,
"extra": {
"maxVideoDuration": 10,
"supportedResolutions": [
@@ -75,11 +84,14 @@
"displayName": "可灵 V2 Master",
"serviceType": ["video_gen"],
"description": "可灵最高品质视频生成",
"contextWindow": 0,
"maxOutputTokens": 0,
"capabilities": [
"video_generation",
"chinese_optimized",
"ultra_quality"
],
"defaultTemperature": 1,
"extra": {
"maxVideoDuration": 10,
"supportedResolutions": [

View File

@@ -18,6 +18,9 @@
"displayName": "Whisper Large V3",
"serviceType": ["asr"],
"description": "本地部署的 Whisper 大模型",
"contextWindow": 0,
"maxOutputTokens": 0,
"defaultTemperature": 1,
"capabilities": [
"asr",
"multilingual"

View File

@@ -8,13 +8,20 @@
"apiKeyVerified": false,
"enabled": false,
"status": "unconfigured",
"priceCurrency": "CNY",
"services": ["chat", "fast", "reasoning"],
"priceCurrency": "USD",
"services": [
"chat",
"fast",
"reasoning"
],
"models": [
{
"modelName": "MiniMax-M2.7",
"displayName": "MiniMax M2.7",
"serviceType": ["chat", "reasoning"],
"serviceType": [
"chat",
"reasoning"
],
"description": "MiniMax 新一代旗舰模型,擅长复杂 Agent、软件工程与专业办公任务",
"contextWindow": 204800,
"maxOutputTokens": 131072,
@@ -24,14 +31,22 @@
"code",
"tool_use"
],
"inputPrice": 0.3,
"outputPrice": 1.2,
"defaultTemperature": 1,
"defaultTopP": 1,
"extra": {}
"extra": {
"cacheReadPrice": 0.06,
"cacheWritePrice": 0.375,
"outputSpeedTps": 60
}
},
{
"modelName": "MiniMax-M2.7-highspeed",
"displayName": "MiniMax M2.7 高速版",
"serviceType": ["fast"],
"serviceType": [
"fast"
],
"description": "MiniMax M2.7 极速版,效果一致,输出更快,适合低延迟场景",
"contextWindow": 204800,
"maxOutputTokens": 131072,
@@ -42,16 +57,25 @@
"tool_use",
"fast"
],
"inputPrice": 0.6,
"outputPrice": 2.4,
"defaultTemperature": 1,
"defaultTopP": 1,
"extra": {}
"extra": {
"cacheReadPrice": 0.06,
"cacheWritePrice": 0.375,
"outputSpeedTps": 100
}
},
{
"modelName": "MiniMax-M2.5",
"displayName": "MiniMax M2.5",
"serviceType": ["chat", "reasoning"],
"description": "MiniMax 最新旗舰模型230B参数(10B激活)MoE架构百万级上下文支持深度推理和工具调用",
"contextWindow": 1000000,
"serviceType": [
"chat",
"reasoning"
],
"description": "MiniMax M2.5204.8K 上下文,支持深度推理和工具调用",
"contextWindow": 204800,
"maxOutputTokens": 131072,
"capabilities": [
"chat",
@@ -60,18 +84,24 @@
"tool_use",
"long_context"
],
"inputPrice": 2.1,
"outputPrice": 8.4,
"inputPrice": 0.3,
"outputPrice": 1.2,
"defaultTemperature": 1,
"defaultTopP": 1,
"extra": {}
"extra": {
"cacheReadPrice": 0.03,
"cacheWritePrice": 0.375,
"outputSpeedTps": 60
}
},
{
"modelName": "MiniMax-M2.5-highspeed",
"displayName": "MiniMax M2.5 高速版",
"serviceType": ["fast"],
"serviceType": [
"fast"
],
"description": "MiniMax M2.5 高速推理版本(100TPS),适合低延迟场景",
"contextWindow": 200000,
"contextWindow": 204800,
"maxOutputTokens": 131072,
"capabilities": [
"chat",
@@ -80,16 +110,22 @@
"tool_use",
"fast"
],
"inputPrice": 2.1,
"outputPrice": 16.8,
"inputPrice": 0.6,
"outputPrice": 2.4,
"defaultTemperature": 1,
"defaultTopP": 1,
"extra": {}
"extra": {
"cacheReadPrice": 0.03,
"cacheWritePrice": 0.375,
"outputSpeedTps": 100
}
},
{
"modelName": "MiniMax-M2.1",
"displayName": "MiniMax M2.1",
"serviceType": ["chat"],
"serviceType": [
"chat"
],
"description": "MiniMax 上一代主力模型200K 上下文,性价比优秀",
"contextWindow": 204800,
"maxOutputTokens": 131072,
@@ -99,16 +135,22 @@
"tool_use",
"reasoning"
],
"inputPrice": 2.1,
"outputPrice": 8.4,
"inputPrice": 0.3,
"outputPrice": 1.2,
"defaultTemperature": 1,
"defaultTopP": 1,
"extra": {}
"extra": {
"cacheReadPrice": 0.03,
"cacheWritePrice": 0.375,
"outputSpeedTps": 60
}
},
{
"modelName": "MiniMax-M2.1-highspeed",
"displayName": "MiniMax M2.1 高速版",
"serviceType": ["fast"],
"serviceType": [
"fast"
],
"description": "MiniMax M2.1 高速推理版本,适合低延迟场景",
"contextWindow": 204800,
"maxOutputTokens": 131072,
@@ -119,16 +161,22 @@
"tool_use",
"fast"
],
"inputPrice": 2.1,
"outputPrice": 16.8,
"inputPrice": 0.6,
"outputPrice": 2.4,
"defaultTemperature": 1,
"defaultTopP": 1,
"extra": {}
"extra": {
"cacheReadPrice": 0.03,
"cacheWritePrice": 0.375,
"outputSpeedTps": 100
}
},
{
"modelName": "MiniMax-Text-01",
"displayName": "MiniMax Text 01",
"serviceType": ["chat"],
"serviceType": [
"chat"
],
"description": "MiniMax 百万级长上下文文本模型,擅长长文档处理",
"contextWindow": 1000000,
"maxOutputTokens": 131072,
@@ -138,8 +186,8 @@
"code",
"long_context"
],
"inputPrice": 1.4,
"outputPrice": 7.7,
"inputPrice": 0.2,
"outputPrice": 1.1,
"defaultTemperature": 1,
"defaultTopP": 1,
"extra": {}

View File

@@ -9,12 +9,17 @@
"enabled": false,
"status": "unconfigured",
"priceCurrency": "USD",
"services": ["chat", "fast"],
"services": [
"chat",
"fast"
],
"models": [
{
"modelName": "mistral-large-latest",
"displayName": "Mistral Large 3",
"serviceType": ["chat"],
"serviceType": [
"chat"
],
"description": "Mistral 旗舰模型256K 上下文,支持视觉和工具调用",
"contextWindow": 256000,
"maxOutputTokens": 262144,
@@ -26,8 +31,8 @@
"tool_use",
"long_context"
],
"inputPrice": 0.50,
"outputPrice": 1.50,
"inputPrice": 0.5,
"outputPrice": 1.5,
"defaultTemperature": 1,
"defaultTopP": 1,
"extra": {}
@@ -35,9 +40,11 @@
{
"modelName": "mistral-small-latest",
"displayName": "Mistral Small 3.2",
"serviceType": ["fast"],
"serviceType": [
"fast"
],
"description": "Mistral 高效小模型,低延迟,适合快速推理场景",
"contextWindow": 130000,
"contextWindow": 128000,
"maxOutputTokens": 8192,
"capabilities": [
"chat",
@@ -47,8 +54,8 @@
"fast",
"tool_use"
],
"inputPrice": 0.10,
"outputPrice": 0.30,
"inputPrice": 0.1,
"outputPrice": 0.3,
"defaultTemperature": 1,
"defaultTopP": 1,
"extra": {}
@@ -56,16 +63,18 @@
{
"modelName": "codestral-latest",
"displayName": "Codestral",
"serviceType": ["chat"],
"serviceType": [
"chat"
],
"description": "Mistral 专业代码模型,支持 Fill-in-the-Middle 补全",
"contextWindow": 256000,
"contextWindow": 128000,
"maxOutputTokens": 32768,
"capabilities": [
"code",
"fill_in_the_middle"
],
"inputPrice": 0.30,
"outputPrice": 0.90,
"inputPrice": 0.3,
"outputPrice": 0.9,
"defaultTemperature": 1,
"defaultTopP": 1,
"extra": {}

View File

@@ -14,13 +14,64 @@
"reasoning"
],
"models": [
{
"modelName": "kimi-k2.6",
"displayName": "Kimi K2.6",
"serviceType": [
"chat"
],
"description": "月之暗面 Kimi K2.6,最新多模态模型,长程代码编写与 Agent 自主执行能力增强256K 上下文,支持思考/非思考模式",
"contextWindow": 256000,
"maxOutputTokens": 32768,
"capabilities": [
"chat",
"reasoning",
"code",
"tool_use",
"agent",
"long_context",
"vision",
"video_understanding",
"image_understanding"
],
"inputPrice": 6.5,
"outputPrice": 27,
"defaultTemperature": 1,
"defaultTopP": 0.95,
"extra": {
"thinking": {
"default": "enabled",
"disabledTemperature": 0.6
},
"cacheHitPrice": 1.1,
"supportedImageFormats": [
"png",
"jpeg",
"webp",
"gif"
],
"supportedVideoFormats": [
"mp4",
"mpeg",
"mov",
"avi",
"x-flv",
"mpg",
"webm",
"wmv",
"3gpp"
]
}
},
{
"modelName": "kimi-k2.5",
"displayName": "Kimi K2.5",
"serviceType": ["chat"],
"description": "月之暗面Kimi K2.52026年1月发布的原生多模态模型支持视觉编码和智能体集群",
"serviceType": [
"chat"
],
"description": "月之暗面Kimi K2.5原生多模态模型256K 上下文,支持思考/非思考模式",
"contextWindow": 256000,
"maxOutputTokens": 16384,
"maxOutputTokens": 32768,
"capabilities": [
"chat",
"reasoning",
@@ -32,15 +83,40 @@
],
"inputPrice": 4,
"outputPrice": 21,
"defaultTemperature": 0.7,
"defaultTopP": 0.9,
"extra": {}
"defaultTemperature": 1,
"defaultTopP": 0.95,
"extra": {
"thinking": {
"default": "enabled",
"disabledTemperature": 0.6
},
"cacheHitPrice": 0.7,
"supportedImageFormats": [
"png",
"jpeg",
"webp",
"gif"
],
"supportedVideoFormats": [
"mp4",
"mpeg",
"mov",
"avi",
"x-flv",
"mpg",
"webm",
"wmv",
"3gpp"
]
}
},
{
"modelName": "kimi-k2",
"displayName": "Kimi K2",
"serviceType": ["chat"],
"description": "月之暗面Kimi K2万亿参数MoE模型(320B激活)256K上下文专为智能体设计",
"serviceType": [
"chat"
],
"description": "月之暗面Kimi K2万亿参数MoE模型(32B激活)256K上下文专为智能体设计",
"contextWindow": 256000,
"maxOutputTokens": 8192,
"capabilities": [
@@ -49,19 +125,22 @@
"code",
"tool_use",
"agent",
"long_context",
"vision"
"long_context"
],
"inputPrice": 4,
"outputPrice": 16,
"defaultTemperature": 0.7,
"defaultTopP": 0.9,
"extra": {}
"extra": {
"cacheHitPrice": 1
}
},
{
"modelName": "kimi-k2-thinking",
"displayName": "Kimi K2 思考版",
"serviceType": ["reasoning"],
"serviceType": [
"reasoning"
],
"description": "月之暗面Kimi K2思考版256K上下文深度推理能力",
"contextWindow": 256000,
"maxOutputTokens": 16384,
@@ -76,12 +155,16 @@
"outputPrice": 16,
"defaultTemperature": 0.7,
"defaultTopP": 0.9,
"extra": {}
"extra": {
"cacheHitPrice": 1
}
},
{
"modelName": "moonshot-v1-8k",
"displayName": "Moonshot V1 8K",
"serviceType": ["chat"],
"serviceType": [
"chat"
],
"description": "月之暗面标准模型8K上下文",
"contextWindow": 8192,
"maxOutputTokens": 4096,
@@ -98,7 +181,9 @@
{
"modelName": "moonshot-v1-32k",
"displayName": "Moonshot V1 32K",
"serviceType": ["chat"],
"serviceType": [
"chat"
],
"description": "月之暗面标准模型32K上下文",
"contextWindow": 32768,
"maxOutputTokens": 4096,
@@ -116,7 +201,9 @@
{
"modelName": "moonshot-v1-128k",
"displayName": "Moonshot V1 128K",
"serviceType": ["chat"],
"serviceType": [
"chat"
],
"description": "月之暗面标准模型128K上下文",
"contextWindow": 131072,
"maxOutputTokens": 4096,

View File

@@ -19,11 +19,13 @@
"serviceType": ["chat"],
"description": "本地运行的 Llama 3.1 70B",
"contextWindow": 131072,
"maxOutputTokens": 8192,
"capabilities": [
"chat",
"code",
"reasoning"
],
"defaultTemperature": 0.7,
"extra": {}
}
]

View File

@@ -25,7 +25,9 @@
{
"modelName": "gpt-5.2",
"displayName": "GPT-5.2",
"serviceType": ["chat"],
"serviceType": [
"chat"
],
"description": "OpenAI 最新旗舰模型400K 上下文,编码和智能体任务优化",
"contextWindow": 400000,
"maxOutputTokens": 128000,
@@ -46,7 +48,9 @@
{
"modelName": "gpt-5.2-pro",
"displayName": "GPT-5.2 Pro",
"serviceType": ["chat"],
"serviceType": [
"chat"
],
"description": "OpenAI GPT-5.2 Pro 专业版,最高性能",
"contextWindow": 400000,
"maxOutputTokens": 128000,
@@ -67,7 +71,9 @@
{
"modelName": "gpt-5.1",
"displayName": "GPT-5.1",
"serviceType": ["chat"],
"serviceType": [
"chat"
],
"description": "OpenAI GPT-5.1400K 上下文,高性能旗舰",
"contextWindow": 400000,
"maxOutputTokens": 128000,
@@ -88,7 +94,9 @@
{
"modelName": "gpt-5",
"displayName": "GPT-5",
"serviceType": ["chat"],
"serviceType": [
"chat"
],
"description": "OpenAI GPT-5 新一代旗舰模型,统一所有模型能力",
"contextWindow": 400000,
"maxOutputTokens": 128000,
@@ -109,10 +117,12 @@
{
"modelName": "gpt-5-pro",
"displayName": "GPT-5 Pro",
"serviceType": ["chat"],
"description": "OpenAI GPT-5 Pro 专业版高性能模型",
"serviceType": [
"chat"
],
"description": "OpenAI GPT-5 Pro 专业版高性能推理模型",
"contextWindow": 400000,
"maxOutputTokens": 128000,
"maxOutputTokens": 272000,
"capabilities": [
"chat",
"reasoning",
@@ -130,10 +140,12 @@
{
"modelName": "gpt-5-mini",
"displayName": "GPT-5-mini",
"serviceType": ["chat"],
"description": "高性价比模型,适合日常对话",
"contextWindow": 128000,
"maxOutputTokens": 32768,
"serviceType": [
"chat"
],
"description": "高性价比模型适合日常对话400K 上下文",
"contextWindow": 400000,
"maxOutputTokens": 128000,
"capabilities": [
"chat",
"fast",
@@ -150,17 +162,19 @@
{
"modelName": "gpt-5-nano",
"displayName": "GPT-5-nano",
"serviceType": ["fast"],
"description": "极速响应模型,适合简单任务",
"contextWindow": 128000,
"maxOutputTokens": 16384,
"serviceType": [
"fast"
],
"description": "极速响应模型适合简单任务400K 上下文",
"contextWindow": 400000,
"maxOutputTokens": 128000,
"capabilities": [
"chat",
"code",
"fast"
],
"inputPrice": 0.02,
"outputPrice": 0.08,
"inputPrice": 0.05,
"outputPrice": 0.4,
"defaultTemperature": 1,
"defaultTopP": 1,
"extra": {}
@@ -168,9 +182,11 @@
{
"modelName": "gpt-4.1",
"displayName": "GPT-4.1",
"serviceType": ["chat"],
"serviceType": [
"chat"
],
"description": "OpenAI GPT-4.1,支持 1M 上下文,编码和指令遵循能力大幅提升",
"contextWindow": 1000000,
"contextWindow": 1047576,
"maxOutputTokens": 32768,
"capabilities": [
"chat",
@@ -180,8 +196,8 @@
"ultra_long_context",
"tool_use"
],
"inputPrice": 2.00,
"outputPrice": 8.00,
"inputPrice": 2,
"outputPrice": 8,
"defaultTemperature": 1,
"defaultTopP": 1,
"extra": {}
@@ -189,9 +205,11 @@
{
"modelName": "gpt-4.1-mini",
"displayName": "GPT-4.1 mini",
"serviceType": ["chat"],
"serviceType": [
"chat"
],
"description": "OpenAI GPT-4.1 mini1M 上下文,高性价比",
"contextWindow": 1000000,
"contextWindow": 1047576,
"maxOutputTokens": 32768,
"capabilities": [
"chat",
@@ -200,8 +218,8 @@
"ultra_long_context",
"tool_use"
],
"inputPrice": 0.40,
"outputPrice": 1.60,
"inputPrice": 0.4,
"outputPrice": 1.6,
"defaultTemperature": 1,
"defaultTopP": 1,
"extra": {}
@@ -209,9 +227,11 @@
{
"modelName": "gpt-4.1-nano",
"displayName": "GPT-4.1 nano",
"serviceType": ["fast"],
"serviceType": [
"fast"
],
"description": "OpenAI GPT-4.1 nano1M 上下文,极致性价比",
"contextWindow": 1000000,
"contextWindow": 1047576,
"maxOutputTokens": 32768,
"capabilities": [
"chat",
@@ -219,8 +239,8 @@
"ultra_long_context",
"fast"
],
"inputPrice": 0.10,
"outputPrice": 0.40,
"inputPrice": 0.1,
"outputPrice": 0.4,
"defaultTemperature": 1,
"defaultTopP": 1,
"extra": {}
@@ -228,7 +248,9 @@
{
"modelName": "gpt-4o",
"displayName": "GPT-4o",
"serviceType": ["vision"],
"serviceType": [
"vision"
],
"description": "多模态模型,支持图像理解",
"contextWindow": 128000,
"maxOutputTokens": 16384,
@@ -238,8 +260,8 @@
"image_understanding",
"tool_use"
],
"inputPrice": 2.50,
"outputPrice": 10.00,
"inputPrice": 2.5,
"outputPrice": 10,
"defaultTemperature": 1,
"defaultTopP": 1,
"extra": {}
@@ -247,7 +269,9 @@
{
"modelName": "gpt-4o-mini",
"displayName": "GPT-4o mini",
"serviceType": ["vision"],
"serviceType": [
"vision"
],
"description": "OpenAI GPT-4o mini高性价比多模态模型",
"contextWindow": 128000,
"maxOutputTokens": 16384,
@@ -258,7 +282,7 @@
"tool_use"
],
"inputPrice": 0.15,
"outputPrice": 0.60,
"outputPrice": 0.6,
"defaultTemperature": 1,
"defaultTopP": 1,
"extra": {}
@@ -266,35 +290,51 @@
{
"modelName": "text-embedding-3-small",
"displayName": "text-embedding-3-small",
"serviceType": ["embedding"],
"serviceType": [
"embedding"
],
"description": "轻量文本向量化模型1536 维",
"contextWindow": 8192,
"maxOutputTokens": 0,
"capabilities": [
"text_embedding",
"semantic_search"
],
"inputPrice": 0.02,
"defaultTemperature": 1,
"extra": {}
},
{
"modelName": "text-embedding-3-large",
"displayName": "text-embedding-3-large",
"serviceType": ["embedding"],
"serviceType": [
"embedding"
],
"description": "高精度文本向量化模型3072 维",
"contextWindow": 8192,
"maxOutputTokens": 0,
"capabilities": [
"text_embedding",
"semantic_search"
],
"inputPrice": 0.13,
"defaultTemperature": 1,
"extra": {}
},
{
"modelName": "tts-1",
"displayName": "TTS-1",
"serviceType": ["tts"],
"serviceType": [
"tts"
],
"description": "标准语音合成",
"contextWindow": 0,
"maxOutputTokens": 0,
"capabilities": [
"tts"
],
"inputPrice": 15,
"defaultTemperature": 1,
"extra": {
"voices": [
"alloy",
@@ -315,11 +355,17 @@
{
"modelName": "tts-1-hd",
"displayName": "TTS-1-HD",
"serviceType": ["tts"],
"serviceType": [
"tts"
],
"description": "高清语音合成",
"contextWindow": 0,
"maxOutputTokens": 0,
"capabilities": [
"tts"
],
"inputPrice": 30,
"defaultTemperature": 1,
"extra": {
"voices": [
"alloy",
@@ -340,12 +386,18 @@
{
"modelName": "whisper-1",
"displayName": "Whisper",
"serviceType": ["asr"],
"serviceType": [
"asr"
],
"description": "通用语音识别",
"contextWindow": 0,
"maxOutputTokens": 0,
"capabilities": [
"asr",
"multilingual"
],
"inputPrice": 0.006,
"defaultTemperature": 1,
"extra": {
"maxAudioLength": 600,
"supportedInputFormats": [
@@ -363,7 +415,9 @@
{
"modelName": "o3",
"displayName": "o3",
"serviceType": ["responses"],
"serviceType": [
"responses"
],
"description": "OpenAI o3 推理模型200K 上下文,支持工具调用",
"contextWindow": 200000,
"maxOutputTokens": 100000,
@@ -375,8 +429,8 @@
"science",
"tool_use"
],
"inputPrice": 2.00,
"outputPrice": 8.00,
"inputPrice": 2,
"outputPrice": 8,
"defaultTemperature": 1,
"defaultTopP": 1,
"extra": {}
@@ -384,7 +438,9 @@
{
"modelName": "o3-pro",
"displayName": "o3-pro",
"serviceType": ["responses"],
"serviceType": [
"responses"
],
"description": "OpenAI o3-pro 高级推理模型200K 上下文",
"contextWindow": 200000,
"maxOutputTokens": 100000,
@@ -395,8 +451,8 @@
"math",
"science"
],
"inputPrice": 20.00,
"outputPrice": 80.00,
"inputPrice": 20,
"outputPrice": 80,
"defaultTemperature": 1,
"defaultTopP": 1,
"extra": {}
@@ -404,9 +460,11 @@
{
"modelName": "o3-mini",
"displayName": "o3-mini",
"serviceType": ["responses"],
"description": "OpenAI o3-mini 推理模型128K 上下文",
"contextWindow": 128000,
"serviceType": [
"responses"
],
"description": "OpenAI o3-mini 推理模型200K 上下文",
"contextWindow": 200000,
"maxOutputTokens": 100000,
"capabilities": [
"reasoning",
@@ -414,8 +472,8 @@
"code",
"fast"
],
"inputPrice": 1.10,
"outputPrice": 4.40,
"inputPrice": 1.1,
"outputPrice": 4.4,
"defaultTemperature": 1,
"defaultTopP": 1,
"extra": {}
@@ -423,7 +481,9 @@
{
"modelName": "o4-mini",
"displayName": "o4-mini",
"serviceType": ["responses"],
"serviceType": [
"responses"
],
"description": "OpenAI o4-mini 推理模型200K 上下文,支持工具调用",
"contextWindow": 200000,
"maxOutputTokens": 100000,
@@ -434,8 +494,8 @@
"tool_use",
"vision"
],
"inputPrice": 1.10,
"outputPrice": 4.40,
"inputPrice": 1.1,
"outputPrice": 4.4,
"defaultTemperature": 1,
"defaultTopP": 1,
"extra": {}
@@ -443,12 +503,17 @@
{
"modelName": "dall-e-3",
"displayName": "DALL-E 3",
"serviceType": ["image_gen"],
"serviceType": [
"image_gen"
],
"description": "高质量文生图模型",
"contextWindow": 0,
"maxOutputTokens": 0,
"capabilities": [
"image_generation",
"text_rendering"
],
"defaultTemperature": 1,
"extra": {
"supportedImageSizes": [
"1024x1024",
@@ -464,9 +529,12 @@
{
"modelName": "gpt-4o-realtime",
"displayName": "GPT-4o Realtime",
"serviceType": ["omni"],
"serviceType": [
"omni"
],
"description": "全能实时模型,支持语音 + 文本 + 视觉",
"contextWindow": 128000,
"contextWindow": 32000,
"maxOutputTokens": 4096,
"capabilities": [
"chat",
"vision",
@@ -474,6 +542,9 @@
"asr",
"realtime"
],
"inputPrice": 4,
"outputPrice": 16,
"defaultTemperature": 1,
"extra": {
"supportedModes": [
"speech-to-speech",
@@ -485,13 +556,20 @@
{
"modelName": "gpt-4o-realtime-preview",
"displayName": "GPT-4o Realtime Preview",
"serviceType": ["realtime_voice"],
"serviceType": [
"realtime_voice"
],
"description": "实时语音交互模型",
"contextWindow": 32000,
"maxOutputTokens": 4096,
"capabilities": [
"realtime",
"speech_to_speech",
"low_latency"
],
"inputPrice": 5,
"outputPrice": 20,
"defaultTemperature": 1,
"extra": {
"supportedModes": [
"speech-to-speech",

View File

@@ -16,7 +16,7 @@
"displayName": "OpenRouter Auto",
"serviceType": ["chat"],
"description": "OpenRouter 自动路由,智能选择最优模型",
"contextWindow": 200000,
"contextWindow": 2000000,
"maxOutputTokens": 16384,
"capabilities": [
"chat",
@@ -29,19 +29,16 @@
"extra": {}
},
{
"modelName": "google/gemini-2.5-flash-exp:free",
"displayName": "Gemini 2.5 Flash (免费)",
"modelName": "openai/gpt-oss-120b:free",
"displayName": "GPT-OSS 120B (免费)",
"serviceType": ["chat"],
"description": "通过 OpenRouter 免费使用的 Gemini 2.5 Flash1M 上下文",
"contextWindow": 1048576,
"maxOutputTokens": 65535,
"description": "通过 OpenRouter 免费使用的 OpenAI GPT-OSS 120B",
"contextWindow": 131072,
"maxOutputTokens": 131072,
"capabilities": [
"chat",
"reasoning",
"vision",
"tool_use",
"fast",
"long_context"
"code"
],
"inputPrice": 0.00,
"outputPrice": 0.00,
@@ -54,8 +51,8 @@
"displayName": "Qwen3 Coder 480B (免费)",
"serviceType": ["chat"],
"description": "通过 OpenRouter 免费使用的 Qwen3 Coder 480B",
"contextWindow": 262144,
"maxOutputTokens": 32768,
"contextWindow": 262000,
"maxOutputTokens": 262000,
"capabilities": [
"code",
"reasoning",

View File

@@ -15,12 +15,13 @@
"modelName": "Qwen/Qwen3-Coder-480B-A35B-Instruct",
"displayName": "Qwen3 Coder 480B (硅基)",
"serviceType": ["chat"],
"description": "开源最强代码模型480B MoE 架构,擅长代码生成和 Agent 场景",
"description": "Qwen3-Coder-480B-A35B-Instruct480B MoE35B 激活),原生 256K 上下文,可通过外推扩展至 1M面向 Agentic Coding",
"contextWindow": 262144,
"maxOutputTokens": 32768,
"maxOutputTokens": 262144,
"capabilities": [
"chat",
"code",
"reasoning",
"long_context",
"agent",
"tool_use"
],
@@ -31,20 +32,19 @@
"extra": {}
},
{
"modelName": "Qwen/Qwen3-235B-A22B-Instruct",
"modelName": "Qwen/Qwen3-235B-A22B-Instruct-2507",
"displayName": "Qwen3 235B (硅基)",
"serviceType": ["chat"],
"description": "Qwen3 旗舰通用模型235B MoE 架构,多语言能力突出",
"description": "Qwen3-235B-A22B-Instruct-2507235B MoE22B 激活通用指令模型262K 上下文",
"contextWindow": 262144,
"maxOutputTokens": 38912,
"maxOutputTokens": 262144,
"capabilities": [
"chat",
"reasoning",
"code",
"multilingual",
"tool_use",
"agent",
"vision"
"long_context"
],
"inputPrice": 2.5,
"outputPrice": 10,
@@ -65,6 +65,7 @@
],
"inputPrice": 0,
"outputPrice": 0,
"defaultTemperature": 1,
"extra": {}
}
]

View File

@@ -18,11 +18,14 @@
"displayName": "Stable Diffusion 3.5 Large",
"serviceType": ["image_gen"],
"description": "Stability AI 旗舰文生图模型",
"contextWindow": 0,
"maxOutputTokens": 0,
"capabilities": [
"image_generation",
"high_quality",
"controllable"
],
"defaultTemperature": 1,
"extra": {
"supportedImageSizes": [
"1024x1024",

View File

@@ -9,14 +9,19 @@
"enabled": false,
"status": "unconfigured",
"priceCurrency": "CNY",
"services": ["chat", "reasoning"],
"services": [
"chat",
"reasoning"
],
"models": [
{
"modelName": "hunyuan-2.0-thinking-20251109",
"displayName": "混元 2.0 Think",
"serviceType": ["reasoning"],
"serviceType": [
"reasoning"
],
"description": "腾讯混元最新推理模型128K输入/64K输出MoE架构406B总参数",
"contextWindow": 131072,
"contextWindow": 128000,
"maxOutputTokens": 65536,
"capabilities": [
"chat",
@@ -31,11 +36,13 @@
"extra": {}
},
{
"modelName": "hunyuan-turbo-s",
"modelName": "hunyuan-turbos-latest",
"displayName": "混元 Turbo S",
"serviceType": ["chat"],
"description": "腾讯混元高速模型262K 上下文,支持推理和工具调用",
"contextWindow": 262144,
"serviceType": [
"chat"
],
"description": "腾讯混元高速模型32K输入/16K输出支持推理和工具调用",
"contextWindow": 32768,
"maxOutputTokens": 16384,
"capabilities": [
"chat",

View File

@@ -23,10 +23,12 @@
{
"modelName": "doubao-2.0-pro",
"displayName": "豆包 2.0 Pro",
"serviceType": ["chat"],
"serviceType": [
"chat"
],
"description": "火山引擎豆包2.0旗舰模型256K上下文相比Gemini 3 Pro和GPT 5.2有较大成本优势",
"contextWindow": 256000,
"maxOutputTokens": 16384,
"maxOutputTokens": 128000,
"capabilities": [
"chat",
"reasoning",
@@ -44,10 +46,12 @@
{
"modelName": "doubao-seed-1.8",
"displayName": "豆包 Seed-1.8",
"serviceType": ["chat"],
"serviceType": [
"chat"
],
"description": "火山引擎豆包1.8旗舰模型256K上下文支持深度思考和多模态",
"contextWindow": 256000,
"maxOutputTokens": 16384,
"maxOutputTokens": 32000,
"capabilities": [
"chat",
"reasoning",
@@ -65,10 +69,12 @@
{
"modelName": "doubao-seed-1.6",
"displayName": "豆包 Seed-1.6",
"serviceType": ["chat"],
"serviceType": [
"chat"
],
"description": "火山引擎豆包1.6旗舰模型256K上下文",
"contextWindow": 256000,
"maxOutputTokens": 16384,
"maxOutputTokens": 32000,
"capabilities": [
"chat",
"reasoning",
@@ -86,7 +92,9 @@
{
"modelName": "doubao-seed-1.6-thinking",
"displayName": "豆包 Seed-1.6 思考版",
"serviceType": ["chat"],
"serviceType": [
"chat"
],
"description": "火山引擎豆包1.6深度思考模型256K上下文",
"contextWindow": 256000,
"maxOutputTokens": 32768,
@@ -105,10 +113,12 @@
{
"modelName": "doubao-seed-1.6-flash",
"displayName": "豆包 Seed-1.6 Flash",
"serviceType": ["chat"],
"serviceType": [
"chat"
],
"description": "火山引擎豆包1.6快速版成本较前代下降63%",
"contextWindow": 256000,
"maxOutputTokens": 8192,
"maxOutputTokens": 32000,
"capabilities": [
"chat",
"code",
@@ -124,10 +134,12 @@
{
"modelName": "doubao-seed-1.6-lite",
"displayName": "豆包 Seed-1.6 Lite",
"serviceType": ["chat"],
"serviceType": [
"chat"
],
"description": "火山引擎豆包1.6轻量版,极致性价比",
"contextWindow": 128000,
"maxOutputTokens": 4096,
"contextWindow": 256000,
"maxOutputTokens": 32000,
"capabilities": [
"chat",
"code",
@@ -142,10 +154,12 @@
{
"modelName": "doubao-seed-1.6-vision",
"displayName": "豆包 Seed-1.6 视觉版",
"serviceType": ["vision"],
"serviceType": [
"vision"
],
"description": "火山引擎豆包1.6视觉模型256K上下文支持视频理解",
"contextWindow": 256000,
"maxOutputTokens": 16384,
"maxOutputTokens": 32000,
"capabilities": [
"chat",
"vision",
@@ -162,7 +176,9 @@
{
"modelName": "doubao-seed-code",
"displayName": "豆包 Seed-Code",
"serviceType": ["chat"],
"serviceType": [
"chat"
],
"description": "火山引擎豆包编程专用模型256K上下文",
"contextWindow": 256000,
"maxOutputTokens": 32768,
@@ -180,10 +196,12 @@
{
"modelName": "deepseek-v3.2",
"displayName": "DeepSeek V3.2 (火山引擎)",
"serviceType": ["chat"],
"serviceType": [
"chat"
],
"description": "火山引擎托管的DeepSeek V3.2128K上下文",
"contextWindow": 128000,
"maxOutputTokens": 8000,
"maxOutputTokens": 32000,
"capabilities": [
"chat",
"reasoning",
@@ -199,10 +217,12 @@
{
"modelName": "deepseek-r1",
"displayName": "DeepSeek R1 (火山引擎)",
"serviceType": ["reasoning"],
"description": "火山引擎托管的DeepSeek R1推理模型64K上下文",
"contextWindow": 64000,
"maxOutputTokens": 32768,
"serviceType": [
"reasoning"
],
"description": "火山引擎托管的DeepSeek R1推理模型128K上下文",
"contextWindow": 128000,
"maxOutputTokens": 65536,
"capabilities": [
"reasoning",
"math",
@@ -219,9 +239,11 @@
{
"modelName": "kimi-k2-volcengine",
"displayName": "Kimi K2 (火山引擎)",
"serviceType": ["chat"],
"serviceType": [
"chat"
],
"description": "火山引擎托管的Kimi K2万亿参数MoE模型256K上下文",
"contextWindow": 128000,
"contextWindow": 256000,
"maxOutputTokens": 8192,
"capabilities": [
"chat",
@@ -240,10 +262,12 @@
{
"modelName": "glm-4-7",
"displayName": "GLM-4.7 (火山引擎)",
"serviceType": ["chat"],
"serviceType": [
"chat"
],
"description": "火山引擎托管的智谱GLM-4.7200K上下文",
"contextWindow": 200000,
"maxOutputTokens": 200000,
"maxOutputTokens": 128000,
"capabilities": [
"chat",
"reasoning",
@@ -261,9 +285,12 @@
{
"modelName": "doubao-embedding",
"displayName": "豆包 Embedding",
"serviceType": ["embedding"],
"serviceType": [
"embedding"
],
"description": "火山引擎豆包标准向量模型2560维度",
"contextWindow": 4096,
"maxOutputTokens": 0,
"capabilities": [
"text_embedding",
"semantic_search",
@@ -271,18 +298,24 @@
"chinese_optimized"
],
"inputPrice": 0.5,
"defaultTemperature": 1,
"extra": {}
},
{
"modelName": "volc-mega-tts-clone",
"displayName": "火山声音复刻",
"serviceType": ["voice_clone"],
"serviceType": [
"voice_clone"
],
"description": "火山引擎声音复刻,支持极少样本",
"contextWindow": 0,
"maxOutputTokens": 0,
"capabilities": [
"voice_clone",
"chinese_optimized",
"few_shot"
],
"defaultTemperature": 1,
"extra": {
"maxCloneSamples": 3,
"minCloneDuration": 5
@@ -291,14 +324,19 @@
{
"modelName": "volc-realtime-voice",
"displayName": "火山实时语音",
"serviceType": ["realtime_voice"],
"serviceType": [
"realtime_voice"
],
"description": "火山引擎实时语音交互",
"contextWindow": 0,
"maxOutputTokens": 0,
"capabilities": [
"realtime",
"speech_to_speech",
"low_latency",
"chinese_optimized"
],
"defaultTemperature": 1,
"extra": {
"supportedModes": [
"speech-to-speech"
@@ -309,13 +347,18 @@
{
"modelName": "volc-simultaneous",
"displayName": "火山同声传译",
"serviceType": ["simultaneous_interpret"],
"serviceType": [
"simultaneous_interpret"
],
"description": "火山引擎同声传译,支持中英双向",
"contextWindow": 0,
"maxOutputTokens": 0,
"capabilities": [
"simultaneous_interpretation",
"chinese_optimized",
"low_latency"
],
"defaultTemperature": 1,
"extra": {
"streamingSupported": true
}
@@ -323,13 +366,18 @@
{
"modelName": "volc-translation",
"displayName": "火山翻译",
"serviceType": ["translation"],
"serviceType": [
"translation"
],
"description": "火山引擎机器翻译,支持多语种互译",
"contextWindow": 0,
"maxOutputTokens": 0,
"capabilities": [
"translation",
"multilingual",
"chinese_optimized"
],
"defaultTemperature": 1,
"extra": {}
}
]

View File

@@ -12,12 +12,12 @@
"services": ["chat", "reasoning"],
"models": [
{
"modelName": "grok-4-0709",
"displayName": "Grok 4",
"modelName": "grok-4.20-0309-reasoning",
"displayName": "Grok 4.20 Reasoning",
"serviceType": ["chat", "reasoning"],
"description": "xAI 最新旗舰推理模型,262K 上下文,支持工具调用",
"contextWindow": 262144,
"maxOutputTokens": 8192,
"description": "xAI 旗舰推理模型,支持函数调用与结构化输出",
"contextWindow": 2000000,
"maxOutputTokens": 16384,
"capabilities": [
"chat",
"reasoning",
@@ -25,17 +25,17 @@
"vision",
"tool_use"
],
"inputPrice": 3.00,
"outputPrice": 15.00,
"inputPrice": 2.00,
"outputPrice": 6.00,
"defaultTemperature": 1,
"defaultTopP": 1,
"extra": {}
},
{
"modelName": "grok-4-1-fast",
"displayName": "Grok 4.1 Fast",
"serviceType": ["chat"],
"description": "xAI 超长上下文高速模型2M token 窗口",
"modelName": "grok-4-1-fast-reasoning",
"displayName": "Grok 4.1 Fast Reasoning",
"serviceType": ["chat", "reasoning"],
"description": "xAI 高速推理模型2M 上下文窗口",
"contextWindow": 2000000,
"maxOutputTokens": 16384,
"capabilities": [

View File

@@ -12,12 +12,12 @@
"services": ["chat", "reasoning"],
"models": [
{
"modelName": "x1",
"modelName": "spark-x",
"displayName": "讯飞星火 X1",
"serviceType": ["reasoning"],
"description": "讯飞最新推理模型,基于全国产算力训练,擅长数学和代码推理",
"contextWindow": 32768,
"maxOutputTokens": 16384,
"description": "讯飞深度推理模型X2输入64K/输出128K支持思考模式与函数调用",
"contextWindow": 65536,
"maxOutputTokens": 128000,
"capabilities": [
"chat",
"reasoning",

View File

@@ -18,15 +18,22 @@
"modelName": "embedding-3",
"displayName": "智谱 embedding-3",
"serviceType": ["embedding"],
"description": "智谱嵌入模型v3支持自定义维度,单条最大3072 tokens。走 OpenAI 兼容 /embeddings 端点Anthropic 协议不提供 embeddings",
"contextWindow": 3072,
"description": "智谱嵌入模型v3支持自定义维度;模型上下文窗口 8K单条输入最多 3072 tokens。走 OpenAI 兼容 /embeddings 端点Anthropic 协议不提供 embeddings",
"contextWindow": 8192,
"maxOutputTokens": 0,
"capabilities": [
"text_embedding",
"semantic_search",
"rag"
"rag",
"custom_dimensions"
],
"inputPrice": 0.5,
"extra": {}
"defaultTemperature": 1,
"extra": {
"maxInputTokensPerItem": 3072,
"maxBatchItems": 64,
"vectorDimensions": "256-2048"
}
}
]
}

View File

@@ -8,7 +8,7 @@
"apiKeyVerified": false,
"enabled": false,
"status": "unconfigured",
"priceCurrency": "CNY",
"priceCurrency": "USD",
"services": [
"chat",
"vision",
@@ -18,10 +18,72 @@
"embedding-3"
],
"models": [
{
"modelName": "glm-5.1",
"displayName": "GLM-5.1",
"serviceType": [
"chat"
],
"description": "智谱 GLM-5.1 最新旗舰模型,面向长程 Agentic Coding 与 Autonomous Agent 场景200K 上下文128K 最大输出",
"contextWindow": 200000,
"maxOutputTokens": 128000,
"capabilities": [
"chat",
"reasoning",
"code",
"multilingual",
"deep_thinking",
"long_context",
"math",
"tool_use",
"agent"
],
"inputPrice": 1.4,
"outputPrice": 4.4,
"defaultTemperature": 1,
"defaultTopP": 0.95,
"extra": {
"cacheHitPrice": 0.26,
"thinking": {
"default": "enabled"
}
}
},
{
"modelName": "glm-5-turbo",
"displayName": "GLM-5-Turbo",
"serviceType": [
"chat"
],
"description": "智谱 GLM-5-Turbo面向 OpenClaw 等长链路任务优化200K 上下文128K 最大输出",
"contextWindow": 200000,
"maxOutputTokens": 128000,
"capabilities": [
"chat",
"reasoning",
"code",
"deep_thinking",
"long_context",
"tool_use",
"agent"
],
"inputPrice": 1.2,
"outputPrice": 4,
"defaultTemperature": 1,
"defaultTopP": 0.95,
"extra": {
"cacheHitPrice": 0.24,
"thinking": {
"default": "enabled"
}
}
},
{
"modelName": "glm-5",
"displayName": "GLM-5",
"serviceType": ["chat"],
"serviceType": [
"chat"
],
"description": "智谱GLM-5744B参数旗舰基座模型2026年2月发布面向Agentic Engineering编程能力接近Claude Opus",
"contextWindow": 200000,
"maxOutputTokens": 128000,
@@ -36,16 +98,20 @@
"tool_use",
"agent"
],
"inputPrice": 4,
"outputPrice": 18,
"defaultTemperature": 0.95,
"defaultTopP": 0.7,
"extra": {}
"inputPrice": 1,
"outputPrice": 3.2,
"defaultTemperature": 1,
"defaultTopP": 0.95,
"extra": {
"cacheHitPrice": 0.2
}
},
{
"modelName": "glm-4.7",
"displayName": "GLM-4.7",
"serviceType": ["chat"],
"serviceType": [
"chat"
],
"description": "智谱GLM-4.7355B参数MoE架构旗舰模型200K上下文编程能力对齐Claude Sonnet",
"contextWindow": 200000,
"maxOutputTokens": 128000,
@@ -58,16 +124,20 @@
"long_context",
"tool_use"
],
"inputPrice": 4,
"outputPrice": 16,
"defaultTemperature": 0.95,
"defaultTopP": 0.7,
"extra": {}
"inputPrice": 0.6,
"outputPrice": 2.2,
"defaultTemperature": 1,
"defaultTopP": 0.95,
"extra": {
"cacheHitPrice": 0.11
}
},
{
"modelName": "glm-4.7-thinking",
"displayName": "GLM-4.7 Thinking",
"serviceType": ["reasoning"],
"serviceType": [
"reasoning"
],
"description": "智谱GLM-4.7深度思考模式200K上下文交错式/保留式/轮级思考",
"contextWindow": 200000,
"maxOutputTokens": 128000,
@@ -78,19 +148,57 @@
"deep_thinking",
"long_context"
],
"inputPrice": 8,
"outputPrice": 32,
"defaultTemperature": 0.95,
"defaultTopP": 0.7,
"extra": {}
"inputPrice": 0.6,
"outputPrice": 2.2,
"defaultTemperature": 1,
"defaultTopP": 0.95,
"extra": {
"cacheHitPrice": 0.11,
"aliasOf": "glm-4.7"
}
},
{
"modelName": "glm-5v-turbo",
"displayName": "GLM-5V-Turbo",
"serviceType": [
"vision"
],
"description": "智谱首个多模态 Coding 基座模型支持视频、图像、文本和文件输入200K 上下文128K 最大输出",
"contextWindow": 200000,
"maxOutputTokens": 128000,
"capabilities": [
"chat",
"vision",
"video_understanding",
"image_understanding",
"file_understanding",
"reasoning",
"code",
"deep_thinking",
"long_context",
"tool_use",
"agent"
],
"inputPrice": 1.2,
"outputPrice": 4,
"defaultTemperature": 1,
"defaultTopP": 0.95,
"extra": {
"cacheHitPrice": 0.24,
"thinking": {
"default": "enabled"
}
}
},
{
"modelName": "glm-4.6v",
"displayName": "GLM-4.6V",
"serviceType": ["vision"],
"serviceType": [
"vision"
],
"description": "智谱GLM-4.6V多模态版106B/12B MoE支持图像视频理解与工具调用128K上下文",
"contextWindow": 128000,
"maxOutputTokens": 8192,
"maxOutputTokens": 32768,
"capabilities": [
"chat",
"vision",
@@ -99,28 +207,37 @@
"long_context",
"tool_use"
],
"inputPrice": 8,
"outputPrice": 32,
"extra": {}
"inputPrice": 0.3,
"outputPrice": 0.9,
"defaultTemperature": 1,
"defaultTopP": 0.95,
"extra": {
"cacheHitPrice": 0.05
}
},
{
"modelName": "glm-4.6",
"displayName": "GLM-4.6",
"serviceType": ["chat"],
"description": "智谱GLM-4.6增强推理能力128K上下文",
"contextWindow": 128000,
"maxOutputTokens": 8192,
"serviceType": [
"chat"
],
"description": "智谱GLM-4.6增强推理能力200K上下文",
"contextWindow": 200000,
"maxOutputTokens": 128000,
"capabilities": [
"chat",
"reasoning",
"code",
"multilingual",
"deep_thinking",
"vision"
"deep_thinking"
],
"inputPrice": 5,
"outputPrice": 5,
"extra": {}
"inputPrice": 0.6,
"outputPrice": 2.2,
"defaultTemperature": 1,
"defaultTopP": 0.95,
"extra": {
"cacheHitPrice": 0.11
}
}
]
}