diff --git a/compute/providers/dashscope.json b/compute/providers/dashscope.json index 58d795f..0a3facb 100644 --- a/compute/providers/dashscope.json +++ b/compute/providers/dashscope.json @@ -23,6 +23,88 @@ "translation" ], "models": [ + { + "modelName": "qwen3.6-plus", + "displayName": "阿里云 Qwen3.6-Plus", + "serviceType": [ + "chat", + "vision" + ], + "description": "通义千问3.6 Plus,支持文本/图像/视频输入,100万上下文,支持内置工具和 Function Calling", + "contextWindow": 1000000, + "maxOutputTokens": 65536, + "capabilities": [ + "chat", + "reasoning", + "code", + "multilingual", + "long_context", + "tool_use", + "agent", + "vision" + ], + "inputPrice": 2, + "outputPrice": 12, + "defaultTemperature": 0.6, + "defaultTopP": 0.95, + "extra": { + "pricingTiers": [ + { + "maxInputTokens": 256000, + "inputPrice": 2, + "outputPrice": 12, + "thinkingOutputPrice": 12 + }, + { + "maxInputTokens": 1000000, + "inputPrice": 8, + "outputPrice": 48, + "thinkingOutputPrice": 48 + } + ], + "thinkingMaxTokens": 81920 + } + }, + { + "modelName": "qwen3.6-flash", + "displayName": "阿里云 Qwen3.6-Flash", + "serviceType": [ + "chat", + "vision" + ], + "description": "通义千问3.6 Flash,高性价比多模态模型,100万上下文,支持内置工具和 Function Calling", + "contextWindow": 1000000, + "maxOutputTokens": 65536, + "capabilities": [ + "chat", + "reasoning", + "code", + "multilingual", + "long_context", + "tool_use", + "vision", + "fast" + ], + "inputPrice": 1.2, + "outputPrice": 7.2, + "defaultTemperature": 0.6, + "defaultTopP": 0.95, + "extra": { + "pricingTiers": [ + { + "maxInputTokens": 256000, + "inputPrice": 1.2, + "outputPrice": 7.2 + }, + { + "maxInputTokens": 1000000, + "inputPrice": 4.8, + "outputPrice": 28.8 + } + ], + "thinkingMaxTokens": 131072 + } + }, { "modelName": "qwen3.5-plus", "displayName": "阿里云 Qwen3.5-Plus", @@ -44,8 +126,8 @@ ], "inputPrice": 0.8, "outputPrice": 4.8, - "defaultTemperature": 0.7, - "defaultTopP": 0.8, + "defaultTemperature": 0.6, + "defaultTopP": 0.95, "extra": { "pricingTiers": [ { @@ -106,8 +188,8 @@ ], 
"inputPrice": 0.8, "outputPrice": 2, - "defaultTemperature": 0.6, - "defaultTopP": 0.8, + "defaultTemperature": null, + "defaultTopP": null, "extra": { "pricingTiers": [ { @@ -149,8 +231,8 @@ ], "inputPrice": 0.367, "outputPrice": 1.468, - "defaultTemperature": 0.7, - "defaultTopP": 0.8, + "defaultTemperature": null, + "defaultTopP": null, "extra": { "thinkingContextWindow": 131072, "thinkingOutputPrice": 3.67, @@ -173,7 +255,7 @@ ], "inputPrice": 0.5, "outputPrice": 2, - "defaultTemperature": 0.7, + "defaultTemperature": 1, "defaultTopP": 0.8, "extra": {} }, @@ -198,8 +280,8 @@ ], "inputPrice": 2.5, "outputPrice": 10, - "defaultTemperature": 0.7, - "defaultTopP": 0.8, + "defaultTemperature": null, + "defaultTopP": null, "extra": {} }, { @@ -221,6 +303,7 @@ "inputPrice": 1.5, "outputPrice": 6, "defaultTemperature": 0.7, + "defaultTopP": 0.8, "extra": {} }, { @@ -241,6 +324,7 @@ "inputPrice": 0.8, "outputPrice": 3, "defaultTemperature": 0.7, + "defaultTopP": 0.8, "extra": {} }, { @@ -257,8 +341,8 @@ "chinese_optimized" ], "inputPrice": 0.7, - "maxOutputTokens": 0, - "defaultTemperature": 1, + "defaultTemperature": null, + "defaultTopP": null, "extra": {} }, { @@ -275,8 +359,8 @@ "rag" ], "inputPrice": 0.5, - "maxOutputTokens": 0, - "defaultTemperature": 1, + "defaultTemperature": null, + "defaultTopP": null, "extra": {} }, { @@ -287,14 +371,14 @@ ], "description": "检索重排序,支持 100+ 语种", "contextWindow": 120000, - "maxOutputTokens": 0, "capabilities": [ "rerank", "semantic_reranking", "multilingual" ], "inputPrice": 1, - "defaultTemperature": 1, + "defaultTemperature": null, + "defaultTopP": null, "extra": {} }, { @@ -304,14 +388,13 @@ "tts" ], "description": "通义语音合成,支持中英文", - "contextWindow": 0, - "maxOutputTokens": 0, "capabilities": [ "tts", "multilingual", "chinese_optimized" ], - "defaultTemperature": 1, + "defaultTemperature": null, + "defaultTopP": null, "extra": { "voices": [ "longxiaochun", @@ -333,13 +416,12 @@ "asr" ], "description": "通义语音识别", - 
"contextWindow": 0, - "maxOutputTokens": 0, "capabilities": [ "asr", "chinese_optimized" ], - "defaultTemperature": 1, + "defaultTemperature": null, + "defaultTopP": null, "extra": { "maxAudioLength": 3600, "supportedInputFormats": [ @@ -358,13 +440,12 @@ "image_gen" ], "description": "通义万相文生图", - "contextWindow": 0, - "maxOutputTokens": 0, "capabilities": [ "image_generation", "chinese_optimized" ], - "defaultTemperature": 1, + "defaultTemperature": null, + "defaultTopP": null, "extra": { "supportedImageSizes": [ "1024x1024", @@ -386,13 +467,12 @@ "video_gen" ], "description": "通义万相文生视频", - "contextWindow": 0, - "maxOutputTokens": 0, "capabilities": [ "video_generation", "chinese_optimized" ], - "defaultTemperature": 1, + "defaultTemperature": null, + "defaultTopP": null, "extra": { "maxVideoDuration": 10, "supportedResolutions": [ @@ -408,14 +488,13 @@ "voice_clone" ], "description": "通义声音复刻,少量样本即可克隆", - "contextWindow": 0, - "maxOutputTokens": 0, "capabilities": [ "voice_clone", "chinese_optimized", "few_shot" ], - "defaultTemperature": 1, + "defaultTemperature": null, + "defaultTopP": null, "extra": { "maxCloneSamples": 5, "minCloneDuration": 3 @@ -438,7 +517,8 @@ "multimodal", "tool_use" ], - "defaultTemperature": 0.7, + "defaultTemperature": null, + "defaultTopP": 0.01, "extra": {} }, { @@ -455,7 +535,8 @@ "multilingual", "chinese_optimized" ], - "defaultTemperature": 0.7, + "defaultTemperature": null, + "defaultTopP": null, "extra": {} } ] diff --git a/compute/providers/google.json b/compute/providers/google.json index bc64796..fd3cfd4 100644 --- a/compute/providers/google.json +++ b/compute/providers/google.json @@ -15,6 +15,92 @@ "embedding" ], "models": [ + { + "modelName": "gemini-3.1-pro-preview", + "displayName": "Gemini 3.1 Pro Preview", + "serviceType": ["chat"], + "description": "Google Gemini 3.1 Pro Preview,面向复杂推理、编码和智能体工作流", + "contextWindow": 1048576, + "maxOutputTokens": 65536, + "capabilities": [ + "chat", + "reasoning", + "code", + "vision", 
+ "ultra_long_context", + "tool_use" + ], + "inputPrice": 2.00, + "outputPrice": 12.00, + "defaultTemperature": 1, + "defaultTopP": 0.95, + "extra": { + "pricingNotes": "Standard paid tier text/image/video price for prompts <= 200K tokens; prompts > 200K are $4 input and $18 output per 1M tokens.", + "cachePricing": { + "inputCacheRead": 0.20, + "inputCacheReadOver200k": 0.40, + "storagePerMillionTokensPerHour": 4.50 + } + } + }, + { + "modelName": "gemini-3-flash-preview", + "displayName": "Gemini 3 Flash Preview", + "serviceType": ["chat"], + "description": "Google Gemini 3 Flash Preview,高速多模态推理模型", + "contextWindow": 1048576, + "maxOutputTokens": 65536, + "capabilities": [ + "chat", + "reasoning", + "code", + "vision", + "ultra_long_context", + "tool_use", + "fast" + ], + "inputPrice": 0.50, + "outputPrice": 3.00, + "defaultTemperature": 1, + "defaultTopP": 0.95, + "extra": { + "pricingNotes": "Standard paid tier text/image/video price; audio input is $1.00 per 1M tokens.", + "cachePricing": { + "inputCacheRead": 0.05, + "audioInputCacheRead": 0.10, + "storagePerMillionTokensPerHour": 1.00 + } + } + }, + { + "modelName": "gemini-3.1-flash-lite-preview", + "displayName": "Gemini 3.1 Flash-Lite Preview", + "serviceType": ["chat"], + "description": "Google Gemini 3.1 Flash-Lite Preview,低成本高吞吐多模态模型", + "contextWindow": 1048576, + "maxOutputTokens": 65536, + "capabilities": [ + "chat", + "reasoning", + "code", + "vision", + "ultra_long_context", + "tool_use", + "fast" + ], + "inputPrice": 0.25, + "outputPrice": 1.50, + "defaultTemperature": 1, + "defaultTopP": 0.95, + "extra": { + "pricingNotes": "Standard paid tier text/image/video price; audio input is $0.50 per 1M tokens.", + "cachePricing": { + "inputCacheRead": 0.025, + "audioInputCacheRead": 0.05, + "storagePerMillionTokensPerHour": 1.00 + } + } + }, { "modelName": "gemini-2.5-pro", "displayName": "Gemini 2.5 Pro", @@ -32,7 +118,7 @@ ], "inputPrice": 1.25, "outputPrice": 10, - "defaultTemperature": 1, + 
"defaultTemperature": null, "defaultTopP": 0.95, "extra": {} }, @@ -54,7 +140,7 @@ ], "inputPrice": 0.30, "outputPrice": 2.50, - "defaultTemperature": 1, + "defaultTemperature": null, "defaultTopP": 0.95, "extra": {} }, @@ -64,13 +150,13 @@ "serviceType": ["embedding"], "description": "Google 文本嵌入模型,768维度", "contextWindow": 2048, - "maxOutputTokens": 0, "capabilities": [ "text_embedding", "semantic_search" ], "inputPrice": 0.10, - "defaultTemperature": 1, + "defaultTemperature": null, + "defaultTopP": null, "extra": {} } ] diff --git a/compute/providers/kling.json b/compute/providers/kling.json index ef35efb..0979a7a 100644 --- a/compute/providers/kling.json +++ b/compute/providers/kling.json @@ -18,15 +18,12 @@ "displayName": "可灵 V2.5 Turbo", "serviceType": ["video_gen"], "description": "可灵最新视频生成模型,高性价比", - "contextWindow": 0, - "maxOutputTokens": 0, "capabilities": [ "video_generation", "chinese_optimized", "high_quality", "fast" ], - "defaultTemperature": 1, "extra": { "maxVideoDuration": 10, "supportedResolutions": [ @@ -41,14 +38,11 @@ "displayName": "可灵 V2.5 Turbo Pro", "serviceType": ["video_gen"], "description": "可灵高品质视频生成", - "contextWindow": 0, - "maxOutputTokens": 0, "capabilities": [ "video_generation", "chinese_optimized", "ultra_quality" ], - "defaultTemperature": 1, "extra": { "maxVideoDuration": 10, "supportedResolutions": [ @@ -63,14 +57,11 @@ "displayName": "可灵 V2", "serviceType": ["video_gen"], "description": "可灵文生视频旗舰模型", - "contextWindow": 0, - "maxOutputTokens": 0, "capabilities": [ "video_generation", "chinese_optimized", "high_quality" ], - "defaultTemperature": 1, "extra": { "maxVideoDuration": 10, "supportedResolutions": [ @@ -84,14 +75,11 @@ "displayName": "可灵 V2 Master", "serviceType": ["video_gen"], "description": "可灵最高品质视频生成", - "contextWindow": 0, - "maxOutputTokens": 0, "capabilities": [ "video_generation", "chinese_optimized", "ultra_quality" ], - "defaultTemperature": 1, "extra": { "maxVideoDuration": 10, "supportedResolutions": [ 
diff --git a/compute/providers/local-whisper.json b/compute/providers/local-whisper.json index f0f97c8..f8c58ad 100644 --- a/compute/providers/local-whisper.json +++ b/compute/providers/local-whisper.json @@ -18,9 +18,6 @@ "displayName": "Whisper Large V3", "serviceType": ["asr"], "description": "本地部署的 Whisper 大模型", - "contextWindow": 0, - "maxOutputTokens": 0, - "defaultTemperature": 1, "capabilities": [ "asr", "multilingual" diff --git a/compute/providers/openai.json b/compute/providers/openai.json index b0de87d..ac56c30 100644 --- a/compute/providers/openai.json +++ b/compute/providers/openai.json @@ -295,13 +295,13 @@ ], "description": "轻量文本向量化模型,1536 维", "contextWindow": 8192, - "maxOutputTokens": 0, "capabilities": [ "text_embedding", "semantic_search" ], "inputPrice": 0.02, - "defaultTemperature": 1, + "defaultTemperature": null, + "defaultTopP": null, "extra": {} }, { @@ -312,13 +312,13 @@ ], "description": "高精度文本向量化模型,3072 维", "contextWindow": 8192, - "maxOutputTokens": 0, "capabilities": [ "text_embedding", "semantic_search" ], "inputPrice": 0.13, - "defaultTemperature": 1, + "defaultTemperature": null, + "defaultTopP": null, "extra": {} }, { @@ -328,13 +328,12 @@ "tts" ], "description": "标准语音合成", - "contextWindow": 0, - "maxOutputTokens": 0, "capabilities": [ "tts" ], "inputPrice": 15, - "defaultTemperature": 1, + "defaultTemperature": null, + "defaultTopP": null, "extra": { "voices": [ "alloy", @@ -359,13 +358,12 @@ "tts" ], "description": "高清语音合成", - "contextWindow": 0, - "maxOutputTokens": 0, "capabilities": [ "tts" ], "inputPrice": 30, - "defaultTemperature": 1, + "defaultTemperature": null, + "defaultTopP": null, "extra": { "voices": [ "alloy", @@ -390,14 +388,13 @@ "asr" ], "description": "通用语音识别", - "contextWindow": 0, - "maxOutputTokens": 0, "capabilities": [ "asr", "multilingual" ], "inputPrice": 0.006, - "defaultTemperature": 1, + "defaultTemperature": null, + "defaultTopP": null, "extra": { "maxAudioLength": 600, "supportedInputFormats": [ @@ 
-507,13 +504,12 @@ "image_gen" ], "description": "高质量文生图模型", - "contextWindow": 0, - "maxOutputTokens": 0, "capabilities": [ "image_generation", "text_rendering" ], - "defaultTemperature": 1, + "defaultTemperature": null, + "defaultTopP": null, "extra": { "supportedImageSizes": [ "1024x1024", @@ -544,7 +540,8 @@ ], "inputPrice": 4, "outputPrice": 16, - "defaultTemperature": 1, + "defaultTemperature": 0.7, + "defaultTopP": null, "extra": { "supportedModes": [ "speech-to-speech", @@ -569,7 +566,8 @@ ], "inputPrice": 5, "outputPrice": 20, - "defaultTemperature": 1, + "defaultTemperature": 0.7, + "defaultTopP": null, "extra": { "supportedModes": [ "speech-to-speech", diff --git a/compute/providers/stability.json b/compute/providers/stability.json index 0e8bc98..e12b65d 100644 --- a/compute/providers/stability.json +++ b/compute/providers/stability.json @@ -18,14 +18,11 @@ "displayName": "Stable Diffusion 3.5 Large", "serviceType": ["image_gen"], "description": "Stability AI 旗舰文生图模型", - "contextWindow": 0, - "maxOutputTokens": 0, "capabilities": [ "image_generation", "high_quality", "controllable" ], - "defaultTemperature": 1, "extra": { "supportedImageSizes": [ "1024x1024", diff --git a/compute/providers/volcengine.json b/compute/providers/volcengine.json index cea6456..b4f0714 100644 --- a/compute/providers/volcengine.json +++ b/compute/providers/volcengine.json @@ -39,8 +39,8 @@ ], "inputPrice": 3.2, "outputPrice": 16, - "defaultTemperature": 0.7, - "defaultTopP": 0.9, + "defaultTemperature": 1, + "defaultTopP": 0.7, "extra": {} }, { @@ -51,7 +51,7 @@ ], "description": "火山引擎豆包1.8旗舰模型,256K上下文,支持深度思考和多模态", "contextWindow": 256000, - "maxOutputTokens": 32000, + "maxOutputTokens": 16000, "capabilities": [ "chat", "reasoning", @@ -62,8 +62,8 @@ ], "inputPrice": 0.8, "outputPrice": 2, - "defaultTemperature": 0.7, - "defaultTopP": 0.9, + "defaultTemperature": 1, + "defaultTopP": 0.7, "extra": {} }, { @@ -85,8 +85,8 @@ ], "inputPrice": 0.8, "outputPrice": 8, - 
"defaultTemperature": 0.7, - "defaultTopP": 0.9, + "defaultTemperature": 1, + "defaultTopP": 0.7, "extra": {} }, { @@ -97,7 +97,7 @@ ], "description": "火山引擎豆包1.6深度思考模型,256K上下文", "contextWindow": 256000, - "maxOutputTokens": 32768, + "maxOutputTokens": 16000, "capabilities": [ "reasoning", "math", @@ -107,7 +107,8 @@ ], "inputPrice": 0.8, "outputPrice": 8, - "defaultTemperature": 0.3, + "defaultTemperature": 1, + "defaultTopP": 0.7, "extra": {} }, { @@ -118,7 +119,7 @@ ], "description": "火山引擎豆包1.6快速版,成本较前代下降63%", "contextWindow": 256000, - "maxOutputTokens": 32000, + "maxOutputTokens": 16000, "capabilities": [ "chat", "code", @@ -127,8 +128,8 @@ ], "inputPrice": 0.15, "outputPrice": 1.5, - "defaultTemperature": 0.7, - "defaultTopP": 0.9, + "defaultTemperature": 1, + "defaultTopP": 0.7, "extra": {} }, { @@ -147,8 +148,8 @@ ], "inputPrice": 0.3, "outputPrice": 0.6, - "defaultTemperature": 0.7, - "defaultTopP": 0.9, + "defaultTemperature": 1, + "defaultTopP": 0.7, "extra": {} }, { @@ -169,8 +170,8 @@ ], "inputPrice": 0.8, "outputPrice": 8, - "defaultTemperature": 0.7, - "defaultTopP": 0.9, + "defaultTemperature": 1, + "defaultTopP": 0.7, "extra": {} }, { @@ -190,7 +191,8 @@ ], "inputPrice": 1.2, "outputPrice": 8, - "defaultTemperature": 0.3, + "defaultTemperature": 1, + "defaultTopP": 0.7, "extra": {} }, { @@ -232,8 +234,8 @@ ], "inputPrice": 4, "outputPrice": 16, - "defaultTemperature": 1, - "defaultTopP": 1, + "defaultTemperature": null, + "defaultTopP": null, "extra": {} }, { @@ -255,8 +257,8 @@ ], "inputPrice": 4, "outputPrice": 16, - "defaultTemperature": 0.7, - "defaultTopP": 0.9, + "defaultTemperature": 0.6, + "defaultTopP": 1, "extra": {} }, { @@ -278,8 +280,8 @@ ], "inputPrice": 4, "outputPrice": 16, - "defaultTemperature": 0.7, - "defaultTopP": 0.9, + "defaultTemperature": 1, + "defaultTopP": 0.95, "extra": {} }, { @@ -290,7 +292,6 @@ ], "description": "火山引擎豆包标准向量模型,2560维度", "contextWindow": 4096, - "maxOutputTokens": 0, "capabilities": [ "text_embedding", 
"semantic_search", @@ -298,7 +299,8 @@ "chinese_optimized" ], "inputPrice": 0.5, - "defaultTemperature": 1, + "defaultTemperature": null, + "defaultTopP": null, "extra": {} }, { @@ -308,14 +310,13 @@ "voice_clone" ], "description": "火山引擎声音复刻,支持极少样本", - "contextWindow": 0, - "maxOutputTokens": 0, "capabilities": [ "voice_clone", "chinese_optimized", "few_shot" ], - "defaultTemperature": 1, + "defaultTemperature": null, + "defaultTopP": null, "extra": { "maxCloneSamples": 3, "minCloneDuration": 5 @@ -328,15 +329,14 @@ "realtime_voice" ], "description": "火山引擎实时语音交互", - "contextWindow": 0, - "maxOutputTokens": 0, "capabilities": [ "realtime", "speech_to_speech", "low_latency", "chinese_optimized" ], - "defaultTemperature": 1, + "defaultTemperature": null, + "defaultTopP": null, "extra": { "supportedModes": [ "speech-to-speech" @@ -351,14 +351,13 @@ "simultaneous_interpret" ], "description": "火山引擎同声传译,支持中英双向", - "contextWindow": 0, - "maxOutputTokens": 0, "capabilities": [ "simultaneous_interpretation", "chinese_optimized", "low_latency" ], - "defaultTemperature": 1, + "defaultTemperature": null, + "defaultTopP": null, "extra": { "streamingSupported": true } @@ -370,14 +369,13 @@ "translation" ], "description": "火山引擎机器翻译,支持多语种互译", - "contextWindow": 0, - "maxOutputTokens": 0, "capabilities": [ "translation", "multilingual", "chinese_optimized" ], - "defaultTemperature": 1, + "defaultTemperature": null, + "defaultTopP": null, "extra": {} } ] diff --git a/compute/providers/zhipu-embedding.json b/compute/providers/zhipu-embedding.json index 6031ad8..0d78149 100644 --- a/compute/providers/zhipu-embedding.json +++ b/compute/providers/zhipu-embedding.json @@ -20,7 +20,6 @@ "serviceType": ["embedding"], "description": "智谱嵌入模型v3,支持自定义维度;模型上下文窗口 8K,单条输入最多 3072 tokens。走 OpenAI 兼容 /embeddings 端点(Anthropic 协议不提供 embeddings)", "contextWindow": 8192, - "maxOutputTokens": 0, "capabilities": [ "text_embedding", "semantic_search", @@ -28,7 +27,8 @@ "custom_dimensions" ], "inputPrice": 
0.5, - "defaultTemperature": 1, + "defaultTemperature": null, + "defaultTopP": null, "extra": { "maxInputTokensPerItem": 3072, "maxBatchItems": 64,