fix: remove irrelevant text-model fields from non-text providers

Remove the fields contextWindow: 0 and maxOutputTokens: 0 from non-text
models (tts, asr, image_gen, video_gen, voice_clone, translation, etc.),
and remove maxOutputTokens: 0 from embedding/rerank models. Affected
provider configs: kling, local-whisper, stability, openai, dashscope,
google, volcengine, and zhipu-embedding.

Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>
This commit is contained in:
2026-04-24 19:53:57 +08:00
parent 7159e1cf59
commit cc2fb7b9a5
8 changed files with 256 additions and 111 deletions

View File

@@ -15,6 +15,92 @@
"embedding"
],
"models": [
{
"modelName": "gemini-3.1-pro-preview",
"displayName": "Gemini 3.1 Pro Preview",
"serviceType": ["chat"],
"description": "Google Gemini 3.1 Pro Preview面向复杂推理、编码和智能体工作流",
"contextWindow": 1048576,
"maxOutputTokens": 65536,
"capabilities": [
"chat",
"reasoning",
"code",
"vision",
"ultra_long_context",
"tool_use"
],
"inputPrice": 2.00,
"outputPrice": 12.00,
"defaultTemperature": 1,
"defaultTopP": 0.95,
"extra": {
"pricingNotes": "Standard paid tier text/image/video price for prompts <= 200K tokens; prompts > 200K are $4 input and $18 output per 1M tokens.",
"cachePricing": {
"inputCacheRead": 0.20,
"inputCacheReadOver200k": 0.40,
"storagePerMillionTokensPerHour": 4.50
}
}
},
{
"modelName": "gemini-3-flash-preview",
"displayName": "Gemini 3 Flash Preview",
"serviceType": ["chat"],
"description": "Google Gemini 3 Flash Preview高速多模态推理模型",
"contextWindow": 1048576,
"maxOutputTokens": 65536,
"capabilities": [
"chat",
"reasoning",
"code",
"vision",
"ultra_long_context",
"tool_use",
"fast"
],
"inputPrice": 0.50,
"outputPrice": 3.00,
"defaultTemperature": 1,
"defaultTopP": 0.95,
"extra": {
"pricingNotes": "Standard paid tier text/image/video price; audio input is $1.00 per 1M tokens.",
"cachePricing": {
"inputCacheRead": 0.05,
"audioInputCacheRead": 0.10,
"storagePerMillionTokensPerHour": 1.00
}
}
},
{
"modelName": "gemini-3.1-flash-lite-preview",
"displayName": "Gemini 3.1 Flash-Lite Preview",
"serviceType": ["fast"],
"description": "Google Gemini 3.1 Flash-Lite Preview低成本高吞吐多模态模型",
"contextWindow": 1048576,
"maxOutputTokens": 65536,
"capabilities": [
"chat",
"reasoning",
"code",
"vision",
"ultra_long_context",
"tool_use",
"fast"
],
"inputPrice": 0.25,
"outputPrice": 1.50,
"defaultTemperature": 1,
"defaultTopP": 0.95,
"extra": {
"pricingNotes": "Standard paid tier text/image/video price; audio input is $0.50 per 1M tokens.",
"cachePricing": {
"inputCacheRead": 0.025,
"audioInputCacheRead": 0.05,
"storagePerMillionTokensPerHour": 1.00
}
}
},
{
"modelName": "gemini-2.5-pro",
"displayName": "Gemini 2.5 Pro",
@@ -32,7 +118,7 @@
],
"inputPrice": 1.25,
"outputPrice": 10,
"defaultTemperature": 1,
"defaultTemperature": null,
"defaultTopP": 0.95,
"extra": {}
},
@@ -54,7 +140,7 @@
],
"inputPrice": 0.30,
"outputPrice": 2.50,
"defaultTemperature": 1,
"defaultTemperature": null,
"defaultTopP": 0.95,
"extra": {}
},
@@ -64,13 +150,13 @@
"serviceType": ["embedding"],
"description": "Google 文本嵌入模型768维度",
"contextWindow": 2048,
"maxOutputTokens": 0,
"capabilities": [
"text_embedding",
"semantic_search"
],
"inputPrice": 0.10,
"defaultTemperature": 1,
"defaultTemperature": null,
"defaultTopP": null,
"extra": {}
}
]