修复算力模型采样默认值

This commit is contained in:
2026-04-25 21:39:51 +08:00
parent 10465e3570
commit 380e99c577
24 changed files with 1413 additions and 508 deletions

View File

@@ -15,12 +15,106 @@
"embedding"
],
"models": [
{
"modelName": "gemini-3.1-pro-preview",
"displayName": "Gemini 3.1 Pro Preview",
"serviceType": [
"chat"
],
"description": "Google Gemini 3.1 Pro Preview，面向复杂推理、编码和智能体工作流",
"contextWindow": 1048576,
"maxOutputTokens": 65536,
"capabilities": [
"chat",
"reasoning",
"code",
"vision",
"ultra_long_context",
"tool_use"
],
"inputPrice": 2.0,
"outputPrice": 12.0,
"defaultTemperature": 1,
"defaultTopP": 0.95,
"extra": {
"pricingNotes": "Standard paid tier text/image/video price for prompts <= 200K tokens; prompts > 200K are $4 input and $18 output per 1M tokens.",
"cachePricing": {
"inputCacheRead": 0.2,
"inputCacheReadOver200k": 0.4,
"storagePerMillionTokensPerHour": 4.5
}
}
},
{
"modelName": "gemini-3-flash-preview",
"displayName": "Gemini 3 Flash Preview",
"serviceType": [
"chat"
],
"description": "Google Gemini 3 Flash Preview，高速多模态推理模型",
"contextWindow": 1048576,
"maxOutputTokens": 65536,
"capabilities": [
"chat",
"reasoning",
"code",
"vision",
"ultra_long_context",
"tool_use",
"fast"
],
"inputPrice": 0.5,
"outputPrice": 3.0,
"defaultTemperature": 1,
"defaultTopP": 0.95,
"extra": {
"pricingNotes": "Standard paid tier text/image/video price; audio input is $1.00 per 1M tokens.",
"cachePricing": {
"inputCacheRead": 0.05,
"audioInputCacheRead": 0.1,
"storagePerMillionTokensPerHour": 1.0
}
}
},
{
"modelName": "gemini-3.1-flash-lite-preview",
"displayName": "Gemini 3.1 Flash-Lite Preview",
"serviceType": [
"fast"
],
"description": "Google Gemini 3.1 Flash-Lite Preview，低成本高吞吐多模态模型",
"contextWindow": 1048576,
"maxOutputTokens": 65536,
"capabilities": [
"chat",
"reasoning",
"code",
"vision",
"ultra_long_context",
"tool_use",
"fast"
],
"inputPrice": 0.25,
"outputPrice": 1.5,
"defaultTemperature": 1,
"defaultTopP": 0.95,
"extra": {
"pricingNotes": "Standard paid tier text/image/video price; audio input is $0.50 per 1M tokens.",
"cachePricing": {
"inputCacheRead": 0.025,
"audioInputCacheRead": 0.05,
"storagePerMillionTokensPerHour": 1.0
}
}
},
{
"modelName": "gemini-2.5-pro",
"displayName": "Gemini 2.5 Pro",
"serviceType": ["chat"],
"description": "Google 最新旗舰模型100万上下文多模态",
"contextWindow": 1000000,
"serviceType": [
"chat"
],
"description": "Google 最新旗舰模型，1,048,576 token 上下文，多模态",
"contextWindow": 1048576,
"maxOutputTokens": 65536,
"capabilities": [
"chat",
@@ -39,9 +133,11 @@
{
"modelName": "gemini-2.5-flash",
"displayName": "Gemini 2.5 Flash",
"serviceType": ["chat"],
"description": "Google 高性价比模型100万上下文速度快",
"contextWindow": 1000000,
"serviceType": [
"chat"
],
"description": "Google 高性价比模型，1,048,576 token 上下文，速度快",
"contextWindow": 1048576,
"maxOutputTokens": 65536,
"capabilities": [
"chat",
@@ -52,8 +148,8 @@
"tool_use",
"fast"
],
"inputPrice": 0.30,
"outputPrice": 2.50,
"inputPrice": 0.3,
"outputPrice": 2.5,
"defaultTemperature": 1,
"defaultTopP": 0.95,
"extra": {}
@@ -61,13 +157,16 @@
{
"modelName": "text-embedding-005",
"displayName": "Text Embedding 005",
"serviceType": ["embedding"],
"serviceType": [
"embedding"
],
"description": "Google 文本嵌入模型，768维度",
"contextWindow": 2048,
"capabilities": [
"text_embedding",
"semantic_search"
],
"inputPrice": 0.10,
"inputPrice": 0.1,
"extra": {}
}
]