Skip to content

Commit e84edec

Browse files
authored
feat(model-specs): 新增模型规格库——跨 provider 模型参数统一维护(presetDataVersion 54→58)
* feat(model-specs): 新增模型规格库与 schema 契约
  - compute/model-specs/:按厂商维护模型内在参数(上下文窗口/最大输出/能力/serviceType/默认温度,不含价签)
  - schemas/model-spec.schema.json:Draft-07 契约,spec 允许 null(新文件不影响老客户端 frozen 契约)
  - scripts/validate.mjs:pickSchemaKey 纳入 model-specs 校验
  - manifest.presetDataVersion 54→55
* feat(model-specs): 新增小米 MiMo 系列模型规格;bump presetDataVersion 55→56
* feat(model-specs): 补全全量模型规格;presetDataVersion 56→57
* feat(model-specs): 新增 releasedAt/retiredAt 时间戳字段;补充 mimo 退役日期
1 parent 9633df0 commit e84edec

25 files changed

Lines changed: 2668 additions & 2 deletions

compute/model-specs/_index.json

Lines changed: 26 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -0,0 +1,26 @@
1+
{
2+
"description": "模型规格库加载顺序索引。元素为对应 JSON 文件的 basename(不含 .json)。",
3+
"order": [
4+
"anthropic",
5+
"openai",
6+
"google",
7+
"deepseek",
8+
"qwen",
9+
"moonshot",
10+
"zhipu",
11+
"minimax",
12+
"xai",
13+
"mistral",
14+
"xiaomi",
15+
"baichuan",
16+
"baidu",
17+
"cohere",
18+
"kling",
19+
"lingyiwanwu",
20+
"perplexity",
21+
"stability",
22+
"tencent",
23+
"volcengine",
24+
"xunfei"
25+
]
26+
}

compute/model-specs/anthropic.json

Lines changed: 65 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,65 @@
1+
{
2+
"description": "Anthropic Claude 系列模型规格。参数来源:config-center compute/providers/anthropic.json。",
3+
"specs": [
4+
{
5+
"id": "claude-opus-4-7",
6+
"displayName": "Claude Opus 4.7",
7+
"family": "claude-opus",
8+
"match": { "patterns": ["claude-opus-4-7*"] },
9+
"spec": {
10+
"contextWindow": 1000000,
11+
"maxOutputTokens": 128000,
12+
"capabilities": ["chat", "reasoning", "code", "vision", "tool_use"],
13+
"serviceType": ["chat"],
14+
"defaultTemperature": 1,
15+
"supportsReasoning": true,
16+
"description": "Anthropic 当前最强通用模型,适合复杂推理和智能体编码任务"
17+
}
18+
},
19+
{
20+
"id": "claude-sonnet-4-6",
21+
"displayName": "Claude Sonnet 4.6",
22+
"family": "claude-sonnet",
23+
"match": { "patterns": ["claude-sonnet-4-6*"] },
24+
"spec": {
25+
"contextWindow": 1000000,
26+
"maxOutputTokens": 64000,
27+
"capabilities": ["chat", "reasoning", "code", "vision", "tool_use", "computer_use"],
28+
"serviceType": ["chat", "computer_use"],
29+
"defaultTemperature": 1,
30+
"supportsReasoning": true,
31+
"description": "Anthropic 高智能高速度模型,适合编码、工具使用和智能体任务"
32+
}
33+
},
34+
{
35+
"id": "claude-sonnet-4-5",
36+
"displayName": "Claude Sonnet 4.5",
37+
"family": "claude-sonnet",
38+
"match": { "patterns": ["claude-sonnet-4-5*"] },
39+
"spec": {
40+
"contextWindow": 1000000,
41+
"maxOutputTokens": 64000,
42+
"capabilities": ["chat", "reasoning", "code", "vision", "tool_use"],
43+
"serviceType": ["chat"],
44+
"defaultTemperature": 1,
45+
"supportsReasoning": true,
46+
"description": "Anthropic 主力模型,长文本与代码任务表现优异"
47+
}
48+
},
49+
{
50+
"id": "claude-haiku-4-5",
51+
"displayName": "Claude Haiku 4.5",
52+
"family": "claude-haiku",
53+
"match": { "patterns": ["claude-haiku-4-5*"] },
54+
"spec": {
55+
"contextWindow": 200000,
56+
"maxOutputTokens": 64000,
57+
"capabilities": ["chat", "reasoning", "code", "vision", "tool_use"],
58+
"serviceType": ["chat"],
59+
"defaultTemperature": 1,
60+
"supportsReasoning": true,
61+
"description": "Anthropic 最快模型,具备接近前沿模型的智能水平"
62+
}
63+
}
64+
]
65+
}

compute/model-specs/baichuan.json

Lines changed: 61 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,61 @@
1+
{
2+
"description": "百川智能 Baichuan 系列模型规格。参数来源:config-center compute/providers/baichuan.json。M3/M2 系列为医疗增强大模型,235B 参数,支持多模态。",
3+
"specs": [
4+
{
5+
"id": "Baichuan-M3-Plus",
6+
"displayName": "百川 M3-Plus",
7+
"family": "baichuan-m3",
8+
"match": { "exact": ["Baichuan-M3-Plus"] },
9+
"spec": {
10+
"contextWindow": 32000,
11+
"maxOutputTokens": 32000,
12+
"capabilities": ["chat", "reasoning", "code", "multilingual", "vision", "long_context", "medical"],
13+
"serviceType": ["chat"],
14+
"defaultTemperature": 0.3,
15+
"description": "百川智能M3-Plus医疗增强模型,235B参数,幻觉率仅2.6%"
16+
}
17+
},
18+
{
19+
"id": "Baichuan-M3",
20+
"displayName": "百川 M3",
21+
"family": "baichuan-m3",
22+
"match": { "exact": ["Baichuan-M3"] },
23+
"spec": {
24+
"contextWindow": 32000,
25+
"maxOutputTokens": 32000,
26+
"capabilities": ["chat", "reasoning", "code", "multilingual", "vision", "medical"],
27+
"serviceType": ["chat"],
28+
"defaultTemperature": 0.3,
29+
"description": "百川智能M3新一代开源医疗增强模型,235B参数"
30+
}
31+
},
32+
{
33+
"id": "Baichuan-M2-Plus",
34+
"displayName": "百川 M2-Plus",
35+
"family": "baichuan-m2",
36+
"match": { "exact": ["Baichuan-M2-Plus"] },
37+
"spec": {
38+
"contextWindow": 32000,
39+
"maxOutputTokens": 32000,
40+
"capabilities": ["chat", "reasoning", "code", "multilingual", "long_context"],
41+
"serviceType": ["chat"],
42+
"defaultTemperature": 0.3,
43+
"description": "百川智能M2-Plus旗舰模型,最强推理和创作能力"
44+
}
45+
},
46+
{
47+
"id": "Baichuan-M2",
48+
"displayName": "百川 M2",
49+
"family": "baichuan-m2",
50+
"match": { "exact": ["Baichuan-M2"] },
51+
"spec": {
52+
"contextWindow": 32000,
53+
"maxOutputTokens": 32000,
54+
"capabilities": ["chat", "reasoning", "code", "multilingual"],
55+
"serviceType": ["chat"],
56+
"defaultTemperature": 0.3,
57+
"description": "百川智能M2高性能通用模型"
58+
}
59+
}
60+
]
61+
}

compute/model-specs/baidu.json

Lines changed: 76 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,76 @@
1+
{
2+
"description": "百度文心 ERNIE 系列模型规格。参数来源:config-center compute/providers/baidu.json。ernie-x1.1 为纯推理模型,defaultTemperature 为 null;ernie-5.0-thinking-latest 同时支持 chat 和 reasoning。",
3+
"specs": [
4+
{
5+
"id": "ernie-5.0-thinking-latest",
6+
"displayName": "文心 ERNIE 5.0",
7+
"family": "ernie-5",
8+
"match": { "exact": ["ernie-5.0-thinking-latest"], "patterns": ["ernie-5.0-thinking*"] },
9+
"spec": {
10+
"contextWindow": 128000,
11+
"maxOutputTokens": 65536,
12+
"capabilities": ["chat", "reasoning", "vision", "multimodal", "tool_use"],
13+
"serviceType": ["chat", "reasoning"],
14+
"supportsReasoning": true,
15+
"description": "百度最新旗舰模型,支持深度推理、多模态和工具调用"
16+
}
17+
},
18+
{
19+
"id": "ernie-5.0",
20+
"displayName": "文心 ERNIE 5.0 非思考",
21+
"family": "ernie-5",
22+
"match": { "exact": ["ernie-5.0"] },
23+
"spec": {
24+
"contextWindow": 131072,
25+
"maxOutputTokens": 65536,
26+
"capabilities": ["chat", "vision", "multimodal", "tool_use"],
27+
"serviceType": ["chat"],
28+
"defaultTemperature": 0.95,
29+
"description": "百度 ERNIE 5.0 旗舰模型,128K 上下文,最大输出 65536 token"
30+
}
31+
},
32+
{
33+
"id": "ernie-4.5-turbo-128k",
34+
"displayName": "文心 ERNIE 4.5 Turbo",
35+
"family": "ernie-4.5",
36+
"match": { "exact": ["ernie-4.5-turbo-128k"], "patterns": ["ernie-4.5-turbo-128k*"] },
37+
"spec": {
38+
"contextWindow": 131072,
39+
"maxOutputTokens": 12288,
40+
"capabilities": ["chat", "code", "vision", "long_context", "fast"],
41+
"serviceType": ["chat"],
42+
"defaultTemperature": 0.8,
43+
"description": "百度高性价比长上下文模型,128K 窗口,最大输出 12288 token"
44+
}
45+
},
46+
{
47+
"id": "ernie-4.5-turbo-20260402",
48+
"displayName": "文心 ERNIE 4.5 Turbo 20260402",
49+
"family": "ernie-4.5",
50+
"match": { "exact": ["ernie-4.5-turbo-20260402"] },
51+
"spec": {
52+
"contextWindow": 131072,
53+
"maxOutputTokens": 12288,
54+
"capabilities": ["chat", "code", "vision", "long_context", "fast"],
55+
"serviceType": ["chat"],
56+
"defaultTemperature": 0.8,
57+
"description": "百度 ERNIE 4.5 Turbo 20260402 快照版,128K 上下文"
58+
}
59+
},
60+
{
61+
"id": "ernie-x1.1",
62+
"displayName": "文心 ERNIE X1.1",
63+
"family": "ernie-x1",
64+
"match": { "exact": ["ernie-x1.1"], "patterns": ["ernie-x1*"] },
65+
"spec": {
66+
"contextWindow": 65536,
67+
"maxOutputTokens": 65536,
68+
"capabilities": ["chat", "reasoning", "deep_thinking", "math", "code"],
69+
"serviceType": ["reasoning"],
70+
"defaultTemperature": null,
71+
"supportsReasoning": true,
72+
"description": "百度 ERNIE X1.1 深度思考推理模型,64K 上下文"
73+
}
74+
}
75+
]
76+
}

compute/model-specs/cohere.json

Lines changed: 57 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,57 @@
1+
{
2+
"description": "Cohere 系列模型规格。参数来源:config-center compute/providers/cohere.json。包含对话、Embedding 和 Rerank 三类服务。",
3+
"specs": [
4+
{
5+
"id": "command-a-03-2025",
6+
"displayName": "Command A",
7+
"family": "command-a",
8+
"match": { "exact": ["command-a-03-2025"], "patterns": ["command-a*"] },
9+
"spec": {
10+
"contextWindow": 256000,
11+
"maxOutputTokens": 8000,
12+
"capabilities": ["chat", "reasoning", "code", "vision", "tool_use", "rag", "long_context"],
13+
"serviceType": ["chat"],
14+
"defaultTemperature": 0.3,
15+
"description": "Cohere 旗舰对话模型,256K 上下文,擅长 RAG 和工具调用"
16+
}
17+
},
18+
{
19+
"id": "command-r7b-12-2024",
20+
"displayName": "Command R7B",
21+
"family": "command-r7b",
22+
"match": { "exact": ["command-r7b-12-2024"], "patterns": ["command-r7b*"] },
23+
"spec": {
24+
"contextWindow": 128000,
25+
"maxOutputTokens": 4000,
26+
"capabilities": ["chat", "reasoning", "tool_use", "rag", "fast"],
27+
"serviceType": ["fast"],
28+
"defaultTemperature": 0.3,
29+
"description": "Cohere 小型高速对话模型,适合高吞吐、低延迟场景"
30+
}
31+
},
32+
{
33+
"id": "embed-v4.0",
34+
"displayName": "Embed V4",
35+
"family": "embed-v4",
36+
"match": { "exact": ["embed-v4.0"], "patterns": ["embed-v4*"] },
37+
"spec": {
38+
"contextWindow": 128000,
39+
"capabilities": ["text_embedding", "multilingual"],
40+
"serviceType": ["embedding"],
41+
"description": "Cohere 最新 Embedding 模型,128K 上下文,多语言支持"
42+
}
43+
},
44+
{
45+
"id": "rerank-v3.5",
46+
"displayName": "Rerank V3.5",
47+
"family": "rerank-v3",
48+
"match": { "exact": ["rerank-v3.5"], "patterns": ["rerank-v3*"] },
49+
"spec": {
50+
"contextWindow": 4096,
51+
"capabilities": ["rerank", "semantic_reranking"],
52+
"serviceType": ["rerank"],
53+
"description": "Cohere 语义重排序模型,用于检索结果精排"
54+
}
55+
}
56+
]
57+
}

compute/model-specs/deepseek.json

Lines changed: 58 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,58 @@
1+
{
2+
"description": "DeepSeek 系列模型规格。参数来源:config-center compute/providers/deepseek.json。",
3+
"specs": [
4+
{
5+
"id": "deepseek-chat",
6+
"displayName": "DeepSeek Chat",
7+
"family": "deepseek-chat",
8+
"match": { "patterns": ["deepseek-chat*"] },
9+
"spec": {
10+
"contextWindow": 1000000,
11+
"maxOutputTokens": 384000,
12+
"capabilities": ["chat", "code", "reasoning", "multilingual", "tool_use"],
13+
"serviceType": ["chat"],
14+
"defaultTemperature": 1
15+
}
16+
},
17+
{
18+
"id": "deepseek-reasoner",
19+
"displayName": "DeepSeek Reasoner",
20+
"family": "deepseek-reasoner",
21+
"match": { "patterns": ["deepseek-reasoner*"] },
22+
"spec": {
23+
"contextWindow": 1000000,
24+
"maxOutputTokens": 384000,
25+
"capabilities": ["chat", "reasoning", "deep_thinking", "code", "math", "tool_use"],
26+
"serviceType": ["reasoning"],
27+
"defaultTemperature": null,
28+
"supportsReasoning": true
29+
}
30+
},
31+
{
32+
"id": "deepseek-v4-pro",
33+
"displayName": "DeepSeek V4 Pro",
34+
"family": "deepseek-v4",
35+
"spec": {
36+
"contextWindow": 1000000,
37+
"maxOutputTokens": 384000,
38+
"capabilities": ["chat", "code", "reasoning", "deep_thinking", "multilingual", "tool_use", "math"],
39+
"serviceType": ["chat", "reasoning"],
40+
"defaultTemperature": 1,
41+
"supportsReasoning": true
42+
}
43+
},
44+
{
45+
"id": "deepseek-v4-flash",
46+
"displayName": "DeepSeek V4 Flash",
47+
"family": "deepseek-v4",
48+
"spec": {
49+
"contextWindow": 1000000,
50+
"maxOutputTokens": 384000,
51+
"capabilities": ["chat", "code", "reasoning", "deep_thinking", "multilingual", "tool_use"],
52+
"serviceType": ["chat", "reasoning"],
53+
"defaultTemperature": 1,
54+
"supportsReasoning": true
55+
}
56+
}
57+
]
58+
}

0 commit comments

Comments
 (0)