whosellm 0.2.1__tar.gz → 0.2.3__tar.gz
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- {whosellm-0.2.1 → whosellm-0.2.3}/.bumpversion.toml +1 -1
- whosellm-0.2.3/.claude/settings.json +5 -0
- {whosellm-0.2.1 → whosellm-0.2.3}/CHANGELOG.md +21 -0
- {whosellm-0.2.1 → whosellm-0.2.3}/PKG-INFO +1 -1
- {whosellm-0.2.1 → whosellm-0.2.3}/pyproject.toml +1 -1
- {whosellm-0.2.1 → whosellm-0.2.3}/tests/models/families/test_deepseek.py +76 -20
- {whosellm-0.2.1 → whosellm-0.2.3}/tests/models/families/test_deepseek_tencent.py +23 -1
- {whosellm-0.2.1 → whosellm-0.2.3}/tests/models/families/test_gpt5.py +0 -3
- {whosellm-0.2.1 → whosellm-0.2.3}/tests/test_auto_register.py +2 -1
- whosellm-0.2.3/tests/test_claude_4x_versions.py +124 -0
- {whosellm-0.2.1 → whosellm-0.2.3}/uv.lock +1 -1
- {whosellm-0.2.1 → whosellm-0.2.3}/whosellm/__init__.py +1 -1
- {whosellm-0.2.1 → whosellm-0.2.3}/whosellm/models/config.py +5 -0
- {whosellm-0.2.1 → whosellm-0.2.3}/whosellm/models/families/anthropic.py +90 -17
- whosellm-0.2.3/whosellm/models/families/deepseek/deepseek_official.py +117 -0
- {whosellm-0.2.1 → whosellm-0.2.3}/whosellm/models/families/deepseek/tencent.py +22 -2
- {whosellm-0.2.1 → whosellm-0.2.3}/whosellm/models/families/openai/openai_gpt_4_1.py +0 -1
- {whosellm-0.2.1 → whosellm-0.2.3}/whosellm/models/families/openai/openai_gpt_5.py +0 -4
- {whosellm-0.2.1 → whosellm-0.2.3}/whosellm/models/families/openai/openai_gpt_5_1.py +0 -1
- {whosellm-0.2.1 → whosellm-0.2.3}/whosellm/models/families/openai/openai_gpt_5_2.py +0 -2
- {whosellm-0.2.1 → whosellm-0.2.3}/whosellm/models/families/openai/openai_gpt_5_4.py +0 -4
- {whosellm-0.2.1 → whosellm-0.2.3}/whosellm/models/families/zhipu.py +0 -5
- {whosellm-0.2.1 → whosellm-0.2.3}/whosellm/models/patterns.py +14 -1
- whosellm-0.2.1/whosellm/models/families/deepseek/deepseek_official.py +0 -72
- {whosellm-0.2.1 → whosellm-0.2.3}/.claude/commands/interview.md +0 -0
- {whosellm-0.2.1 → whosellm-0.2.3}/.claude/projects/-Users-jqq-PycharmProjects-llmeta/memory/MEMORY.md +0 -0
- {whosellm-0.2.1 → whosellm-0.2.3}/.claude/projects/-Users-jqq-PycharmProjects-llmeta/memory/feedback_use_uv.md +0 -0
- {whosellm-0.2.1 → whosellm-0.2.3}/.claude/skills/code-review/SKILL.md +0 -0
- {whosellm-0.2.1 → whosellm-0.2.3}/.claude/skills/create-skill/SKILL.md +0 -0
- {whosellm-0.2.1 → whosellm-0.2.3}/.claude/skills/e2e-metadata/SKILL.md +0 -0
- {whosellm-0.2.1 → whosellm-0.2.3}/.claude/skills/evolve/SKILL.md +0 -0
- {whosellm-0.2.1 → whosellm-0.2.3}/.claude/skills/fix-review/SKILL.md +0 -0
- {whosellm-0.2.1 → whosellm-0.2.3}/.claude/skills/release/SKILL.md +0 -0
- {whosellm-0.2.1 → whosellm-0.2.3}/.claude/skills/review-provider-model/SKILL.md +0 -0
- {whosellm-0.2.1 → whosellm-0.2.3}/.claude/skills/review-provider-model/providers/alibaba.md +0 -0
- {whosellm-0.2.1 → whosellm-0.2.3}/.claude/skills/review-provider-model/providers/anthropic.md +0 -0
- {whosellm-0.2.1 → whosellm-0.2.3}/.claude/skills/review-provider-model/providers/deepseek.md +0 -0
- {whosellm-0.2.1 → whosellm-0.2.3}/.claude/skills/review-provider-model/providers/gemini.md +0 -0
- {whosellm-0.2.1 → whosellm-0.2.3}/.claude/skills/review-provider-model/providers/openai.md +0 -0
- {whosellm-0.2.1 → whosellm-0.2.3}/.claude/skills/review-provider-model/providers/others.md +0 -0
- {whosellm-0.2.1 → whosellm-0.2.3}/.claude/skills/review-provider-model/providers/vidu.md +0 -0
- {whosellm-0.2.1 → whosellm-0.2.3}/.claude/skills/review-provider-model/providers/zhipu.md +0 -0
- {whosellm-0.2.1 → whosellm-0.2.3}/.claude/skills/update-provider-model/SKILL.md +0 -0
- {whosellm-0.2.1 → whosellm-0.2.3}/.claude/skills/update-provider-model/testing.md +0 -0
- {whosellm-0.2.1 → whosellm-0.2.3}/.coveragerc +0 -0
- {whosellm-0.2.1 → whosellm-0.2.3}/.github/workflows/publish.yml +0 -0
- {whosellm-0.2.1 → whosellm-0.2.3}/.github/workflows/tests.yml +0 -0
- {whosellm-0.2.1 → whosellm-0.2.3}/.gitignore +0 -0
- {whosellm-0.2.1 → whosellm-0.2.3}/.windsurf/workflows/addmodel.md +0 -0
- {whosellm-0.2.1 → whosellm-0.2.3}/.windsurf/workflows/arch.md +0 -0
- {whosellm-0.2.1 → whosellm-0.2.3}/.windsurf/workflows/testllmeta.md +0 -0
- {whosellm-0.2.1 → whosellm-0.2.3}/CLAUDE.md +0 -0
- {whosellm-0.2.1 → whosellm-0.2.3}/LICENSE +0 -0
- {whosellm-0.2.1 → whosellm-0.2.3}/README.md +0 -0
- {whosellm-0.2.1 → whosellm-0.2.3}/docs/add_new_model_family.md +0 -0
- {whosellm-0.2.1 → whosellm-0.2.3}/docs/refactor_proposal.md +0 -0
- {whosellm-0.2.1 → whosellm-0.2.3}/docs/spec_model_family_redesign.md +0 -0
- {whosellm-0.2.1 → whosellm-0.2.3}/examples/advanced_usage.py +0 -0
- {whosellm-0.2.1 → whosellm-0.2.3}/examples/basic_usage.py +0 -0
- {whosellm-0.2.1 → whosellm-0.2.3}/mypy.ini +0 -0
- {whosellm-0.2.1 → whosellm-0.2.3}/pytest.ini +0 -0
- {whosellm-0.2.1 → whosellm-0.2.3}/ruff.toml +0 -0
- {whosellm-0.2.1 → whosellm-0.2.3}/tests/__init__.py +0 -0
- {whosellm-0.2.1 → whosellm-0.2.3}/tests/e2e/__init__.py +0 -0
- {whosellm-0.2.1 → whosellm-0.2.3}/tests/e2e/conftest.py +0 -0
- {whosellm-0.2.1 → whosellm-0.2.3}/tests/e2e/test_anthropic.py +0 -0
- {whosellm-0.2.1 → whosellm-0.2.3}/tests/e2e/test_google.py +0 -0
- {whosellm-0.2.1 → whosellm-0.2.3}/tests/e2e/test_openai.py +0 -0
- {whosellm-0.2.1 → whosellm-0.2.3}/tests/e2e/test_zhipu.py +0 -0
- {whosellm-0.2.1 → whosellm-0.2.3}/tests/models/__init__.py +0 -0
- {whosellm-0.2.1 → whosellm-0.2.3}/tests/models/families/__init__.py +0 -0
- {whosellm-0.2.1 → whosellm-0.2.3}/tests/models/families/test_anthropic.py +0 -0
- {whosellm-0.2.1 → whosellm-0.2.3}/tests/models/families/test_gemini.py +0 -0
- {whosellm-0.2.1 → whosellm-0.2.3}/tests/models/families/test_glm45.py +0 -0
- {whosellm-0.2.1 → whosellm-0.2.3}/tests/models/families/test_glm45v.py +0 -0
- {whosellm-0.2.1 → whosellm-0.2.3}/tests/models/families/test_glm46.py +0 -0
- {whosellm-0.2.1 → whosellm-0.2.3}/tests/models/families/test_glm46v.py +0 -0
- {whosellm-0.2.1 → whosellm-0.2.3}/tests/models/families/test_glm5.py +0 -0
- {whosellm-0.2.1 → whosellm-0.2.3}/tests/models/families/test_gpt3_5.py +0 -0
- {whosellm-0.2.1 → whosellm-0.2.3}/tests/models/families/test_gpt4_1.py +0 -0
- {whosellm-0.2.1 → whosellm-0.2.3}/tests/models/families/test_gpt4o.py +0 -0
- {whosellm-0.2.1 → whosellm-0.2.3}/tests/models/families/test_o1.py +0 -0
- {whosellm-0.2.1 → whosellm-0.2.3}/tests/models/families/test_o3.py +0 -0
- {whosellm-0.2.1 → whosellm-0.2.3}/tests/models/families/test_o4.py +0 -0
- {whosellm-0.2.1 → whosellm-0.2.3}/tests/models/families/test_qwen.py +0 -0
- {whosellm-0.2.1 → whosellm-0.2.3}/tests/models/families/test_qwen3_vl_models.py +0 -0
- {whosellm-0.2.1 → whosellm-0.2.3}/tests/models/families/test_qwen_ollama.py +0 -0
- {whosellm-0.2.1 → whosellm-0.2.3}/tests/models/families/test_qwen_plus.py +0 -0
- {whosellm-0.2.1 → whosellm-0.2.3}/tests/test_llmeta.py +0 -0
- {whosellm-0.2.1 → whosellm-0.2.3}/tests/test_model_version.py +0 -0
- {whosellm-0.2.1 → whosellm-0.2.3}/tests/test_provider.py +0 -0
- {whosellm-0.2.1 → whosellm-0.2.3}/tests/test_registry_merge.py +0 -0
- {whosellm-0.2.1 → whosellm-0.2.3}/tests/test_specific_patterns.py +0 -0
- {whosellm-0.2.1 → whosellm-0.2.3}/tests/test_variant_priority_config.py +0 -0
- {whosellm-0.2.1 → whosellm-0.2.3}/whosellm/capabilities.py +0 -0
- {whosellm-0.2.1 → whosellm-0.2.3}/whosellm/model_version.py +0 -0
- {whosellm-0.2.1 → whosellm-0.2.3}/whosellm/models/__init__.py +0 -0
- {whosellm-0.2.1 → whosellm-0.2.3}/whosellm/models/base.py +0 -0
- {whosellm-0.2.1 → whosellm-0.2.3}/whosellm/models/dynamic_enum.py +0 -0
- {whosellm-0.2.1 → whosellm-0.2.3}/whosellm/models/families/__init__.py +0 -0
- {whosellm-0.2.1 → whosellm-0.2.3}/whosellm/models/families/alibaba.py +0 -0
- {whosellm-0.2.1 → whosellm-0.2.3}/whosellm/models/families/deepseek/__init__.py +0 -0
- {whosellm-0.2.1 → whosellm-0.2.3}/whosellm/models/families/gemini.py +0 -0
- {whosellm-0.2.1 → whosellm-0.2.3}/whosellm/models/families/openai/__init__.py +0 -0
- {whosellm-0.2.1 → whosellm-0.2.3}/whosellm/models/families/openai/openai_gpt_3_5.py +0 -0
- {whosellm-0.2.1 → whosellm-0.2.3}/whosellm/models/families/openai/openai_gpt_4.py +0 -0
- {whosellm-0.2.1 → whosellm-0.2.3}/whosellm/models/families/openai/openai_gpt_4o.py +0 -0
- {whosellm-0.2.1 → whosellm-0.2.3}/whosellm/models/families/openai/openai_gpt_5_3.py +0 -0
- {whosellm-0.2.1 → whosellm-0.2.3}/whosellm/models/families/openai/openai_o1.py +0 -0
- {whosellm-0.2.1 → whosellm-0.2.3}/whosellm/models/families/openai/openai_o3.py +0 -0
- {whosellm-0.2.1 → whosellm-0.2.3}/whosellm/models/families/openai/openai_o4.py +0 -0
- {whosellm-0.2.1 → whosellm-0.2.3}/whosellm/models/families/others.py +0 -0
- {whosellm-0.2.1 → whosellm-0.2.3}/whosellm/models/families/vidu.py +0 -0
- {whosellm-0.2.1 → whosellm-0.2.3}/whosellm/models/registry.py +0 -0
- {whosellm-0.2.1 → whosellm-0.2.3}/whosellm/provider.py +0 -0
- {whosellm-0.2.1 → whosellm-0.2.3}/whosellm/py.typed +0 -0
|
@@ -2,6 +2,27 @@
|
|
|
2
2
|
|
|
3
3
|
All notable changes to this project will be documented in this file.
|
|
4
4
|
|
|
5
|
+
## [0.2.3] - Unreleased
|
|
6
|
+
|
|
7
|
+
### Added
|
|
8
|
+
- 新增 Claude Opus 4.x 模型配置(官方规格核实):`claude-opus-4-8`、`claude-opus-4-7`(1M 上下文,128K 最大输出,结构化输出 + computer use)、`claude-opus-4-5`(200K 上下文,64K 最大输出)
|
|
9
|
+
|
|
10
|
+
### Fixed
|
|
11
|
+
- 修复 Claude 4.x 别名版本解析回退 bug:`claude-opus-4-5` / `4-7` / `4-8` 等**无日期别名**此前被 `claude-opus-4-{snapshot:8d}` 模式的"最大宽度"语义把单个数字 minor 误吞为 snapshot,导致版本回退为 `4.0`。改用精确 8 位的 `{snapshot:snapshot}` 自定义类型(`patterns._convert_snapshot`)后,单字段 snapshot 不再吞掉 minor,现存与未来未注册别名均能解析出正确版本(如 `4.8`),版本比较稳定可用
|
|
12
|
+
|
|
13
|
+
## [0.2.2] - 2026-04-24
|
|
14
|
+
|
|
15
|
+
### Added
|
|
16
|
+
- DeepSeek V4 系列模型支持:`deepseek-v4-flash`、`deepseek-v4-pro`(1M 上下文,384K 最大输出,支持思考/非思考双模式)
|
|
17
|
+
- DeepSeek 官方 Provider 支持版本号命名模式(`deepseek-v{major}.{minor}-{variant}` 等),V4 起可通过版本号直接调用
|
|
18
|
+
- 腾讯云 DeepSeek-V3.2(GA 版,685B MoE,稀疏注意力)
|
|
19
|
+
|
|
20
|
+
### Changed
|
|
21
|
+
- `deepseek-chat` / `deepseek-reasoner` 能力基线升级为 V4-flash 非思考/思考模式别名(1M 上下文,384K 输出)
|
|
22
|
+
|
|
23
|
+
### Fixed
|
|
24
|
+
- 腾讯云 `deepseek-r1-0528` 的 `supports_function_calling` 修正为 `False`(官方文档明确列为不支持)
|
|
25
|
+
|
|
5
26
|
## [Unreleased]
|
|
6
27
|
|
|
7
28
|
### Added
|
|
@@ -11,7 +11,7 @@ from whosellm.provider import Provider
|
|
|
11
11
|
|
|
12
12
|
|
|
13
13
|
def test_deepseek_default_capabilities() -> None:
|
|
14
|
-
"""验证 DeepSeek
|
|
14
|
+
"""验证 DeepSeek 官方家族默认能力(V4 基线) / Validate DeepSeek official family default capabilities (V4 baseline)"""
|
|
15
15
|
from whosellm import LLMeta
|
|
16
16
|
|
|
17
17
|
# 使用官方 Provider 前缀确保获取官方配置
|
|
@@ -20,8 +20,10 @@ def test_deepseek_default_capabilities() -> None:
|
|
|
20
20
|
|
|
21
21
|
assert capabilities.supports_streaming is True
|
|
22
22
|
assert capabilities.supports_function_calling is True
|
|
23
|
-
|
|
24
|
-
assert capabilities.
|
|
23
|
+
# V4 系列:1M 上下文,384K 最大输出
|
|
24
|
+
assert capabilities.max_tokens == 384_000
|
|
25
|
+
assert capabilities.context_window == 1_000_000
|
|
26
|
+
# deepseek-chat 是 v4-flash 非思考模式的别名
|
|
25
27
|
assert capabilities.supports_thinking is False
|
|
26
28
|
|
|
27
29
|
|
|
@@ -31,13 +33,13 @@ def test_deepseek_chat_specific_model() -> None:
|
|
|
31
33
|
|
|
32
34
|
assert config is not None
|
|
33
35
|
version, variant, capabilities = config
|
|
34
|
-
assert version == "
|
|
36
|
+
assert version == "4.0"
|
|
35
37
|
assert variant == "chat"
|
|
36
38
|
assert capabilities is not None
|
|
37
39
|
assert capabilities.supports_function_calling is True
|
|
38
40
|
assert capabilities.supports_streaming is True
|
|
39
|
-
assert capabilities.max_tokens ==
|
|
40
|
-
assert capabilities.context_window ==
|
|
41
|
+
assert capabilities.max_tokens == 384_000
|
|
42
|
+
assert capabilities.context_window == 1_000_000
|
|
41
43
|
|
|
42
44
|
|
|
43
45
|
def test_deepseek_chat_pattern_matching() -> None:
|
|
@@ -50,7 +52,7 @@ def test_deepseek_chat_pattern_matching() -> None:
|
|
|
50
52
|
|
|
51
53
|
assert model.family == ModelFamily.DEEPSEEK
|
|
52
54
|
assert model.variant == "chat"
|
|
53
|
-
assert model.version == "
|
|
55
|
+
assert model.version == "4.0"
|
|
54
56
|
assert model.provider == Provider.DEEPSEEK
|
|
55
57
|
|
|
56
58
|
|
|
@@ -60,10 +62,12 @@ def test_deepseek_reasoner_specific_model() -> None:
|
|
|
60
62
|
|
|
61
63
|
assert config is not None
|
|
62
64
|
version, variant, capabilities = config
|
|
63
|
-
assert version == "
|
|
65
|
+
assert version == "4.0"
|
|
64
66
|
assert variant == "reasoner"
|
|
65
67
|
assert capabilities is not None
|
|
66
68
|
assert capabilities.supports_thinking is True
|
|
69
|
+
assert capabilities.max_tokens == 384_000
|
|
70
|
+
assert capabilities.context_window == 1_000_000
|
|
67
71
|
|
|
68
72
|
|
|
69
73
|
def test_deepseek_base_pattern_without_variant() -> None:
|
|
@@ -71,17 +75,16 @@ def test_deepseek_base_pattern_without_variant() -> None:
|
|
|
71
75
|
from whosellm import LLMeta
|
|
72
76
|
|
|
73
77
|
# 使用 Provider 前缀确保匹配官方配置
|
|
74
|
-
# DeepSeek 官方只支持 chat 和 reasoner,默认使用 chat
|
|
75
78
|
model = LLMeta("deepseek::deepseek-chat")
|
|
76
79
|
|
|
77
80
|
assert model.family == ModelFamily.DEEPSEEK
|
|
78
81
|
assert model.variant == "chat"
|
|
79
|
-
assert model.version == "
|
|
82
|
+
assert model.version == "4.0"
|
|
80
83
|
assert model.capabilities.supports_function_calling is True
|
|
81
84
|
|
|
82
85
|
|
|
83
86
|
def test_deepseek_reasoner_does_not_use_chat_capabilities() -> None:
|
|
84
|
-
"""验证 reasoner 不会意外继承 chat
|
|
87
|
+
"""验证 reasoner 不会意外继承 chat 的能力 / Ensure reasoner capabilities override family defaults"""
|
|
85
88
|
from whosellm import LLMeta
|
|
86
89
|
|
|
87
90
|
model = LLMeta("deepseek::deepseek-reasoner")
|
|
@@ -95,7 +98,7 @@ def test_deepseek_no_structured_outputs() -> None:
|
|
|
95
98
|
"""验证 DeepSeek 官方模型不支持 structured_outputs(仅支持 json_object)"""
|
|
96
99
|
from whosellm import LLMeta
|
|
97
100
|
|
|
98
|
-
for model_id in ["deepseek-chat", "deepseek-reasoner"]:
|
|
101
|
+
for model_id in ["deepseek-chat", "deepseek-reasoner", "deepseek-v4-flash", "deepseek-v4-pro"]:
|
|
99
102
|
model = LLMeta(f"deepseek::{model_id}")
|
|
100
103
|
assert model.capabilities.supports_structured_outputs is False, (
|
|
101
104
|
f"{model_id}: DeepSeek API 仅支持 response_format={{type:'json_object'}},"
|
|
@@ -106,15 +109,68 @@ def test_deepseek_no_structured_outputs() -> None:
|
|
|
106
109
|
)
|
|
107
110
|
|
|
108
111
|
|
|
109
|
-
def
|
|
110
|
-
"""验证
|
|
112
|
+
def test_deepseek_v4_flash_specific_model() -> None:
|
|
113
|
+
"""验证 deepseek-v4-flash 特定模型配置 / Validate deepseek-v4-flash specific configuration"""
|
|
111
114
|
from whosellm import LLMeta
|
|
112
115
|
|
|
113
|
-
|
|
114
|
-
# 官方只支持 deepseek-chat-{suffix} 和 deepseek-reasoner-{suffix}
|
|
115
|
-
model = LLMeta("deepseek::deepseek-v3.2-exp")
|
|
116
|
+
model = LLMeta("deepseek::deepseek-v4-flash")
|
|
116
117
|
|
|
117
|
-
|
|
118
|
-
assert model.
|
|
118
|
+
assert model.family == ModelFamily.DEEPSEEK
|
|
119
|
+
assert model.provider == Provider.DEEPSEEK
|
|
120
|
+
assert model.version == "4.0"
|
|
121
|
+
assert model.variant == "flash"
|
|
122
|
+
|
|
123
|
+
caps = model.capabilities
|
|
124
|
+
assert caps.supports_thinking is True
|
|
125
|
+
assert caps.supports_function_calling is True
|
|
126
|
+
assert caps.supports_streaming is True
|
|
127
|
+
assert caps.supports_json_outputs is True
|
|
128
|
+
assert caps.supports_structured_outputs is False
|
|
129
|
+
assert caps.max_tokens == 384_000
|
|
130
|
+
assert caps.context_window == 1_000_000
|
|
131
|
+
|
|
132
|
+
|
|
133
|
+
def test_deepseek_v4_pro_specific_model() -> None:
|
|
134
|
+
"""验证 deepseek-v4-pro 特定模型配置 / Validate deepseek-v4-pro specific configuration"""
|
|
135
|
+
from whosellm import LLMeta
|
|
136
|
+
|
|
137
|
+
model = LLMeta("deepseek::deepseek-v4-pro")
|
|
138
|
+
|
|
139
|
+
assert model.family == ModelFamily.DEEPSEEK
|
|
140
|
+
assert model.provider == Provider.DEEPSEEK
|
|
141
|
+
assert model.version == "4.0"
|
|
142
|
+
assert model.variant == "pro"
|
|
143
|
+
|
|
144
|
+
caps = model.capabilities
|
|
145
|
+
assert caps.supports_thinking is True
|
|
146
|
+
assert caps.supports_function_calling is True
|
|
147
|
+
assert caps.max_tokens == 384_000
|
|
148
|
+
assert caps.context_window == 1_000_000
|
|
149
|
+
|
|
150
|
+
|
|
151
|
+
def test_deepseek_v4_variant_ordering() -> None:
|
|
152
|
+
"""验证 v4-flash < v4-pro 的排序关系 / Validate v4-flash < v4-pro ordering"""
|
|
153
|
+
from whosellm import LLMeta
|
|
154
|
+
|
|
155
|
+
flash = LLMeta("deepseek::deepseek-v4-flash")
|
|
156
|
+
pro = LLMeta("deepseek::deepseek-v4-pro")
|
|
157
|
+
|
|
158
|
+
assert flash < pro
|
|
159
|
+
|
|
160
|
+
|
|
161
|
+
def test_deepseek_versioned_pattern_matches_official_family() -> None:
|
|
162
|
+
"""验证带版本号的 DS 模型名能被官方 family 识别 / Validate versioned DS names match the official family"""
|
|
163
|
+
from whosellm import LLMeta
|
|
164
|
+
|
|
165
|
+
# V4 是 DS 官方首次开放版本号命名的系列
|
|
166
|
+
model = LLMeta("deepseek::deepseek-v4-flash")
|
|
167
|
+
assert model.family == ModelFamily.DEEPSEEK
|
|
119
168
|
assert model.provider == Provider.DEEPSEEK
|
|
120
|
-
assert model.
|
|
169
|
+
assert model.version == "4.0"
|
|
170
|
+
|
|
171
|
+
# 带小数版本号也能匹配 family(即使当前没有 specific_model 条目)
|
|
172
|
+
model_v32 = LLMeta("deepseek::deepseek-v3.2-exp")
|
|
173
|
+
assert model_v32.family == ModelFamily.DEEPSEEK
|
|
174
|
+
assert model_v32.provider == Provider.DEEPSEEK
|
|
175
|
+
assert model_v32.version == "3.2"
|
|
176
|
+
assert model_v32.variant == "exp"
|
|
@@ -66,6 +66,8 @@ def test_tencent_deepseek_r1_0528() -> None:
|
|
|
66
66
|
assert capabilities is not None
|
|
67
67
|
assert capabilities.supports_thinking is True
|
|
68
68
|
assert capabilities.context_window == 128000
|
|
69
|
+
# 腾讯云 LKE 官方文档明确列为不支持 Function Calling
|
|
70
|
+
assert capabilities.supports_function_calling is False
|
|
69
71
|
|
|
70
72
|
|
|
71
73
|
def test_tencent_deepseek_v3_1() -> None:
|
|
@@ -109,6 +111,22 @@ def test_tencent_deepseek_v3_2_exp() -> None:
|
|
|
109
111
|
assert capabilities.context_window == 128000
|
|
110
112
|
|
|
111
113
|
|
|
114
|
+
def test_tencent_deepseek_v3_2() -> None:
|
|
115
|
+
"""测试腾讯云 DeepSeek-V3.2(GA) / Test Tencent DeepSeek-V3.2 (GA)"""
|
|
116
|
+
config = get_specific_model_config("deepseek-v3.2")
|
|
117
|
+
|
|
118
|
+
assert config is not None
|
|
119
|
+
version, variant, capabilities = config
|
|
120
|
+
assert version == "v3.2"
|
|
121
|
+
assert variant == "v3.2"
|
|
122
|
+
assert capabilities is not None
|
|
123
|
+
assert capabilities.supports_thinking is True
|
|
124
|
+
assert capabilities.supports_function_calling is True
|
|
125
|
+
assert capabilities.supports_streaming is True
|
|
126
|
+
assert capabilities.max_tokens == 32000
|
|
127
|
+
assert capabilities.context_window == 128000
|
|
128
|
+
|
|
129
|
+
|
|
112
130
|
def test_tencent_deepseek_pattern_matching() -> None:
|
|
113
131
|
"""测试腾讯云 DeepSeek 模式匹配 / Test Tencent DeepSeek pattern matching"""
|
|
114
132
|
# 测试 V3 系列
|
|
@@ -158,8 +176,12 @@ def test_tencent_deepseek_no_collision_with_official() -> None:
|
|
|
158
176
|
assert tencent_v3.variant == "base"
|
|
159
177
|
|
|
160
178
|
# 不同的能力配置
|
|
161
|
-
|
|
179
|
+
# 官方 deepseek-chat 当前指向 V4-flash 非思考模式(1M 上下文,384K 输出)
|
|
180
|
+
assert official_chat.capabilities.max_tokens == 384_000
|
|
181
|
+
assert official_chat.capabilities.context_window == 1_000_000
|
|
182
|
+
# 腾讯云保持其自有的 DeepSeek 部署规格
|
|
162
183
|
assert tencent_v3.capabilities.max_tokens == 16000
|
|
184
|
+
assert tencent_v3.capabilities.context_window == 64000
|
|
163
185
|
|
|
164
186
|
|
|
165
187
|
def test_tencent_deepseek_invalid_model_names() -> None:
|
|
@@ -193,7 +193,6 @@ def test_gpt5_4_model():
|
|
|
193
193
|
assert m.capabilities.supports_computer_use is True
|
|
194
194
|
|
|
195
195
|
|
|
196
|
-
|
|
197
196
|
def test_gpt5_4_with_date_suffix():
|
|
198
197
|
"""测试带日期的GPT-5.4模型 / Test GPT-5.4 with date suffix"""
|
|
199
198
|
m = LLMeta("gpt-5.4-2026-03-05")
|
|
@@ -239,7 +238,6 @@ def test_gpt5_4_mini_model():
|
|
|
239
238
|
assert m.capabilities.supports_computer_use is True
|
|
240
239
|
|
|
241
240
|
|
|
242
|
-
|
|
243
241
|
def test_gpt5_4_mini_with_date_suffix():
|
|
244
242
|
"""测试带日期的GPT-5.4-mini模型 / Test GPT-5.4-mini with date suffix"""
|
|
245
243
|
m = LLMeta("gpt-5.4-mini-2026-03-17")
|
|
@@ -267,7 +265,6 @@ def test_gpt5_4_nano_model():
|
|
|
267
265
|
assert m.capabilities.supports_computer_use is False
|
|
268
266
|
|
|
269
267
|
|
|
270
|
-
|
|
271
268
|
def test_gpt5_4_nano_with_date_suffix():
|
|
272
269
|
"""测试带日期的GPT-5.4-nano模型 / Test GPT-5.4-nano with date suffix"""
|
|
273
270
|
m = LLMeta("gpt-5.4-nano-2026-03-17")
|
|
@@ -102,7 +102,8 @@ class TestAutoRegister(unittest.TestCase):
|
|
|
102
102
|
assert model.family == ModelFamily.DEEPSEEK
|
|
103
103
|
assert model.provider == Provider.DEEPSEEK
|
|
104
104
|
assert model.capabilities.supports_function_calling is True
|
|
105
|
-
|
|
105
|
+
# V4 起 deepseek-chat 别名为 v4-flash 非思考模式,上下文扩展为 1M
|
|
106
|
+
assert model.capabilities.context_window == 1_000_000
|
|
106
107
|
|
|
107
108
|
def test_auto_register_qwen_variant(self) -> None:
|
|
108
109
|
"""测试自动注册 Qwen 新型号 / Test auto-register Qwen new variant"""
|
|
@@ -0,0 +1,124 @@
|
|
|
1
|
+
# filename: test_claude_4x_versions.py
|
|
2
|
+
"""
|
|
3
|
+
回归测试:Claude 4.x 别名版本解析 + 版本比较稳定性
|
|
4
|
+
Regression tests: Claude 4.x alias version parsing + version-comparison stability
|
|
5
|
+
|
|
6
|
+
背景 / Context:
|
|
7
|
+
TFRobotV2 需要门控 Claude 4.6+ 移除的 assistant prefill。决定**用版本比较**判断
|
|
8
|
+
(`family == CLAUDE and parse_version(version) >= (4, 6)`),而非依赖能力位。
|
|
9
|
+
因此 whosellm 必须保证 4.x 别名(含未注册的新别名)版本解析正确、比较稳定。
|
|
10
|
+
|
|
11
|
+
根因:parse 的 ``{snapshot:8d}`` 是最大宽度,会把 ``claude-opus-4-5`` 的 ``5`` 当 snapshot,
|
|
12
|
+
使 minor 被吞、版本回退 4.0。修复后通过精确 8 位 snapshot 自定义类型解决。
|
|
13
|
+
"""
|
|
14
|
+
|
|
15
|
+
import pytest
|
|
16
|
+
|
|
17
|
+
from whosellm import LLMeta
|
|
18
|
+
from whosellm.models.base import ModelFamily, parse_version
|
|
19
|
+
|
|
20
|
+
# 官方 prefill 真值表(platform.claude.com,逐字核实):不支持 prefill 的恰为版本 >= 4.6
|
|
21
|
+
# Authoritative prefill truth table: models WITHOUT prefill are exactly version >= 4.6
|
|
22
|
+
_PREFILL_REMOVED = {
|
|
23
|
+
"claude-opus-4-8",
|
|
24
|
+
"claude-opus-4-7",
|
|
25
|
+
"claude-opus-4-6",
|
|
26
|
+
"claude-sonnet-4-6",
|
|
27
|
+
}
|
|
28
|
+
_PREFILL_SUPPORTED = {
|
|
29
|
+
"claude-opus-4-5",
|
|
30
|
+
"claude-opus-4-1",
|
|
31
|
+
"claude-opus-4-0",
|
|
32
|
+
"claude-sonnet-4-5",
|
|
33
|
+
"claude-sonnet-4-0",
|
|
34
|
+
"claude-haiku-4-5",
|
|
35
|
+
"claude-3-7-sonnet",
|
|
36
|
+
"claude-3-5-haiku",
|
|
37
|
+
}
|
|
38
|
+
|
|
39
|
+
|
|
40
|
+
class TestClaude4xAliasVersionParsing:
|
|
41
|
+
"""未注册/新增的 Claude 4.x 别名应解析出正确版本,而非回退 family 默认 4.0"""
|
|
42
|
+
|
|
43
|
+
@pytest.mark.parametrize(
|
|
44
|
+
"model_name,expected_version,expected_variant",
|
|
45
|
+
[
|
|
46
|
+
("claude-opus-4-8", "4.8", "opus"),
|
|
47
|
+
("claude-opus-4-7", "4.7", "opus"),
|
|
48
|
+
("claude-opus-4-6", "4.6", "opus"),
|
|
49
|
+
("claude-opus-4-5", "4.5", "opus"),
|
|
50
|
+
("claude-opus-4-5-20251101", "4.5", "opus"),
|
|
51
|
+
("claude-haiku-4-5-20251001", "4.5", "haiku"),
|
|
52
|
+
("claude-sonnet-4-6", "4.6", "sonnet"),
|
|
53
|
+
("claude-sonnet-4-5", "4.5", "sonnet"),
|
|
54
|
+
],
|
|
55
|
+
)
|
|
56
|
+
def test_alias_version(self, model_name: str, expected_version: str, expected_variant: str):
|
|
57
|
+
meta = LLMeta(model_name)
|
|
58
|
+
assert meta.version == expected_version, f"{model_name} 解析出错误版本 {meta.version}"
|
|
59
|
+
assert meta.variant == expected_variant
|
|
60
|
+
assert meta.family == ModelFamily.CLAUDE
|
|
61
|
+
|
|
62
|
+
def test_dated_4_0_snapshot_still_resolves_to_4_0(self):
|
|
63
|
+
"""带 8 位日期的原始 4.0 snapshot 仍应识别为 4.0,不被精确宽度修复破坏"""
|
|
64
|
+
meta = LLMeta("claude-opus-4-20250514")
|
|
65
|
+
assert meta.version == "4.0"
|
|
66
|
+
assert meta.variant == "opus"
|
|
67
|
+
|
|
68
|
+
def test_short_digit_not_swallowed_as_snapshot(self):
|
|
69
|
+
"""根因回归:单个数字 minor 不得被 {snapshot} 吞掉"""
|
|
70
|
+
assert LLMeta("claude-opus-4-5").version == "4.5"
|
|
71
|
+
assert LLMeta("claude-opus-4-7").version == "4.7"
|
|
72
|
+
assert LLMeta("claude-opus-4-8").version == "4.8"
|
|
73
|
+
|
|
74
|
+
|
|
75
|
+
class TestClaude4xCapabilities:
|
|
76
|
+
"""新增模型应带官方真实能力(非臆测/镜像)"""
|
|
77
|
+
|
|
78
|
+
@pytest.mark.parametrize(
|
|
79
|
+
"model_name,ctx,max_out",
|
|
80
|
+
[
|
|
81
|
+
("claude-opus-4-8", 1000000, 128000),
|
|
82
|
+
("claude-opus-4-7", 1000000, 128000),
|
|
83
|
+
("claude-opus-4-5", 200000, 64000),
|
|
84
|
+
],
|
|
85
|
+
)
|
|
86
|
+
def test_new_model_specs(self, model_name: str, ctx: int, max_out: int):
|
|
87
|
+
caps = LLMeta(model_name).capabilities
|
|
88
|
+
assert caps.context_window == ctx
|
|
89
|
+
assert caps.max_tokens == max_out
|
|
90
|
+
assert caps.supports_structured_outputs is True
|
|
91
|
+
assert caps.supports_computer_use is True
|
|
92
|
+
|
|
93
|
+
|
|
94
|
+
class TestClaude4xVersionComparison:
|
|
95
|
+
"""版本比较稳定可用——TFRobotV2 门控的基石"""
|
|
96
|
+
|
|
97
|
+
def test_monotonic_opus_chain(self):
|
|
98
|
+
assert LLMeta("claude-opus-4-5") < LLMeta("claude-opus-4-6")
|
|
99
|
+
assert LLMeta("claude-opus-4-6") < LLMeta("claude-opus-4-7")
|
|
100
|
+
assert LLMeta("claude-opus-4-7") < LLMeta("claude-opus-4-8")
|
|
101
|
+
|
|
102
|
+
def test_cross_minor(self):
|
|
103
|
+
assert LLMeta("claude-opus-4-1") < LLMeta("claude-opus-4-6")
|
|
104
|
+
assert LLMeta("claude-opus-4-0") < LLMeta("claude-opus-4-5")
|
|
105
|
+
|
|
106
|
+
def test_dated_alias_equivalent_version(self):
|
|
107
|
+
"""带日期与不带日期解析出相同版本元组"""
|
|
108
|
+
assert LLMeta("claude-opus-4-5").version == LLMeta("claude-opus-4-5-20251101").version
|
|
109
|
+
|
|
110
|
+
|
|
111
|
+
class TestVersionGateMatchesPrefillTruth:
|
|
112
|
+
"""关键:纯版本门控 `parse_version(version) >= (4, 6)` 的真假必须与官方 prefill 真值表完全一致"""
|
|
113
|
+
|
|
114
|
+
@pytest.mark.parametrize("model_name", sorted(_PREFILL_REMOVED))
|
|
115
|
+
def test_no_prefill_models_are_ge_4_6(self, model_name: str):
|
|
116
|
+
meta = LLMeta(model_name)
|
|
117
|
+
assert meta.family == ModelFamily.CLAUDE
|
|
118
|
+
assert parse_version(meta.version) >= (4, 6), f"{model_name} 应被版本门控判为不支持 prefill"
|
|
119
|
+
|
|
120
|
+
@pytest.mark.parametrize("model_name", sorted(_PREFILL_SUPPORTED))
|
|
121
|
+
def test_prefill_models_are_lt_4_6(self, model_name: str):
|
|
122
|
+
meta = LLMeta(model_name)
|
|
123
|
+
assert meta.family == ModelFamily.CLAUDE
|
|
124
|
+
assert parse_version(meta.version) < (4, 6), f"{model_name} 应被版本门控判为支持 prefill"
|
|
@@ -189,6 +189,11 @@ class ModelFamilyConfig:
|
|
|
189
189
|
else:
|
|
190
190
|
type_spec = ""
|
|
191
191
|
|
|
192
|
+
# 自定义 snapshot 类型要求精确 8 位(见 patterns._convert_snapshot)
|
|
193
|
+
# Custom snapshot type requires exactly 8 digits (see patterns._convert_snapshot)
|
|
194
|
+
if type_spec == "snapshot":
|
|
195
|
+
return "20240101"
|
|
196
|
+
|
|
192
197
|
if type_spec.endswith("d"):
|
|
193
198
|
width_str = type_spec[:-1].strip()
|
|
194
199
|
width = int(width_str) if width_str.isdigit() else 1
|
|
@@ -23,14 +23,14 @@ CLAUDE = ModelFamilyConfig(
|
|
|
23
23
|
variant_default="sonnet",
|
|
24
24
|
variant_priority_default=(3,), # sonnet 的默认优先级 / default priority for sonnet
|
|
25
25
|
patterns=[
|
|
26
|
-
"claude-{variant:variant}-{major:d}-{minor:d}@{snapshot:
|
|
27
|
-
"claude-{variant:variant}-{major:d}-{minor:d}-{snapshot:
|
|
26
|
+
"claude-{variant:variant}-{major:d}-{minor:d}@{snapshot:snapshot}",
|
|
27
|
+
"claude-{variant:variant}-{major:d}-{minor:d}-{snapshot:snapshot}",
|
|
28
28
|
"claude-{variant:variant}-{major:d}-{minor:d}",
|
|
29
|
-
"claude-{variant:variant}-{major:d}-{snapshot:
|
|
29
|
+
"claude-{variant:variant}-{major:d}-{snapshot:snapshot}",
|
|
30
30
|
"claude-{variant:variant}-{major:d}",
|
|
31
|
-
"claude-{major:d}-{minor:d}-{variant:variant}-{snapshot:
|
|
31
|
+
"claude-{major:d}-{minor:d}-{variant:variant}-{snapshot:snapshot}",
|
|
32
32
|
"claude-{major:d}-{minor:d}-{variant:variant}",
|
|
33
|
-
"claude-{major:d}-{variant:variant}-{snapshot:
|
|
33
|
+
"claude-{major:d}-{variant:variant}-{snapshot:snapshot}",
|
|
34
34
|
"claude-{major:d}-{variant:variant}",
|
|
35
35
|
],
|
|
36
36
|
capabilities=ModelCapabilities(
|
|
@@ -42,6 +42,46 @@ CLAUDE = ModelFamilyConfig(
|
|
|
42
42
|
context_window=200000,
|
|
43
43
|
),
|
|
44
44
|
specific_models={
|
|
45
|
+
"claude-opus-4-8": SpecificModelConfig(
|
|
46
|
+
version_default="4.8",
|
|
47
|
+
variant_default="opus",
|
|
48
|
+
variant_priority=(5,),
|
|
49
|
+
capabilities=ModelCapabilities(
|
|
50
|
+
supports_vision=True,
|
|
51
|
+
supports_thinking=True,
|
|
52
|
+
supports_function_calling=True,
|
|
53
|
+
supports_streaming=True,
|
|
54
|
+
supports_structured_outputs=True,
|
|
55
|
+
supports_computer_use=True,
|
|
56
|
+
max_tokens=128000,
|
|
57
|
+
context_window=1000000,
|
|
58
|
+
),
|
|
59
|
+
patterns=[
|
|
60
|
+
"claude-opus-4-8-{snapshot:snapshot}",
|
|
61
|
+
"claude-opus-4-8",
|
|
62
|
+
"claude-opus-4-8@{snapshot:snapshot}",
|
|
63
|
+
],
|
|
64
|
+
),
|
|
65
|
+
"claude-opus-4-7": SpecificModelConfig(
|
|
66
|
+
version_default="4.7",
|
|
67
|
+
variant_default="opus",
|
|
68
|
+
variant_priority=(5,),
|
|
69
|
+
capabilities=ModelCapabilities(
|
|
70
|
+
supports_vision=True,
|
|
71
|
+
supports_thinking=True,
|
|
72
|
+
supports_function_calling=True,
|
|
73
|
+
supports_streaming=True,
|
|
74
|
+
supports_structured_outputs=True,
|
|
75
|
+
supports_computer_use=True,
|
|
76
|
+
max_tokens=128000,
|
|
77
|
+
context_window=1000000,
|
|
78
|
+
),
|
|
79
|
+
patterns=[
|
|
80
|
+
"claude-opus-4-7-{snapshot:snapshot}",
|
|
81
|
+
"claude-opus-4-7",
|
|
82
|
+
"claude-opus-4-7@{snapshot:snapshot}",
|
|
83
|
+
],
|
|
84
|
+
),
|
|
45
85
|
"claude-opus-4-6": SpecificModelConfig(
|
|
46
86
|
version_default="4.6",
|
|
47
87
|
variant_default="opus",
|
|
@@ -57,9 +97,9 @@ CLAUDE = ModelFamilyConfig(
|
|
|
57
97
|
context_window=1000000,
|
|
58
98
|
),
|
|
59
99
|
patterns=[
|
|
60
|
-
"claude-opus-4-6-{snapshot:
|
|
100
|
+
"claude-opus-4-6-{snapshot:snapshot}",
|
|
61
101
|
"claude-opus-4-6",
|
|
62
|
-
"claude-opus-4-6@{snapshot:
|
|
102
|
+
"claude-opus-4-6@{snapshot:snapshot}",
|
|
63
103
|
],
|
|
64
104
|
),
|
|
65
105
|
"claude-sonnet-4-6": SpecificModelConfig(
|
|
@@ -77,9 +117,9 @@ CLAUDE = ModelFamilyConfig(
|
|
|
77
117
|
context_window=1000000,
|
|
78
118
|
),
|
|
79
119
|
patterns=[
|
|
80
|
-
"claude-sonnet-4-6-{snapshot:
|
|
120
|
+
"claude-sonnet-4-6-{snapshot:snapshot}",
|
|
81
121
|
"claude-sonnet-4-6",
|
|
82
|
-
"claude-sonnet-4-6@{snapshot:
|
|
122
|
+
"claude-sonnet-4-6@{snapshot:snapshot}",
|
|
83
123
|
],
|
|
84
124
|
),
|
|
85
125
|
"claude-sonnet-4-5": SpecificModelConfig(
|
|
@@ -97,7 +137,11 @@ CLAUDE = ModelFamilyConfig(
|
|
|
97
137
|
max_tokens=64000,
|
|
98
138
|
context_window=200000,
|
|
99
139
|
),
|
|
100
|
-
patterns=[
|
|
140
|
+
patterns=[
|
|
141
|
+
"claude-sonnet-4-5-{snapshot:snapshot}",
|
|
142
|
+
"claude-sonnet-4-5",
|
|
143
|
+
"claude-sonnet-4-5@{snapshot:snapshot}",
|
|
144
|
+
],
|
|
101
145
|
),
|
|
102
146
|
"claude-haiku-4-5": SpecificModelConfig(
|
|
103
147
|
version_default="4.5",
|
|
@@ -114,7 +158,32 @@ CLAUDE = ModelFamilyConfig(
|
|
|
114
158
|
max_tokens=64000,
|
|
115
159
|
context_window=200000,
|
|
116
160
|
),
|
|
117
|
-
patterns=[
|
|
161
|
+
patterns=[
|
|
162
|
+
"claude-haiku-4-5-{snapshot:snapshot}",
|
|
163
|
+
"claude-haiku-4-5",
|
|
164
|
+
"claude-haiku-4-5@{snapshot:snapshot}",
|
|
165
|
+
],
|
|
166
|
+
),
|
|
167
|
+
"claude-opus-4-5": SpecificModelConfig(
|
|
168
|
+
version_default="4.5",
|
|
169
|
+
variant_default="opus",
|
|
170
|
+
variant_priority=(5,),
|
|
171
|
+
capabilities=ModelCapabilities(
|
|
172
|
+
supports_vision=True,
|
|
173
|
+
supports_pdf=True,
|
|
174
|
+
supports_thinking=True,
|
|
175
|
+
supports_function_calling=True,
|
|
176
|
+
supports_streaming=True,
|
|
177
|
+
supports_structured_outputs=True,
|
|
178
|
+
supports_computer_use=True,
|
|
179
|
+
max_tokens=64000,
|
|
180
|
+
context_window=200000,
|
|
181
|
+
),
|
|
182
|
+
patterns=[
|
|
183
|
+
"claude-opus-4-5-{snapshot:snapshot}",
|
|
184
|
+
"claude-opus-4-5",
|
|
185
|
+
"claude-opus-4-5@{snapshot:snapshot}",
|
|
186
|
+
],
|
|
118
187
|
),
|
|
119
188
|
"claude-opus-4-1": SpecificModelConfig(
|
|
120
189
|
version_default="4.1",
|
|
@@ -131,7 +200,7 @@ CLAUDE = ModelFamilyConfig(
|
|
|
131
200
|
max_tokens=32000,
|
|
132
201
|
context_window=200000,
|
|
133
202
|
),
|
|
134
|
-
patterns=["claude-opus-4-1-{snapshot:
|
|
203
|
+
patterns=["claude-opus-4-1-{snapshot:snapshot}", "claude-opus-4-1", "claude-opus-4-1@{snapshot:snapshot}"],
|
|
135
204
|
),
|
|
136
205
|
"claude-sonnet-4-0": SpecificModelConfig(
|
|
137
206
|
version_default="4.0",
|
|
@@ -148,7 +217,11 @@ CLAUDE = ModelFamilyConfig(
|
|
|
148
217
|
max_tokens=64000,
|
|
149
218
|
context_window=200000,
|
|
150
219
|
),
|
|
151
|
-
patterns=[
|
|
220
|
+
patterns=[
|
|
221
|
+
"claude-sonnet-4-{snapshot:snapshot}",
|
|
222
|
+
"claude-sonnet-4-0",
|
|
223
|
+
"claude-sonnet-4-0@{snapshot:snapshot}",
|
|
224
|
+
],
|
|
152
225
|
),
|
|
153
226
|
"claude-3-7-sonnet": SpecificModelConfig(
|
|
154
227
|
version_default="3.7",
|
|
@@ -165,7 +238,7 @@ CLAUDE = ModelFamilyConfig(
|
|
|
165
238
|
max_tokens=64000,
|
|
166
239
|
context_window=200000,
|
|
167
240
|
),
|
|
168
|
-
patterns=["claude-3-7-sonnet-{snapshot:
|
|
241
|
+
patterns=["claude-3-7-sonnet-{snapshot:snapshot}", "claude-3-7-sonnet-latest", "claude-3-7-sonnet"],
|
|
169
242
|
),
|
|
170
243
|
"claude-opus-4-0": SpecificModelConfig(
|
|
171
244
|
version_default="4.0",
|
|
@@ -182,7 +255,7 @@ CLAUDE = ModelFamilyConfig(
|
|
|
182
255
|
max_tokens=32000,
|
|
183
256
|
context_window=200000,
|
|
184
257
|
),
|
|
185
|
-
patterns=["claude-opus-4-{snapshot:
|
|
258
|
+
patterns=["claude-opus-4-{snapshot:snapshot}", "claude-opus-4-0", "claude-opus-4-0@{snapshot:snapshot}"],
|
|
186
259
|
),
|
|
187
260
|
"claude-3-5-haiku": SpecificModelConfig(
|
|
188
261
|
version_default="3.5",
|
|
@@ -198,7 +271,7 @@ CLAUDE = ModelFamilyConfig(
|
|
|
198
271
|
max_tokens=8000,
|
|
199
272
|
context_window=200000,
|
|
200
273
|
),
|
|
201
|
-
patterns=["claude-3-5-haiku-{snapshot:
|
|
274
|
+
patterns=["claude-3-5-haiku-{snapshot:snapshot}", "claude-3-5-haiku-latest", "claude-3-5-haiku"],
|
|
202
275
|
),
|
|
203
276
|
"claude-3-haiku": SpecificModelConfig(
|
|
204
277
|
version_default="3.0",
|
|
@@ -213,7 +286,7 @@ CLAUDE = ModelFamilyConfig(
|
|
|
213
286
|
max_tokens=4096,
|
|
214
287
|
context_window=200000,
|
|
215
288
|
),
|
|
216
|
-
patterns=["claude-3-haiku-{snapshot:
|
|
289
|
+
patterns=["claude-3-haiku-{snapshot:snapshot}"],
|
|
217
290
|
),
|
|
218
291
|
},
|
|
219
292
|
)
|