whosellm 0.2.1__tar.gz → 0.2.3__tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (116) hide show
  1. {whosellm-0.2.1 → whosellm-0.2.3}/.bumpversion.toml +1 -1
  2. whosellm-0.2.3/.claude/settings.json +5 -0
  3. {whosellm-0.2.1 → whosellm-0.2.3}/CHANGELOG.md +21 -0
  4. {whosellm-0.2.1 → whosellm-0.2.3}/PKG-INFO +1 -1
  5. {whosellm-0.2.1 → whosellm-0.2.3}/pyproject.toml +1 -1
  6. {whosellm-0.2.1 → whosellm-0.2.3}/tests/models/families/test_deepseek.py +76 -20
  7. {whosellm-0.2.1 → whosellm-0.2.3}/tests/models/families/test_deepseek_tencent.py +23 -1
  8. {whosellm-0.2.1 → whosellm-0.2.3}/tests/models/families/test_gpt5.py +0 -3
  9. {whosellm-0.2.1 → whosellm-0.2.3}/tests/test_auto_register.py +2 -1
  10. whosellm-0.2.3/tests/test_claude_4x_versions.py +124 -0
  11. {whosellm-0.2.1 → whosellm-0.2.3}/uv.lock +1 -1
  12. {whosellm-0.2.1 → whosellm-0.2.3}/whosellm/__init__.py +1 -1
  13. {whosellm-0.2.1 → whosellm-0.2.3}/whosellm/models/config.py +5 -0
  14. {whosellm-0.2.1 → whosellm-0.2.3}/whosellm/models/families/anthropic.py +90 -17
  15. whosellm-0.2.3/whosellm/models/families/deepseek/deepseek_official.py +117 -0
  16. {whosellm-0.2.1 → whosellm-0.2.3}/whosellm/models/families/deepseek/tencent.py +22 -2
  17. {whosellm-0.2.1 → whosellm-0.2.3}/whosellm/models/families/openai/openai_gpt_4_1.py +0 -1
  18. {whosellm-0.2.1 → whosellm-0.2.3}/whosellm/models/families/openai/openai_gpt_5.py +0 -4
  19. {whosellm-0.2.1 → whosellm-0.2.3}/whosellm/models/families/openai/openai_gpt_5_1.py +0 -1
  20. {whosellm-0.2.1 → whosellm-0.2.3}/whosellm/models/families/openai/openai_gpt_5_2.py +0 -2
  21. {whosellm-0.2.1 → whosellm-0.2.3}/whosellm/models/families/openai/openai_gpt_5_4.py +0 -4
  22. {whosellm-0.2.1 → whosellm-0.2.3}/whosellm/models/families/zhipu.py +0 -5
  23. {whosellm-0.2.1 → whosellm-0.2.3}/whosellm/models/patterns.py +14 -1
  24. whosellm-0.2.1/whosellm/models/families/deepseek/deepseek_official.py +0 -72
  25. {whosellm-0.2.1 → whosellm-0.2.3}/.claude/commands/interview.md +0 -0
  26. {whosellm-0.2.1 → whosellm-0.2.3}/.claude/projects/-Users-jqq-PycharmProjects-llmeta/memory/MEMORY.md +0 -0
  27. {whosellm-0.2.1 → whosellm-0.2.3}/.claude/projects/-Users-jqq-PycharmProjects-llmeta/memory/feedback_use_uv.md +0 -0
  28. {whosellm-0.2.1 → whosellm-0.2.3}/.claude/skills/code-review/SKILL.md +0 -0
  29. {whosellm-0.2.1 → whosellm-0.2.3}/.claude/skills/create-skill/SKILL.md +0 -0
  30. {whosellm-0.2.1 → whosellm-0.2.3}/.claude/skills/e2e-metadata/SKILL.md +0 -0
  31. {whosellm-0.2.1 → whosellm-0.2.3}/.claude/skills/evolve/SKILL.md +0 -0
  32. {whosellm-0.2.1 → whosellm-0.2.3}/.claude/skills/fix-review/SKILL.md +0 -0
  33. {whosellm-0.2.1 → whosellm-0.2.3}/.claude/skills/release/SKILL.md +0 -0
  34. {whosellm-0.2.1 → whosellm-0.2.3}/.claude/skills/review-provider-model/SKILL.md +0 -0
  35. {whosellm-0.2.1 → whosellm-0.2.3}/.claude/skills/review-provider-model/providers/alibaba.md +0 -0
  36. {whosellm-0.2.1 → whosellm-0.2.3}/.claude/skills/review-provider-model/providers/anthropic.md +0 -0
  37. {whosellm-0.2.1 → whosellm-0.2.3}/.claude/skills/review-provider-model/providers/deepseek.md +0 -0
  38. {whosellm-0.2.1 → whosellm-0.2.3}/.claude/skills/review-provider-model/providers/gemini.md +0 -0
  39. {whosellm-0.2.1 → whosellm-0.2.3}/.claude/skills/review-provider-model/providers/openai.md +0 -0
  40. {whosellm-0.2.1 → whosellm-0.2.3}/.claude/skills/review-provider-model/providers/others.md +0 -0
  41. {whosellm-0.2.1 → whosellm-0.2.3}/.claude/skills/review-provider-model/providers/vidu.md +0 -0
  42. {whosellm-0.2.1 → whosellm-0.2.3}/.claude/skills/review-provider-model/providers/zhipu.md +0 -0
  43. {whosellm-0.2.1 → whosellm-0.2.3}/.claude/skills/update-provider-model/SKILL.md +0 -0
  44. {whosellm-0.2.1 → whosellm-0.2.3}/.claude/skills/update-provider-model/testing.md +0 -0
  45. {whosellm-0.2.1 → whosellm-0.2.3}/.coveragerc +0 -0
  46. {whosellm-0.2.1 → whosellm-0.2.3}/.github/workflows/publish.yml +0 -0
  47. {whosellm-0.2.1 → whosellm-0.2.3}/.github/workflows/tests.yml +0 -0
  48. {whosellm-0.2.1 → whosellm-0.2.3}/.gitignore +0 -0
  49. {whosellm-0.2.1 → whosellm-0.2.3}/.windsurf/workflows/addmodel.md +0 -0
  50. {whosellm-0.2.1 → whosellm-0.2.3}/.windsurf/workflows/arch.md +0 -0
  51. {whosellm-0.2.1 → whosellm-0.2.3}/.windsurf/workflows/testllmeta.md +0 -0
  52. {whosellm-0.2.1 → whosellm-0.2.3}/CLAUDE.md +0 -0
  53. {whosellm-0.2.1 → whosellm-0.2.3}/LICENSE +0 -0
  54. {whosellm-0.2.1 → whosellm-0.2.3}/README.md +0 -0
  55. {whosellm-0.2.1 → whosellm-0.2.3}/docs/add_new_model_family.md +0 -0
  56. {whosellm-0.2.1 → whosellm-0.2.3}/docs/refactor_proposal.md +0 -0
  57. {whosellm-0.2.1 → whosellm-0.2.3}/docs/spec_model_family_redesign.md +0 -0
  58. {whosellm-0.2.1 → whosellm-0.2.3}/examples/advanced_usage.py +0 -0
  59. {whosellm-0.2.1 → whosellm-0.2.3}/examples/basic_usage.py +0 -0
  60. {whosellm-0.2.1 → whosellm-0.2.3}/mypy.ini +0 -0
  61. {whosellm-0.2.1 → whosellm-0.2.3}/pytest.ini +0 -0
  62. {whosellm-0.2.1 → whosellm-0.2.3}/ruff.toml +0 -0
  63. {whosellm-0.2.1 → whosellm-0.2.3}/tests/__init__.py +0 -0
  64. {whosellm-0.2.1 → whosellm-0.2.3}/tests/e2e/__init__.py +0 -0
  65. {whosellm-0.2.1 → whosellm-0.2.3}/tests/e2e/conftest.py +0 -0
  66. {whosellm-0.2.1 → whosellm-0.2.3}/tests/e2e/test_anthropic.py +0 -0
  67. {whosellm-0.2.1 → whosellm-0.2.3}/tests/e2e/test_google.py +0 -0
  68. {whosellm-0.2.1 → whosellm-0.2.3}/tests/e2e/test_openai.py +0 -0
  69. {whosellm-0.2.1 → whosellm-0.2.3}/tests/e2e/test_zhipu.py +0 -0
  70. {whosellm-0.2.1 → whosellm-0.2.3}/tests/models/__init__.py +0 -0
  71. {whosellm-0.2.1 → whosellm-0.2.3}/tests/models/families/__init__.py +0 -0
  72. {whosellm-0.2.1 → whosellm-0.2.3}/tests/models/families/test_anthropic.py +0 -0
  73. {whosellm-0.2.1 → whosellm-0.2.3}/tests/models/families/test_gemini.py +0 -0
  74. {whosellm-0.2.1 → whosellm-0.2.3}/tests/models/families/test_glm45.py +0 -0
  75. {whosellm-0.2.1 → whosellm-0.2.3}/tests/models/families/test_glm45v.py +0 -0
  76. {whosellm-0.2.1 → whosellm-0.2.3}/tests/models/families/test_glm46.py +0 -0
  77. {whosellm-0.2.1 → whosellm-0.2.3}/tests/models/families/test_glm46v.py +0 -0
  78. {whosellm-0.2.1 → whosellm-0.2.3}/tests/models/families/test_glm5.py +0 -0
  79. {whosellm-0.2.1 → whosellm-0.2.3}/tests/models/families/test_gpt3_5.py +0 -0
  80. {whosellm-0.2.1 → whosellm-0.2.3}/tests/models/families/test_gpt4_1.py +0 -0
  81. {whosellm-0.2.1 → whosellm-0.2.3}/tests/models/families/test_gpt4o.py +0 -0
  82. {whosellm-0.2.1 → whosellm-0.2.3}/tests/models/families/test_o1.py +0 -0
  83. {whosellm-0.2.1 → whosellm-0.2.3}/tests/models/families/test_o3.py +0 -0
  84. {whosellm-0.2.1 → whosellm-0.2.3}/tests/models/families/test_o4.py +0 -0
  85. {whosellm-0.2.1 → whosellm-0.2.3}/tests/models/families/test_qwen.py +0 -0
  86. {whosellm-0.2.1 → whosellm-0.2.3}/tests/models/families/test_qwen3_vl_models.py +0 -0
  87. {whosellm-0.2.1 → whosellm-0.2.3}/tests/models/families/test_qwen_ollama.py +0 -0
  88. {whosellm-0.2.1 → whosellm-0.2.3}/tests/models/families/test_qwen_plus.py +0 -0
  89. {whosellm-0.2.1 → whosellm-0.2.3}/tests/test_llmeta.py +0 -0
  90. {whosellm-0.2.1 → whosellm-0.2.3}/tests/test_model_version.py +0 -0
  91. {whosellm-0.2.1 → whosellm-0.2.3}/tests/test_provider.py +0 -0
  92. {whosellm-0.2.1 → whosellm-0.2.3}/tests/test_registry_merge.py +0 -0
  93. {whosellm-0.2.1 → whosellm-0.2.3}/tests/test_specific_patterns.py +0 -0
  94. {whosellm-0.2.1 → whosellm-0.2.3}/tests/test_variant_priority_config.py +0 -0
  95. {whosellm-0.2.1 → whosellm-0.2.3}/whosellm/capabilities.py +0 -0
  96. {whosellm-0.2.1 → whosellm-0.2.3}/whosellm/model_version.py +0 -0
  97. {whosellm-0.2.1 → whosellm-0.2.3}/whosellm/models/__init__.py +0 -0
  98. {whosellm-0.2.1 → whosellm-0.2.3}/whosellm/models/base.py +0 -0
  99. {whosellm-0.2.1 → whosellm-0.2.3}/whosellm/models/dynamic_enum.py +0 -0
  100. {whosellm-0.2.1 → whosellm-0.2.3}/whosellm/models/families/__init__.py +0 -0
  101. {whosellm-0.2.1 → whosellm-0.2.3}/whosellm/models/families/alibaba.py +0 -0
  102. {whosellm-0.2.1 → whosellm-0.2.3}/whosellm/models/families/deepseek/__init__.py +0 -0
  103. {whosellm-0.2.1 → whosellm-0.2.3}/whosellm/models/families/gemini.py +0 -0
  104. {whosellm-0.2.1 → whosellm-0.2.3}/whosellm/models/families/openai/__init__.py +0 -0
  105. {whosellm-0.2.1 → whosellm-0.2.3}/whosellm/models/families/openai/openai_gpt_3_5.py +0 -0
  106. {whosellm-0.2.1 → whosellm-0.2.3}/whosellm/models/families/openai/openai_gpt_4.py +0 -0
  107. {whosellm-0.2.1 → whosellm-0.2.3}/whosellm/models/families/openai/openai_gpt_4o.py +0 -0
  108. {whosellm-0.2.1 → whosellm-0.2.3}/whosellm/models/families/openai/openai_gpt_5_3.py +0 -0
  109. {whosellm-0.2.1 → whosellm-0.2.3}/whosellm/models/families/openai/openai_o1.py +0 -0
  110. {whosellm-0.2.1 → whosellm-0.2.3}/whosellm/models/families/openai/openai_o3.py +0 -0
  111. {whosellm-0.2.1 → whosellm-0.2.3}/whosellm/models/families/openai/openai_o4.py +0 -0
  112. {whosellm-0.2.1 → whosellm-0.2.3}/whosellm/models/families/others.py +0 -0
  113. {whosellm-0.2.1 → whosellm-0.2.3}/whosellm/models/families/vidu.py +0 -0
  114. {whosellm-0.2.1 → whosellm-0.2.3}/whosellm/models/registry.py +0 -0
  115. {whosellm-0.2.1 → whosellm-0.2.3}/whosellm/provider.py +0 -0
  116. {whosellm-0.2.1 → whosellm-0.2.3}/whosellm/py.typed +0 -0
@@ -2,7 +2,7 @@
2
2
  # 文档 / Documentation: https://callowayproject.github.io/bump-my-version/
3
3
 
4
4
  [tool.bumpversion]
5
- current_version = "0.2.1"
5
+ current_version = "0.2.3"
6
6
  parse = """(?x)
7
7
  (?P<major>0|[1-9]\\d*)\\.
8
8
  (?P<minor>0|[1-9]\\d*)\\.
@@ -0,0 +1,5 @@
1
+ {
2
+ "enabledPlugins": {
3
+ "turingfocus-toolkit@turingfocus-skills": true
4
+ }
5
+ }
@@ -2,6 +2,27 @@
2
2
 
3
3
  All notable changes to this project will be documented in this file.
4
4
 
5
+ ## [0.2.3] - Unreleased
6
+
7
+ ### Added
8
+ - 新增 Claude Opus 4.x 模型配置(官方规格核实):`claude-opus-4-8`、`claude-opus-4-7`(1M 上下文,128K 最大输出,结构化输出 + computer use)、`claude-opus-4-5`(200K 上下文,64K 最大输出)
9
+
10
+ ### Fixed
11
+ - 修复 Claude 4.x 别名版本解析回退 bug:`claude-opus-4-5` / `4-7` / `4-8` 等**无日期别名**此前被 `claude-opus-4-{snapshot:8d}` 模式的"最大宽度"语义把单个数字 minor 误吞为 snapshot,导致版本回退为 `4.0`。改用精确 8 位的 `{snapshot:snapshot}` 自定义类型(`patterns._convert_snapshot`)后,单字段 snapshot 不再吞掉 minor,现存与未来未注册别名均能解析出正确版本(如 `4.8`),版本比较稳定可用
12
+
13
+ ## [0.2.2] - 2026-04-24
14
+
15
+ ### Added
16
+ - DeepSeek V4 系列模型支持:`deepseek-v4-flash`、`deepseek-v4-pro`(1M 上下文,384K 最大输出,支持思考/非思考双模式)
17
+ - DeepSeek 官方 Provider 支持版本号命名模式(`deepseek-v{major}.{minor}-{variant}` 等),V4 起可通过版本号直接调用
18
+ - 腾讯云 DeepSeek-V3.2(GA 版,685B MoE,稀疏注意力)
19
+
20
+ ### Changed
21
+ - `deepseek-chat` / `deepseek-reasoner` 能力基线升级为 V4-flash 非思考/思考模式别名(1M 上下文,384K 输出)
22
+
23
+ ### Fixed
24
+ - 腾讯云 `deepseek-r1-0528` 的 `supports_function_calling` 修正为 `False`(官方文档明确列为不支持)
25
+
5
26
  ## [Unreleased]
6
27
 
7
28
  ### Added
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.4
2
2
  Name: whosellm
3
- Version: 0.2.1
3
+ Version: 0.2.3
4
4
  Summary: A unified LLM model version and capability management library
5
5
  Author-email: JQQ <jqq1716@gmail.com>
6
6
  License: MIT
@@ -1,6 +1,6 @@
1
1
  [project]
2
2
  name = "whosellm"
3
- version = "0.2.1"
3
+ version = "0.2.3"
4
4
  description = "A unified LLM model version and capability management library"
5
5
  authors = [
6
6
  {name = "JQQ", email = "jqq1716@gmail.com"}
@@ -11,7 +11,7 @@ from whosellm.provider import Provider
11
11
 
12
12
 
13
13
  def test_deepseek_default_capabilities() -> None:
14
- """验证 DeepSeek 官方家族默认能力 / Validate DeepSeek official family default capabilities"""
14
+ """验证 DeepSeek 官方家族默认能力(V4 基线) / Validate DeepSeek official family default capabilities (V4 baseline)"""
15
15
  from whosellm import LLMeta
16
16
 
17
17
  # 使用官方 Provider 前缀确保获取官方配置
@@ -20,8 +20,10 @@ def test_deepseek_default_capabilities() -> None:
20
20
 
21
21
  assert capabilities.supports_streaming is True
22
22
  assert capabilities.supports_function_calling is True
23
- assert capabilities.max_tokens == 8000
24
- assert capabilities.context_window == 128000
23
+ # V4 系列:1M 上下文,384K 最大输出
24
+ assert capabilities.max_tokens == 384_000
25
+ assert capabilities.context_window == 1_000_000
26
+ # deepseek-chat 是 v4-flash 非思考模式的别名
25
27
  assert capabilities.supports_thinking is False
26
28
 
27
29
 
@@ -31,13 +33,13 @@ def test_deepseek_chat_specific_model() -> None:
31
33
 
32
34
  assert config is not None
33
35
  version, variant, capabilities = config
34
- assert version == "1.0"
36
+ assert version == "4.0"
35
37
  assert variant == "chat"
36
38
  assert capabilities is not None
37
39
  assert capabilities.supports_function_calling is True
38
40
  assert capabilities.supports_streaming is True
39
- assert capabilities.max_tokens == 8000
40
- assert capabilities.context_window == 128000
41
+ assert capabilities.max_tokens == 384_000
42
+ assert capabilities.context_window == 1_000_000
41
43
 
42
44
 
43
45
  def test_deepseek_chat_pattern_matching() -> None:
@@ -50,7 +52,7 @@ def test_deepseek_chat_pattern_matching() -> None:
50
52
 
51
53
  assert model.family == ModelFamily.DEEPSEEK
52
54
  assert model.variant == "chat"
53
- assert model.version == "1.0"
55
+ assert model.version == "4.0"
54
56
  assert model.provider == Provider.DEEPSEEK
55
57
 
56
58
 
@@ -60,10 +62,12 @@ def test_deepseek_reasoner_specific_model() -> None:
60
62
 
61
63
  assert config is not None
62
64
  version, variant, capabilities = config
63
- assert version == "1.0"
65
+ assert version == "4.0"
64
66
  assert variant == "reasoner"
65
67
  assert capabilities is not None
66
68
  assert capabilities.supports_thinking is True
69
+ assert capabilities.max_tokens == 384_000
70
+ assert capabilities.context_window == 1_000_000
67
71
 
68
72
 
69
73
  def test_deepseek_base_pattern_without_variant() -> None:
@@ -71,17 +75,16 @@ def test_deepseek_base_pattern_without_variant() -> None:
71
75
  from whosellm import LLMeta
72
76
 
73
77
  # 使用 Provider 前缀确保匹配官方配置
74
- # DeepSeek 官方只支持 chat 和 reasoner,默认使用 chat
75
78
  model = LLMeta("deepseek::deepseek-chat")
76
79
 
77
80
  assert model.family == ModelFamily.DEEPSEEK
78
81
  assert model.variant == "chat"
79
- assert model.version == "1.0"
82
+ assert model.version == "4.0"
80
83
  assert model.capabilities.supports_function_calling is True
81
84
 
82
85
 
83
86
  def test_deepseek_reasoner_does_not_use_chat_capabilities() -> None:
84
- """验证 reasoner 不会意外继承 chat 的函数调用能力 / Ensure reasoner capabilities override family defaults"""
87
+ """验证 reasoner 不会意外继承 chat 的能力 / Ensure reasoner capabilities override family defaults"""
85
88
  from whosellm import LLMeta
86
89
 
87
90
  model = LLMeta("deepseek::deepseek-reasoner")
@@ -95,7 +98,7 @@ def test_deepseek_no_structured_outputs() -> None:
95
98
  """验证 DeepSeek 官方模型不支持 structured_outputs(仅支持 json_object)"""
96
99
  from whosellm import LLMeta
97
100
 
98
- for model_id in ["deepseek-chat", "deepseek-reasoner"]:
101
+ for model_id in ["deepseek-chat", "deepseek-reasoner", "deepseek-v4-flash", "deepseek-v4-pro"]:
99
102
  model = LLMeta(f"deepseek::{model_id}")
100
103
  assert model.capabilities.supports_structured_outputs is False, (
101
104
  f"{model_id}: DeepSeek API 仅支持 response_format={{type:'json_object'}},"
@@ -106,15 +109,68 @@ def test_deepseek_no_structured_outputs() -> None:
106
109
  )
107
110
 
108
111
 
109
- def test_deepseek_official_invalid_model_names() -> None:
110
- """验证 DeepSeek 官方不支持的模型名称会被识别为 UNKNOWN / Validate unsupported official model names are recognized as UNKNOWN"""
112
+ def test_deepseek_v4_flash_specific_model() -> None:
113
+ """验证 deepseek-v4-flash 特定模型配置 / Validate deepseek-v4-flash specific configuration"""
111
114
  from whosellm import LLMeta
112
115
 
113
- # DeepSeek 官方不提供 deepseek-v3.2-exp 这样的命名方式
114
- # 官方只支持 deepseek-chat-{suffix} 和 deepseek-reasoner-{suffix}
115
- model = LLMeta("deepseek::deepseek-v3.2-exp")
116
+ model = LLMeta("deepseek::deepseek-v4-flash")
116
117
 
117
- # 当使用 Provider 前缀时,Provider 会被保留,但 family 会是 UNKNOWN
118
- assert model.family == ModelFamily.UNKNOWN
118
+ assert model.family == ModelFamily.DEEPSEEK
119
+ assert model.provider == Provider.DEEPSEEK
120
+ assert model.version == "4.0"
121
+ assert model.variant == "flash"
122
+
123
+ caps = model.capabilities
124
+ assert caps.supports_thinking is True
125
+ assert caps.supports_function_calling is True
126
+ assert caps.supports_streaming is True
127
+ assert caps.supports_json_outputs is True
128
+ assert caps.supports_structured_outputs is False
129
+ assert caps.max_tokens == 384_000
130
+ assert caps.context_window == 1_000_000
131
+
132
+
133
+ def test_deepseek_v4_pro_specific_model() -> None:
134
+ """验证 deepseek-v4-pro 特定模型配置 / Validate deepseek-v4-pro specific configuration"""
135
+ from whosellm import LLMeta
136
+
137
+ model = LLMeta("deepseek::deepseek-v4-pro")
138
+
139
+ assert model.family == ModelFamily.DEEPSEEK
140
+ assert model.provider == Provider.DEEPSEEK
141
+ assert model.version == "4.0"
142
+ assert model.variant == "pro"
143
+
144
+ caps = model.capabilities
145
+ assert caps.supports_thinking is True
146
+ assert caps.supports_function_calling is True
147
+ assert caps.max_tokens == 384_000
148
+ assert caps.context_window == 1_000_000
149
+
150
+
151
+ def test_deepseek_v4_variant_ordering() -> None:
152
+ """验证 v4-flash < v4-pro 的排序关系 / Validate v4-flash < v4-pro ordering"""
153
+ from whosellm import LLMeta
154
+
155
+ flash = LLMeta("deepseek::deepseek-v4-flash")
156
+ pro = LLMeta("deepseek::deepseek-v4-pro")
157
+
158
+ assert flash < pro
159
+
160
+
161
+ def test_deepseek_versioned_pattern_matches_official_family() -> None:
162
+ """验证带版本号的 DS 模型名能被官方 family 识别 / Validate versioned DS names match the official family"""
163
+ from whosellm import LLMeta
164
+
165
+ # V4 是 DS 官方首次开放版本号命名的系列
166
+ model = LLMeta("deepseek::deepseek-v4-flash")
167
+ assert model.family == ModelFamily.DEEPSEEK
119
168
  assert model.provider == Provider.DEEPSEEK
120
- assert model.variant == "" # 无法匹配到任何 variant
169
+ assert model.version == "4.0"
170
+
171
+ # 带小数版本号也能匹配 family(即使当前没有 specific_model 条目)
172
+ model_v32 = LLMeta("deepseek::deepseek-v3.2-exp")
173
+ assert model_v32.family == ModelFamily.DEEPSEEK
174
+ assert model_v32.provider == Provider.DEEPSEEK
175
+ assert model_v32.version == "3.2"
176
+ assert model_v32.variant == "exp"
@@ -66,6 +66,8 @@ def test_tencent_deepseek_r1_0528() -> None:
66
66
  assert capabilities is not None
67
67
  assert capabilities.supports_thinking is True
68
68
  assert capabilities.context_window == 128000
69
+ # 腾讯云 LKE 官方文档明确列为不支持 Function Calling
70
+ assert capabilities.supports_function_calling is False
69
71
 
70
72
 
71
73
  def test_tencent_deepseek_v3_1() -> None:
@@ -109,6 +111,22 @@ def test_tencent_deepseek_v3_2_exp() -> None:
109
111
  assert capabilities.context_window == 128000
110
112
 
111
113
 
114
+ def test_tencent_deepseek_v3_2() -> None:
115
+ """测试腾讯云 DeepSeek-V3.2(GA) / Test Tencent DeepSeek-V3.2 (GA)"""
116
+ config = get_specific_model_config("deepseek-v3.2")
117
+
118
+ assert config is not None
119
+ version, variant, capabilities = config
120
+ assert version == "v3.2"
121
+ assert variant == "v3.2"
122
+ assert capabilities is not None
123
+ assert capabilities.supports_thinking is True
124
+ assert capabilities.supports_function_calling is True
125
+ assert capabilities.supports_streaming is True
126
+ assert capabilities.max_tokens == 32000
127
+ assert capabilities.context_window == 128000
128
+
129
+
112
130
  def test_tencent_deepseek_pattern_matching() -> None:
113
131
  """测试腾讯云 DeepSeek 模式匹配 / Test Tencent DeepSeek pattern matching"""
114
132
  # 测试 V3 系列
@@ -158,8 +176,12 @@ def test_tencent_deepseek_no_collision_with_official() -> None:
158
176
  assert tencent_v3.variant == "base"
159
177
 
160
178
  # 不同的能力配置
161
- assert official_chat.capabilities.max_tokens == 8000
179
+ # 官方 deepseek-chat 当前指向 V4-flash 非思考模式(1M 上下文,384K 输出)
180
+ assert official_chat.capabilities.max_tokens == 384_000
181
+ assert official_chat.capabilities.context_window == 1_000_000
182
+ # 腾讯云保持其自有的 DeepSeek 部署规格
162
183
  assert tencent_v3.capabilities.max_tokens == 16000
184
+ assert tencent_v3.capabilities.context_window == 64000
163
185
 
164
186
 
165
187
  def test_tencent_deepseek_invalid_model_names() -> None:
@@ -193,7 +193,6 @@ def test_gpt5_4_model():
193
193
  assert m.capabilities.supports_computer_use is True
194
194
 
195
195
 
196
-
197
196
  def test_gpt5_4_with_date_suffix():
198
197
  """测试带日期的GPT-5.4模型 / Test GPT-5.4 with date suffix"""
199
198
  m = LLMeta("gpt-5.4-2026-03-05")
@@ -239,7 +238,6 @@ def test_gpt5_4_mini_model():
239
238
  assert m.capabilities.supports_computer_use is True
240
239
 
241
240
 
242
-
243
241
  def test_gpt5_4_mini_with_date_suffix():
244
242
  """测试带日期的GPT-5.4-mini模型 / Test GPT-5.4-mini with date suffix"""
245
243
  m = LLMeta("gpt-5.4-mini-2026-03-17")
@@ -267,7 +265,6 @@ def test_gpt5_4_nano_model():
267
265
  assert m.capabilities.supports_computer_use is False
268
266
 
269
267
 
270
-
271
268
  def test_gpt5_4_nano_with_date_suffix():
272
269
  """测试带日期的GPT-5.4-nano模型 / Test GPT-5.4-nano with date suffix"""
273
270
  m = LLMeta("gpt-5.4-nano-2026-03-17")
@@ -102,7 +102,8 @@ class TestAutoRegister(unittest.TestCase):
102
102
  assert model.family == ModelFamily.DEEPSEEK
103
103
  assert model.provider == Provider.DEEPSEEK
104
104
  assert model.capabilities.supports_function_calling is True
105
- assert model.capabilities.context_window == 128000
105
+ # V4 deepseek-chat 别名为 v4-flash 非思考模式,上下文扩展为 1M
106
+ assert model.capabilities.context_window == 1_000_000
106
107
 
107
108
  def test_auto_register_qwen_variant(self) -> None:
108
109
  """测试自动注册 Qwen 新型号 / Test auto-register Qwen new variant"""
@@ -0,0 +1,124 @@
1
+ # filename: test_claude_4x_versions.py
2
+ """
3
+ 回归测试:Claude 4.x 别名版本解析 + 版本比较稳定性
4
+ Regression tests: Claude 4.x alias version parsing + version-comparison stability
5
+
6
+ 背景 / Context:
7
+ TFRobotV2 需要门控 Claude 4.6+ 移除的 assistant prefill。决定**用版本比较**判断
8
+ (`family == CLAUDE and parse_version(version) >= (4, 6)`),而非依赖能力位。
9
+ 因此 whosellm 必须保证 4.x 别名(含未注册的新别名)版本解析正确、比较稳定。
10
+
11
+ 根因:parse 的 ``{snapshot:8d}`` 是最大宽度,会把 ``claude-opus-4-5`` 的 ``5`` 当 snapshot,
12
+ 使 minor 被吞、版本回退 4.0。修复后通过精确 8 位 snapshot 自定义类型解决。
13
+ """
14
+
15
+ import pytest
16
+
17
+ from whosellm import LLMeta
18
+ from whosellm.models.base import ModelFamily, parse_version
19
+
20
+ # 官方 prefill 真值表(platform.claude.com,逐字核实):不支持 prefill 的恰为版本 >= 4.6
21
+ # Authoritative prefill truth table: models WITHOUT prefill are exactly version >= 4.6
22
+ _PREFILL_REMOVED = {
23
+ "claude-opus-4-8",
24
+ "claude-opus-4-7",
25
+ "claude-opus-4-6",
26
+ "claude-sonnet-4-6",
27
+ }
28
+ _PREFILL_SUPPORTED = {
29
+ "claude-opus-4-5",
30
+ "claude-opus-4-1",
31
+ "claude-opus-4-0",
32
+ "claude-sonnet-4-5",
33
+ "claude-sonnet-4-0",
34
+ "claude-haiku-4-5",
35
+ "claude-3-7-sonnet",
36
+ "claude-3-5-haiku",
37
+ }
38
+
39
+
40
+ class TestClaude4xAliasVersionParsing:
41
+ """未注册/新增的 Claude 4.x 别名应解析出正确版本,而非回退 family 默认 4.0"""
42
+
43
+ @pytest.mark.parametrize(
44
+ "model_name,expected_version,expected_variant",
45
+ [
46
+ ("claude-opus-4-8", "4.8", "opus"),
47
+ ("claude-opus-4-7", "4.7", "opus"),
48
+ ("claude-opus-4-6", "4.6", "opus"),
49
+ ("claude-opus-4-5", "4.5", "opus"),
50
+ ("claude-opus-4-5-20251101", "4.5", "opus"),
51
+ ("claude-haiku-4-5-20251001", "4.5", "haiku"),
52
+ ("claude-sonnet-4-6", "4.6", "sonnet"),
53
+ ("claude-sonnet-4-5", "4.5", "sonnet"),
54
+ ],
55
+ )
56
+ def test_alias_version(self, model_name: str, expected_version: str, expected_variant: str):
57
+ meta = LLMeta(model_name)
58
+ assert meta.version == expected_version, f"{model_name} 解析出错误版本 {meta.version}"
59
+ assert meta.variant == expected_variant
60
+ assert meta.family == ModelFamily.CLAUDE
61
+
62
+ def test_dated_4_0_snapshot_still_resolves_to_4_0(self):
63
+ """带 8 位日期的原始 4.0 snapshot 仍应识别为 4.0,不被精确宽度修复破坏"""
64
+ meta = LLMeta("claude-opus-4-20250514")
65
+ assert meta.version == "4.0"
66
+ assert meta.variant == "opus"
67
+
68
+ def test_short_digit_not_swallowed_as_snapshot(self):
69
+ """根因回归:单个数字 minor 不得被 {snapshot} 吞掉"""
70
+ assert LLMeta("claude-opus-4-5").version == "4.5"
71
+ assert LLMeta("claude-opus-4-7").version == "4.7"
72
+ assert LLMeta("claude-opus-4-8").version == "4.8"
73
+
74
+
75
+ class TestClaude4xCapabilities:
76
+ """新增模型应带官方真实能力(非臆测/镜像)"""
77
+
78
+ @pytest.mark.parametrize(
79
+ "model_name,ctx,max_out",
80
+ [
81
+ ("claude-opus-4-8", 1000000, 128000),
82
+ ("claude-opus-4-7", 1000000, 128000),
83
+ ("claude-opus-4-5", 200000, 64000),
84
+ ],
85
+ )
86
+ def test_new_model_specs(self, model_name: str, ctx: int, max_out: int):
87
+ caps = LLMeta(model_name).capabilities
88
+ assert caps.context_window == ctx
89
+ assert caps.max_tokens == max_out
90
+ assert caps.supports_structured_outputs is True
91
+ assert caps.supports_computer_use is True
92
+
93
+
94
+ class TestClaude4xVersionComparison:
95
+ """版本比较稳定可用——TFRobotV2 门控的基石"""
96
+
97
+ def test_monotonic_opus_chain(self):
98
+ assert LLMeta("claude-opus-4-5") < LLMeta("claude-opus-4-6")
99
+ assert LLMeta("claude-opus-4-6") < LLMeta("claude-opus-4-7")
100
+ assert LLMeta("claude-opus-4-7") < LLMeta("claude-opus-4-8")
101
+
102
+ def test_cross_minor(self):
103
+ assert LLMeta("claude-opus-4-1") < LLMeta("claude-opus-4-6")
104
+ assert LLMeta("claude-opus-4-0") < LLMeta("claude-opus-4-5")
105
+
106
+ def test_dated_alias_equivalent_version(self):
107
+ """带日期与不带日期解析出相同版本元组"""
108
+ assert LLMeta("claude-opus-4-5").version == LLMeta("claude-opus-4-5-20251101").version
109
+
110
+
111
+ class TestVersionGateMatchesPrefillTruth:
112
+ """关键:纯版本门控 `parse_version(version) >= (4, 6)` 的真假必须与官方 prefill 真值表完全一致"""
113
+
114
+ @pytest.mark.parametrize("model_name", sorted(_PREFILL_REMOVED))
115
+ def test_no_prefill_models_are_ge_4_6(self, model_name: str):
116
+ meta = LLMeta(model_name)
117
+ assert meta.family == ModelFamily.CLAUDE
118
+ assert parse_version(meta.version) >= (4, 6), f"{model_name} 应被版本门控判为不支持 prefill"
119
+
120
+ @pytest.mark.parametrize("model_name", sorted(_PREFILL_SUPPORTED))
121
+ def test_prefill_models_are_lt_4_6(self, model_name: str):
122
+ meta = LLMeta(model_name)
123
+ assert meta.family == ModelFamily.CLAUDE
124
+ assert parse_version(meta.version) < (4, 6), f"{model_name} 应被版本门控判为支持 prefill"
@@ -968,7 +968,7 @@ wheels = [
968
968
 
969
969
  [[package]]
970
970
  name = "whosellm"
971
- version = "0.2.1"
971
+ version = "0.2.3"
972
972
  source = { editable = "." }
973
973
  dependencies = [
974
974
  { name = "parse" },
@@ -7,7 +7,7 @@
7
7
  LLMeta - 统一的大语言模型版本和能力管理库 / A unified LLM model version and capability management library
8
8
  """
9
9
 
10
- __version__ = "0.2.1"
10
+ __version__ = "0.2.3"
11
11
 
12
12
  from whosellm.capabilities import ModelCapabilities
13
13
  from whosellm.model_version import LLMeta
@@ -189,6 +189,11 @@ class ModelFamilyConfig:
189
189
  else:
190
190
  type_spec = ""
191
191
 
192
+ # 自定义 snapshot 类型要求精确 8 位(见 patterns._convert_snapshot)
193
+ # Custom snapshot type requires exactly 8 digits (see patterns._convert_snapshot)
194
+ if type_spec == "snapshot":
195
+ return "20240101"
196
+
192
197
  if type_spec.endswith("d"):
193
198
  width_str = type_spec[:-1].strip()
194
199
  width = int(width_str) if width_str.isdigit() else 1
@@ -23,14 +23,14 @@ CLAUDE = ModelFamilyConfig(
23
23
  variant_default="sonnet",
24
24
  variant_priority_default=(3,), # sonnet 的默认优先级 / default priority for sonnet
25
25
  patterns=[
26
- "claude-{variant:variant}-{major:d}-{minor:d}@{snapshot:8d}",
27
- "claude-{variant:variant}-{major:d}-{minor:d}-{snapshot:8d}",
26
+ "claude-{variant:variant}-{major:d}-{minor:d}@{snapshot:snapshot}",
27
+ "claude-{variant:variant}-{major:d}-{minor:d}-{snapshot:snapshot}",
28
28
  "claude-{variant:variant}-{major:d}-{minor:d}",
29
- "claude-{variant:variant}-{major:d}-{snapshot:8d}",
29
+ "claude-{variant:variant}-{major:d}-{snapshot:snapshot}",
30
30
  "claude-{variant:variant}-{major:d}",
31
- "claude-{major:d}-{minor:d}-{variant:variant}-{snapshot:8d}",
31
+ "claude-{major:d}-{minor:d}-{variant:variant}-{snapshot:snapshot}",
32
32
  "claude-{major:d}-{minor:d}-{variant:variant}",
33
- "claude-{major:d}-{variant:variant}-{snapshot:8d}",
33
+ "claude-{major:d}-{variant:variant}-{snapshot:snapshot}",
34
34
  "claude-{major:d}-{variant:variant}",
35
35
  ],
36
36
  capabilities=ModelCapabilities(
@@ -42,6 +42,46 @@ CLAUDE = ModelFamilyConfig(
42
42
  context_window=200000,
43
43
  ),
44
44
  specific_models={
45
+ "claude-opus-4-8": SpecificModelConfig(
46
+ version_default="4.8",
47
+ variant_default="opus",
48
+ variant_priority=(5,),
49
+ capabilities=ModelCapabilities(
50
+ supports_vision=True,
51
+ supports_thinking=True,
52
+ supports_function_calling=True,
53
+ supports_streaming=True,
54
+ supports_structured_outputs=True,
55
+ supports_computer_use=True,
56
+ max_tokens=128000,
57
+ context_window=1000000,
58
+ ),
59
+ patterns=[
60
+ "claude-opus-4-8-{snapshot:snapshot}",
61
+ "claude-opus-4-8",
62
+ "claude-opus-4-8@{snapshot:snapshot}",
63
+ ],
64
+ ),
65
+ "claude-opus-4-7": SpecificModelConfig(
66
+ version_default="4.7",
67
+ variant_default="opus",
68
+ variant_priority=(5,),
69
+ capabilities=ModelCapabilities(
70
+ supports_vision=True,
71
+ supports_thinking=True,
72
+ supports_function_calling=True,
73
+ supports_streaming=True,
74
+ supports_structured_outputs=True,
75
+ supports_computer_use=True,
76
+ max_tokens=128000,
77
+ context_window=1000000,
78
+ ),
79
+ patterns=[
80
+ "claude-opus-4-7-{snapshot:snapshot}",
81
+ "claude-opus-4-7",
82
+ "claude-opus-4-7@{snapshot:snapshot}",
83
+ ],
84
+ ),
45
85
  "claude-opus-4-6": SpecificModelConfig(
46
86
  version_default="4.6",
47
87
  variant_default="opus",
@@ -57,9 +97,9 @@ CLAUDE = ModelFamilyConfig(
57
97
  context_window=1000000,
58
98
  ),
59
99
  patterns=[
60
- "claude-opus-4-6-{snapshot:8d}",
100
+ "claude-opus-4-6-{snapshot:snapshot}",
61
101
  "claude-opus-4-6",
62
- "claude-opus-4-6@{snapshot:8d}",
102
+ "claude-opus-4-6@{snapshot:snapshot}",
63
103
  ],
64
104
  ),
65
105
  "claude-sonnet-4-6": SpecificModelConfig(
@@ -77,9 +117,9 @@ CLAUDE = ModelFamilyConfig(
77
117
  context_window=1000000,
78
118
  ),
79
119
  patterns=[
80
- "claude-sonnet-4-6-{snapshot:8d}",
120
+ "claude-sonnet-4-6-{snapshot:snapshot}",
81
121
  "claude-sonnet-4-6",
82
- "claude-sonnet-4-6@{snapshot:8d}",
122
+ "claude-sonnet-4-6@{snapshot:snapshot}",
83
123
  ],
84
124
  ),
85
125
  "claude-sonnet-4-5": SpecificModelConfig(
@@ -97,7 +137,11 @@ CLAUDE = ModelFamilyConfig(
97
137
  max_tokens=64000,
98
138
  context_window=200000,
99
139
  ),
100
- patterns=["claude-sonnet-4-5-{snapshot:8d}", "claude-sonnet-4-5", "claude-sonnet-4-5@{snapshot:8d}"],
140
+ patterns=[
141
+ "claude-sonnet-4-5-{snapshot:snapshot}",
142
+ "claude-sonnet-4-5",
143
+ "claude-sonnet-4-5@{snapshot:snapshot}",
144
+ ],
101
145
  ),
102
146
  "claude-haiku-4-5": SpecificModelConfig(
103
147
  version_default="4.5",
@@ -114,7 +158,32 @@ CLAUDE = ModelFamilyConfig(
114
158
  max_tokens=64000,
115
159
  context_window=200000,
116
160
  ),
117
- patterns=["claude-haiku-4-5-{snapshot:8d}", "claude-haiku-4-5", "claude-haiku-4-5@{snapshot:8d}"],
161
+ patterns=[
162
+ "claude-haiku-4-5-{snapshot:snapshot}",
163
+ "claude-haiku-4-5",
164
+ "claude-haiku-4-5@{snapshot:snapshot}",
165
+ ],
166
+ ),
167
+ "claude-opus-4-5": SpecificModelConfig(
168
+ version_default="4.5",
169
+ variant_default="opus",
170
+ variant_priority=(5,),
171
+ capabilities=ModelCapabilities(
172
+ supports_vision=True,
173
+ supports_pdf=True,
174
+ supports_thinking=True,
175
+ supports_function_calling=True,
176
+ supports_streaming=True,
177
+ supports_structured_outputs=True,
178
+ supports_computer_use=True,
179
+ max_tokens=64000,
180
+ context_window=200000,
181
+ ),
182
+ patterns=[
183
+ "claude-opus-4-5-{snapshot:snapshot}",
184
+ "claude-opus-4-5",
185
+ "claude-opus-4-5@{snapshot:snapshot}",
186
+ ],
118
187
  ),
119
188
  "claude-opus-4-1": SpecificModelConfig(
120
189
  version_default="4.1",
@@ -131,7 +200,7 @@ CLAUDE = ModelFamilyConfig(
131
200
  max_tokens=32000,
132
201
  context_window=200000,
133
202
  ),
134
- patterns=["claude-opus-4-1-{snapshot:8d}", "claude-opus-4-1", "claude-opus-4-1@{snapshot:8d}"],
203
+ patterns=["claude-opus-4-1-{snapshot:snapshot}", "claude-opus-4-1", "claude-opus-4-1@{snapshot:snapshot}"],
135
204
  ),
136
205
  "claude-sonnet-4-0": SpecificModelConfig(
137
206
  version_default="4.0",
@@ -148,7 +217,11 @@ CLAUDE = ModelFamilyConfig(
148
217
  max_tokens=64000,
149
218
  context_window=200000,
150
219
  ),
151
- patterns=["claude-sonnet-4-{snapshot:8d}", "claude-sonnet-4-0", "claude-sonnet-4-0@{snapshot:8d}"],
220
+ patterns=[
221
+ "claude-sonnet-4-{snapshot:snapshot}",
222
+ "claude-sonnet-4-0",
223
+ "claude-sonnet-4-0@{snapshot:snapshot}",
224
+ ],
152
225
  ),
153
226
  "claude-3-7-sonnet": SpecificModelConfig(
154
227
  version_default="3.7",
@@ -165,7 +238,7 @@ CLAUDE = ModelFamilyConfig(
165
238
  max_tokens=64000,
166
239
  context_window=200000,
167
240
  ),
168
- patterns=["claude-3-7-sonnet-{snapshot:8d}", "claude-3-7-sonnet-latest", "claude-3-7-sonnet"],
241
+ patterns=["claude-3-7-sonnet-{snapshot:snapshot}", "claude-3-7-sonnet-latest", "claude-3-7-sonnet"],
169
242
  ),
170
243
  "claude-opus-4-0": SpecificModelConfig(
171
244
  version_default="4.0",
@@ -182,7 +255,7 @@ CLAUDE = ModelFamilyConfig(
182
255
  max_tokens=32000,
183
256
  context_window=200000,
184
257
  ),
185
- patterns=["claude-opus-4-{snapshot:8d}", "claude-opus-4-0", "claude-opus-4-0@{snapshot:8d}"],
258
+ patterns=["claude-opus-4-{snapshot:snapshot}", "claude-opus-4-0", "claude-opus-4-0@{snapshot:snapshot}"],
186
259
  ),
187
260
  "claude-3-5-haiku": SpecificModelConfig(
188
261
  version_default="3.5",
@@ -198,7 +271,7 @@ CLAUDE = ModelFamilyConfig(
198
271
  max_tokens=8000,
199
272
  context_window=200000,
200
273
  ),
201
- patterns=["claude-3-5-haiku-{snapshot:8d}", "claude-3-5-haiku-latest", "claude-3-5-haiku"],
274
+ patterns=["claude-3-5-haiku-{snapshot:snapshot}", "claude-3-5-haiku-latest", "claude-3-5-haiku"],
202
275
  ),
203
276
  "claude-3-haiku": SpecificModelConfig(
204
277
  version_default="3.0",
@@ -213,7 +286,7 @@ CLAUDE = ModelFamilyConfig(
213
286
  max_tokens=4096,
214
287
  context_window=200000,
215
288
  ),
216
- patterns=["claude-3-haiku-{snapshot:8d}"],
289
+ patterns=["claude-3-haiku-{snapshot:snapshot}"],
217
290
  ),
218
291
  },
219
292
  )