lm-deluge 0.0.88__py3-none-any.whl → 0.0.89__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
@@ -52,6 +52,7 @@ async def _build_gemini_request(
52
52
 
53
53
  # Handle reasoning models (thinking)
54
54
  is_gemini_3 = "gemini-3" in model.name.lower()
55
+ is_gemini_3_flash = "gemini-3-flash" in model.name.lower()
55
56
  if is_gemini_3:
56
57
  # gemini3 MUST think
57
58
  if not sampling_params.reasoning_effort:
@@ -62,13 +63,24 @@ async def _build_gemini_request(
62
63
  if effort_key == "xhigh":
63
64
  maybe_warn("WARN_XHIGH_TO_HIGH", model_name=model.name)
64
65
  effort_key = "high"
65
- level_map = {
66
- "none": "low",
67
- "minimal": "low",
68
- "low": "low",
69
- "medium": "high", # change when supported
70
- "high": "high",
71
- }
66
+ if is_gemini_3_flash:
67
+ # Flash supports minimal, low, medium, high
68
+ level_map = {
69
+ "none": "low",
70
+ "minimal": "minimal",
71
+ "low": "low",
72
+ "medium": "medium",
73
+ "high": "high",
74
+ }
75
+ else:
76
+ # Pro only supports low, high
77
+ level_map = {
78
+ "none": "low",
79
+ "minimal": "low",
80
+ "low": "low",
81
+ "medium": "high",
82
+ "high": "high",
83
+ }
72
84
  effort = level_map[effort_key]
73
85
  thinking_config = {"thinkingLevel": effort}
74
86
  request_json["generationConfig"]["thinkingConfig"] = thinking_config
@@ -153,6 +153,19 @@ GOOGLE_MODELS = {
153
153
  # Note: >200k tokens pricing is $4/$18 per million
154
154
  "reasoning_model": True,
155
155
  },
156
+ "gemini-3-flash-preview": {
157
+ "id": "gemini-3-flash-preview",
158
+ "name": "gemini-3-flash-preview",
159
+ "api_base": "https://generativelanguage.googleapis.com/v1alpha",
160
+ "api_key_env_var": "GEMINI_API_KEY",
161
+ "supports_json": True,
162
+ "supports_logprobs": False,
163
+ "api_spec": "gemini",
164
+ "input_cost": 0.5,
165
+ "cached_input_cost": 0.125, # estimated
166
+ "output_cost": 3.0,
167
+ "reasoning_model": True,
168
+ },
156
169
  # Gemini 2.5 Computer Use model
157
170
  "gemini-2.5-computer-use": {
158
171
  "id": "gemini-2.5-computer-use",
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.4
2
2
  Name: lm_deluge
3
- Version: 0.0.88
3
+ Version: 0.0.89
4
4
  Summary: Python utility for using LLM API models.
5
5
  Author-email: Benjamin Anderson <ben@trytaylor.ai>
6
6
  Requires-Python: >=3.10
@@ -21,7 +21,7 @@ lm_deluge/api_requests/base.py,sha256=05j5nrZhgNon2YRFXT_L-yVXKlvdodwOJan6Z6WpSp
21
21
  lm_deluge/api_requests/bedrock.py,sha256=mY1xTvgfCLyqLlfFFmu_baKgkVq1Df1_MJXeN_G1jWQ,15597
22
22
  lm_deluge/api_requests/chat_reasoning.py,sha256=sJvstvKFqsSBUjYcwxzGt2_FH4cEp3Z6gKcBPyPjGwk,236
23
23
  lm_deluge/api_requests/common.py,sha256=BZ3vRO5TB669_UsNKugkkuFSzoLHOYJIKt4nV4sf4vc,422
24
- lm_deluge/api_requests/gemini.py,sha256=_L1V1O7N70rvnp28kXfCaWXluQXEBfMbvSk3S7SrZcI,12730
24
+ lm_deluge/api_requests/gemini.py,sha256=osVbTVCdVef6sfE0XsG13olsnDHB2J70_c6G2IP-sIg,13189
25
25
  lm_deluge/api_requests/mistral.py,sha256=8JZP2CDf1XZfaPcTk0WS4q-VfYYj58ptpoH8LD3MQG4,4528
26
26
  lm_deluge/api_requests/openai.py,sha256=cEoMpMPKrVTz2Zjm5pdD8sQpOHDB9O8ndwf9TGqLPcA,29889
27
27
  lm_deluge/api_requests/response.py,sha256=vG194gAH5p7ulpNy4qy5Pryfb1p3ZV21-YGoj__ru3E,7436
@@ -38,7 +38,7 @@ lm_deluge/models/cerebras.py,sha256=u2FMXJF6xMr0euDRKLKMo_NVTOcvSrrEpehbHr8sSeE,
38
38
  lm_deluge/models/cohere.py,sha256=iXjYtM6jy_YL73Op8OfNsrMNopwae9y-Sw-4vF9cEBw,3406
39
39
  lm_deluge/models/deepseek.py,sha256=b5t_ep6fE-2cKD2mmImBaLcJUbYrfizYnjG96sfKNTk,2072
40
40
  lm_deluge/models/fireworks.py,sha256=yvt2Ggzye4aUqCqY74ta67Vu7FrQaLFjdFtN4P7D-dc,638
41
- lm_deluge/models/google.py,sha256=IDePlNOvF0lvpv3UhkUD8g30TUJqoaJHQGzTglyGg80,6560
41
+ lm_deluge/models/google.py,sha256=ka5tBdpYT26zxsE1wzrl81Rt5XgpBQkPIOXOq5pSpRE,7033
42
42
  lm_deluge/models/grok.py,sha256=rSvN3fKiO_WPNa5O_TzVTDj9-RqqjeXFBiC9OAcGZ4Q,3340
43
43
  lm_deluge/models/groq.py,sha256=Mi5WE1xOBGoZlymD0UN6kzhH_NOmfJYU4N2l-TO0Z8Q,2552
44
44
  lm_deluge/models/kimi.py,sha256=B_ZL4_0q6hS1VVskBWlBR569nNSjC8RgA2lj1eCjRRE,1183
@@ -110,8 +110,8 @@ lm_deluge/util/schema.py,sha256=q6uwhA4s1lM2dHT1Kwc46E7OY1VecMOtTEI0PTFn6tA,1320
110
110
  lm_deluge/util/spatial.py,sha256=BsF_UKhE-x0xBirc-bV1xSKZRTUhsOBdGqsMKme20C8,4099
111
111
  lm_deluge/util/validation.py,sha256=hz5dDb3ebvZrZhnaWxOxbNSVMI6nmaOODBkk0htAUhs,1575
112
112
  lm_deluge/util/xml.py,sha256=Ft4zajoYBJR3HHCt2oHwGfymGLdvp_gegVmJ-Wqk4Ck,10547
113
- lm_deluge-0.0.88.dist-info/licenses/LICENSE,sha256=uNNXGXPCw2TC7CUs7SEBkA-Mz6QBQFWUUEWDMgEs1dU,1058
114
- lm_deluge-0.0.88.dist-info/METADATA,sha256=SNJZGw7OHpfMUVG5CvYyeBQ0lNiLUg1FbZis2XXj2eg,14057
115
- lm_deluge-0.0.88.dist-info/WHEEL,sha256=_zCd3N1l69ArxyTb8rzEoP9TpbYXkqRFSNOD5OuxnTs,91
116
- lm_deluge-0.0.88.dist-info/top_level.txt,sha256=hqU-TJX93yBwpgkDtYcXyLr3t7TLSCCZ_reytJjwBaE,10
117
- lm_deluge-0.0.88.dist-info/RECORD,,
113
+ lm_deluge-0.0.89.dist-info/licenses/LICENSE,sha256=uNNXGXPCw2TC7CUs7SEBkA-Mz6QBQFWUUEWDMgEs1dU,1058
114
+ lm_deluge-0.0.89.dist-info/METADATA,sha256=JHgKoBFnOQJ8y1HTpeWhFYBi4H4SJoJ3ZwsfGMJFc_U,14057
115
+ lm_deluge-0.0.89.dist-info/WHEEL,sha256=_zCd3N1l69ArxyTb8rzEoP9TpbYXkqRFSNOD5OuxnTs,91
116
+ lm_deluge-0.0.89.dist-info/top_level.txt,sha256=hqU-TJX93yBwpgkDtYcXyLr3t7TLSCCZ_reytJjwBaE,10
117
+ lm_deluge-0.0.89.dist-info/RECORD,,