python-fastllm 0.0.16__tar.gz → 0.0.18__tar.gz
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- {python_fastllm-0.0.16 → python_fastllm-0.0.18}/PKG-INFO +1 -1
- python_fastllm-0.0.18/fastllm/__init__.py +1 -0
- {python_fastllm-0.0.16 → python_fastllm-0.0.18}/fastllm/acomplete.py +2 -1
- {python_fastllm-0.0.16 → python_fastllm-0.0.18}/fastllm/chat.py +5 -4
- {python_fastllm-0.0.16 → python_fastllm-0.0.18}/fastllm/types.py +16 -5
- {python_fastllm-0.0.16 → python_fastllm-0.0.18}/python_fastllm.egg-info/PKG-INFO +1 -1
- python_fastllm-0.0.16/fastllm/__init__.py +0 -1
- {python_fastllm-0.0.16 → python_fastllm-0.0.18}/README.md +0 -0
- {python_fastllm-0.0.16 → python_fastllm-0.0.18}/fastllm/_modidx.py +0 -0
- {python_fastllm-0.0.16 → python_fastllm-0.0.18}/fastllm/anthropic.py +0 -0
- {python_fastllm-0.0.16 → python_fastllm-0.0.18}/fastllm/codex.py +0 -0
- {python_fastllm-0.0.16 → python_fastllm-0.0.18}/fastllm/gemini.py +0 -0
- {python_fastllm-0.0.16 → python_fastllm-0.0.18}/fastllm/openai_chat.py +0 -0
- {python_fastllm-0.0.16 → python_fastllm-0.0.18}/fastllm/openai_responses.py +0 -0
- {python_fastllm-0.0.16 → python_fastllm-0.0.18}/fastllm/specs/anthropic.json +0 -0
- {python_fastllm-0.0.16 → python_fastllm-0.0.18}/fastllm/specs/anthropic.yml +0 -0
- {python_fastllm-0.0.16 → python_fastllm-0.0.18}/fastllm/specs/gemini.json +0 -0
- {python_fastllm-0.0.16 → python_fastllm-0.0.18}/fastllm/specs/openai.with-code-samples.json +0 -0
- {python_fastllm-0.0.16 → python_fastllm-0.0.18}/fastllm/specs/openai.with-code-samples.yml +0 -0
- {python_fastllm-0.0.16 → python_fastllm-0.0.18}/fastllm/specs/spec_manifest.json +0 -0
- {python_fastllm-0.0.16 → python_fastllm-0.0.18}/fastllm/streaming.py +0 -0
- {python_fastllm-0.0.16 → python_fastllm-0.0.18}/pyproject.toml +0 -0
- {python_fastllm-0.0.16 → python_fastllm-0.0.18}/python_fastllm.egg-info/SOURCES.txt +0 -0
- {python_fastllm-0.0.16 → python_fastllm-0.0.18}/python_fastllm.egg-info/dependency_links.txt +0 -0
- {python_fastllm-0.0.16 → python_fastllm-0.0.18}/python_fastllm.egg-info/entry_points.txt +0 -0
- {python_fastllm-0.0.16 → python_fastllm-0.0.18}/python_fastllm.egg-info/requires.txt +0 -0
- {python_fastllm-0.0.16 → python_fastllm-0.0.18}/python_fastllm.egg-info/top_level.txt +0 -0
- {python_fastllm-0.0.16 → python_fastllm-0.0.18}/setup.cfg +0 -0
|
@@ -0,0 +1 @@
|
|
|
1
|
+
__version__ = "0.0.18"
|
|
@@ -43,7 +43,8 @@ vendor_mapping = {
|
|
|
43
43
|
"openrouter": ('openai_chat', "https://openrouter.ai/api/v1", "OPENROUTER_API_KEY"),
|
|
44
44
|
"together": ('openai_chat', "https://api.together.xyz/v1", "TOGETHER_API_KEY"),
|
|
45
45
|
"fireworks_ai": ('openai_chat', "https://api.fireworks.ai/inference/v1", "FIREWORKS_API_KEY"),
|
|
46
|
-
"qwen": ('openai_chat', "https://dashscope.aliyuncs.com/compatible-mode/v1", "QWEN_API_KEY")
|
|
46
|
+
"qwen": ('openai_chat', "https://dashscope.aliyuncs.com/compatible-mode/v1", "QWEN_API_KEY"),
|
|
47
|
+
"minimax": ('anthropic', "https://api.minimax.io/anthropic", "MINIMAX_API_KEY")
|
|
47
48
|
}
|
|
48
49
|
|
|
49
50
|
# %% ../nbs/06_acomplete.ipynb #77d27ea7
|
|
@@ -620,10 +620,11 @@ def _handle_stop_reason(res):
|
|
|
620
620
|
# %% ../nbs/07_chat.ipynb #daf876f4
|
|
621
621
|
class StopReasonCallback(ChatCallback):
|
|
622
622
|
order = 40
|
|
623
|
-
async def after_acomplete(self):
|
|
624
|
-
action,
|
|
625
|
-
if action
|
|
626
|
-
|
|
623
|
+
async def after_acomplete(self):
|
|
624
|
+
action,msg = _handle_stop_reason(self.turn_res)
|
|
625
|
+
if action != 'warning': return
|
|
626
|
+
add_warning(self.chat.turn_res, msg)
|
|
627
|
+
if self.stream: yield dict(text=f"warning: {msg}\n\n")
|
|
627
628
|
|
|
628
629
|
# %% ../nbs/07_chat.ipynb #aa7630b2
|
|
629
630
|
def _active_fence_langs(tool_schemas):
|
|
@@ -340,10 +340,12 @@ for model in ('kimi-k2.5', 'kimi-k2.6'):
|
|
|
340
340
|
register_model_info('gemini-3.1-flash-lite', vendor_name='gemini', base='gemini-3.1-flash-lite-preview')
|
|
341
341
|
register_model_info('models/gemini-3.1-flash-lite', vendor_name='gemini', base='gemini-3.1-flash-lite-preview')
|
|
342
342
|
|
|
343
|
-
|
|
344
|
-
|
|
345
|
-
|
|
346
|
-
|
|
343
|
+
register_model_info('accounts/fireworks/models/kimi-k2p5', vendor_name='fireworks_ai', base='accounts/fireworks/models/kimi-k2p5',
|
|
344
|
+
supports_reasoning=True, supports_vision=True,
|
|
345
|
+
input_cost_per_token=0.60e-6, cache_read_input_token_cost=0.10e-6, output_cost_per_token=3.0e-6)
|
|
346
|
+
register_model_info('accounts/fireworks/models/kimi-k2p6', vendor_name='fireworks_ai', base='accounts/fireworks/models/kimi-k2p5',
|
|
347
|
+
supports_reasoning=True, supports_vision=True,
|
|
348
|
+
input_cost_per_token=0.95e-6, cache_read_input_token_cost=0.16e-6, output_cost_per_token=4.0e-6)
|
|
347
349
|
|
|
348
350
|
# %% ../nbs/00_types.ipynb #948d55d0
|
|
349
351
|
deepseek_v4_common = dict(**modern_llm, supports_assistant_prefill=True,
|
|
@@ -363,6 +365,15 @@ register_model_info('mimo-v2.5-pro', vendor_name='mimo', **mimo_v25_common, base
|
|
|
363
365
|
register_model_info('mimo-v2.5', vendor_name='mimo', **mimo_v25_common, base='deepseek-v4-pro', base_vendor_name='deepseek',
|
|
364
366
|
input_cost_per_token=0.14e-6, output_cost_per_token=0.28e-6, cache_read_input_token_cost=0.0028e-6, search_context_cost_per_query=0.005,
|
|
365
367
|
supports_vision=True, supports_image_input=True)
|
|
368
|
+
register_model_info('mimo-v2.5-pro-ultraspeed', vendor_name='mimo', **mimo_v25_common, base='deepseek-v4-pro', base_vendor_name='deepseek',
|
|
369
|
+
input_cost_per_token=1.305e-6, output_cost_per_token=2.61e-6, cache_read_input_token_cost=0.0108e-6, search_context_cost_per_query=0.005)
|
|
370
|
+
|
|
371
|
+
# %% ../nbs/00_types.ipynb #defb1c5c
|
|
372
|
+
register_model_info('MiniMax-M3', vendor_name='minimax', **modern_llm, max_input_tokens=512_000, max_output_tokens=512_000, max_tokens=512_000, input_cost_per_token=0.3e-6, output_cost_per_token=1.2e-6, cache_read_input_token_cost=0.06e-6, supports_vision=True, supports_video_input=True)
|
|
373
|
+
|
|
374
|
+
register_model_info('claude-fable-5', vendor_name='anthropic', base="claude-opus-4-8",
|
|
375
|
+
input_cost_per_token=10e-6, cache_creation_input_token_cost=12.5e-6, output_cost_per_token=50e-6,
|
|
376
|
+
cache_read_input_token_cost=1e-6, search_context_cost_per_query=0.005)
|
|
366
377
|
|
|
367
378
|
# %% ../nbs/00_types.ipynb #2c23d11e
|
|
368
379
|
codex_pricing = dict(
|
|
@@ -388,7 +399,7 @@ def approx_pricing(nm, vendor_name, out=10, cache=80, inp=10, markup=0):
|
|
|
388
399
|
p = get_model_pricing(nm, vendor_name)
|
|
389
400
|
ic = p.get('cache_creation_input_token_cost', p['input_cost_per_token'])
|
|
390
401
|
res = (p['output_cost_per_token']*out + p['cache_read_input_token_cost']*cache + ic*inp) / (out+cache+inp)
|
|
391
|
-
if nm in ('claude-opus-4-7','claude-opus-4-8'): res *= 1.5
|
|
402
|
+
if nm in ('claude-opus-4-7','claude-opus-4-8','claude-fable-5'): res *= 1.5
|
|
392
403
|
return res*(1+markup)
|
|
393
404
|
|
|
394
405
|
# %% ../nbs/00_types.ipynb #8bfca02d
|
|
@@ -1 +0,0 @@
|
|
|
1
|
-
__version__ = "0.0.16"
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
{python_fastllm-0.0.16 → python_fastllm-0.0.18}/python_fastllm.egg-info/dependency_links.txt
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|