python-fastllm 0.0.1__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- fastllm/__init__.py +1 -0
- fastllm/_modidx.py +245 -0
- fastllm/acomplete.py +122 -0
- fastllm/anthropic.py +298 -0
- fastllm/chat.py +622 -0
- fastllm/gemini.py +304 -0
- fastllm/openai_chat.py +219 -0
- fastllm/openai_responses.py +260 -0
- fastllm/specs/anthropic.json +1 -0
- fastllm/specs/anthropic.yml +15684 -0
- fastllm/specs/gemini.json +6951 -0
- fastllm/specs/openai.with-code-samples.json +1 -0
- fastllm/specs/openai.with-code-samples.yml +73650 -0
- fastllm/specs/spec_manifest.json +17 -0
- fastllm/streaming.py +162 -0
- fastllm/types.py +301 -0
- python_fastllm-0.0.1.dist-info/METADATA +395 -0
- python_fastllm-0.0.1.dist-info/RECORD +21 -0
- python_fastllm-0.0.1.dist-info/WHEEL +5 -0
- python_fastllm-0.0.1.dist-info/entry_points.txt +2 -0
- python_fastllm-0.0.1.dist-info/top_level.txt +1 -0
fastllm/__init__.py
ADDED
|
@@ -0,0 +1 @@
|
|
|
1
|
+
__version__ = "0.0.1"  # public version string for the fastllm package
|
fastllm/_modidx.py
ADDED
|
@@ -0,0 +1,245 @@
|
|
|
1
|
+
# Autogenerated by nbdev
|
|
2
|
+
|
|
3
|
+
d = { 'settings': { 'branch': 'main',
|
|
4
|
+
'doc_baseurl': '/',
|
|
5
|
+
'doc_host': '',
|
|
6
|
+
'git_url': 'https://github.com/AnswerDotAI/fastllm',
|
|
7
|
+
'lib_path': 'fastllm'},
|
|
8
|
+
'syms': { 'fastllm.acomplete': { 'fastllm.acomplete.ContextWindowExceededError': ( 'acomplete.html#contextwindowexceedederror',
|
|
9
|
+
'fastllm/acomplete.py'),
|
|
10
|
+
'fastllm.acomplete._classify_error': ('acomplete.html#_classify_error', 'fastllm/acomplete.py'),
|
|
11
|
+
'fastllm.acomplete._classify_error_stream': ( 'acomplete.html#_classify_error_stream',
|
|
12
|
+
'fastllm/acomplete.py'),
|
|
13
|
+
'fastllm.acomplete._is_ctx_exceeded': ('acomplete.html#_is_ctx_exceeded', 'fastllm/acomplete.py'),
|
|
14
|
+
'fastllm.acomplete.acomplete': ('acomplete.html#acomplete', 'fastllm/acomplete.py'),
|
|
15
|
+
'fastllm.acomplete.mk_client': ('acomplete.html#mk_client', 'fastllm/acomplete.py')},
|
|
16
|
+
'fastllm.anthropic': { 'fastllm.anthropic._ant_cc': ('anthropic.html#_ant_cc', 'fastllm/anthropic.py'),
|
|
17
|
+
'fastllm.anthropic._ant_part_type': ('anthropic.html#_ant_part_type', 'fastllm/anthropic.py'),
|
|
18
|
+
'fastllm.anthropic.acollect_stream': ('anthropic.html#acollect_stream', 'fastllm/anthropic.py'),
|
|
19
|
+
'fastllm.anthropic.cost': ('anthropic.html#cost', 'fastllm/anthropic.py'),
|
|
20
|
+
'fastllm.anthropic.delta_index_fn': ('anthropic.html#delta_index_fn', 'fastllm/anthropic.py'),
|
|
21
|
+
'fastllm.anthropic.denorm_assistant': ('anthropic.html#denorm_assistant', 'fastllm/anthropic.py'),
|
|
22
|
+
'fastllm.anthropic.denorm_file': ('anthropic.html#denorm_file', 'fastllm/anthropic.py'),
|
|
23
|
+
'fastllm.anthropic.denorm_image': ('anthropic.html#denorm_image', 'fastllm/anthropic.py'),
|
|
24
|
+
'fastllm.anthropic.denorm_msgs': ('anthropic.html#denorm_msgs', 'fastllm/anthropic.py'),
|
|
25
|
+
'fastllm.anthropic.denorm_reasoning': ('anthropic.html#denorm_reasoning', 'fastllm/anthropic.py'),
|
|
26
|
+
'fastllm.anthropic.denorm_system': ('anthropic.html#denorm_system', 'fastllm/anthropic.py'),
|
|
27
|
+
'fastllm.anthropic.denorm_tool': ('anthropic.html#denorm_tool', 'fastllm/anthropic.py'),
|
|
28
|
+
'fastllm.anthropic.denorm_tool_choice': ('anthropic.html#denorm_tool_choice', 'fastllm/anthropic.py'),
|
|
29
|
+
'fastllm.anthropic.denorm_tool_result': ('anthropic.html#denorm_tool_result', 'fastllm/anthropic.py'),
|
|
30
|
+
'fastllm.anthropic.denorm_tool_schs': ('anthropic.html#denorm_tool_schs', 'fastllm/anthropic.py'),
|
|
31
|
+
'fastllm.anthropic.denorm_tool_use': ('anthropic.html#denorm_tool_use', 'fastllm/anthropic.py'),
|
|
32
|
+
'fastllm.anthropic.denorm_user': ('anthropic.html#denorm_user', 'fastllm/anthropic.py'),
|
|
33
|
+
'fastllm.anthropic.denorm_web_search': ('anthropic.html#denorm_web_search', 'fastllm/anthropic.py'),
|
|
34
|
+
'fastllm.anthropic.get_hdrs': ('anthropic.html#get_hdrs', 'fastllm/anthropic.py'),
|
|
35
|
+
'fastllm.anthropic.mk_payload': ('anthropic.html#mk_payload', 'fastllm/anthropic.py'),
|
|
36
|
+
'fastllm.anthropic.norm_finish': ('anthropic.html#norm_finish', 'fastllm/anthropic.py'),
|
|
37
|
+
'fastllm.anthropic.norm_parts': ('anthropic.html#norm_parts', 'fastllm/anthropic.py'),
|
|
38
|
+
'fastllm.anthropic.norm_sse_event': ('anthropic.html#norm_sse_event', 'fastllm/anthropic.py'),
|
|
39
|
+
'fastllm.anthropic.norm_tool_call': ('anthropic.html#norm_tool_call', 'fastllm/anthropic.py'),
|
|
40
|
+
'fastllm.anthropic.norm_tool_calls': ('anthropic.html#norm_tool_calls', 'fastllm/anthropic.py'),
|
|
41
|
+
'fastllm.anthropic.norm_usage': ('anthropic.html#norm_usage', 'fastllm/anthropic.py')},
|
|
42
|
+
'fastllm.chat': { 'fastllm.chat.AsyncChat': ('chat.html#asyncchat', 'fastllm/chat.py'),
|
|
43
|
+
'fastllm.chat.AsyncChat.__call__': ('chat.html#asyncchat.__call__', 'fastllm/chat.py'),
|
|
44
|
+
'fastllm.chat.AsyncChat.__init__': ('chat.html#asyncchat.__init__', 'fastllm/chat.py'),
|
|
45
|
+
'fastllm.chat.AsyncChat._call': ('chat.html#asyncchat._call', 'fastllm/chat.py'),
|
|
46
|
+
'fastllm.chat.AsyncChat._prep_call': ('chat.html#asyncchat._prep_call', 'fastllm/chat.py'),
|
|
47
|
+
'fastllm.chat.AsyncChat._prep_msg': ('chat.html#asyncchat._prep_msg', 'fastllm/chat.py'),
|
|
48
|
+
'fastllm.chat.AsyncChat._track': ('chat.html#asyncchat._track', 'fastllm/chat.py'),
|
|
49
|
+
'fastllm.chat.AsyncChat.print_hist': ('chat.html#asyncchat.print_hist', 'fastllm/chat.py'),
|
|
50
|
+
'fastllm.chat.AsyncChat.tcdict': ('chat.html#asyncchat.tcdict', 'fastllm/chat.py'),
|
|
51
|
+
'fastllm.chat.AsyncStreamFormatter': ('chat.html#asyncstreamformatter', 'fastllm/chat.py'),
|
|
52
|
+
'fastllm.chat.AsyncStreamFormatter.format_stream': ( 'chat.html#asyncstreamformatter.format_stream',
|
|
53
|
+
'fastllm/chat.py'),
|
|
54
|
+
'fastllm.chat.FullResponse': ('chat.html#fullresponse', 'fastllm/chat.py'),
|
|
55
|
+
'fastllm.chat.StopResponse': ('chat.html#stopresponse', 'fastllm/chat.py'),
|
|
56
|
+
'fastllm.chat.StreamFormatter': ('chat.html#streamformatter', 'fastllm/chat.py'),
|
|
57
|
+
'fastllm.chat.StreamFormatter.__init__': ('chat.html#streamformatter.__init__', 'fastllm/chat.py'),
|
|
58
|
+
'fastllm.chat.StreamFormatter.format_item': ('chat.html#streamformatter.format_item', 'fastllm/chat.py'),
|
|
59
|
+
'fastllm.chat.StreamFormatter.format_stream': ('chat.html#streamformatter.format_stream', 'fastllm/chat.py'),
|
|
60
|
+
'fastllm.chat.ToolResponse': ('chat.html#toolresponse', 'fastllm/chat.py'),
|
|
61
|
+
'fastllm.chat.UsageStats': ('chat.html#usagestats', 'fastllm/chat.py'),
|
|
62
|
+
'fastllm.chat.UsageStats.__add__': ('chat.html#usagestats.__add__', 'fastllm/chat.py'),
|
|
63
|
+
'fastllm.chat.UsageStats.__init__': ('chat.html#usagestats.__init__', 'fastllm/chat.py'),
|
|
64
|
+
'fastllm.chat.UsageStats.__radd__': ('chat.html#usagestats.__radd__', 'fastllm/chat.py'),
|
|
65
|
+
'fastllm.chat.UsageStats.__repr__': ('chat.html#usagestats.__repr__', 'fastllm/chat.py'),
|
|
66
|
+
'fastllm.chat.UsageStats.fmt': ('chat.html#usagestats.fmt', 'fastllm/chat.py'),
|
|
67
|
+
'fastllm.chat.UsageStats.from_response': ('chat.html#usagestats.from_response', 'fastllm/chat.py'),
|
|
68
|
+
'fastllm.chat._add_cache_control': ('chat.html#_add_cache_control', 'fastllm/chat.py'),
|
|
69
|
+
'fastllm.chat._alite_call_func': ('chat.html#_alite_call_func', 'fastllm/chat.py'),
|
|
70
|
+
'fastllm.chat._apply_cache_idxs': ('chat.html#_apply_cache_idxs', 'fastllm/chat.py'),
|
|
71
|
+
'fastllm.chat._bytes2content': ('chat.html#_bytes2content', 'fastllm/chat.py'),
|
|
72
|
+
'fastllm.chat._call_func': ('chat.html#_call_func', 'fastllm/chat.py'),
|
|
73
|
+
'fastllm.chat._extract_tool_parts': ('chat.html#_extract_tool_parts', 'fastllm/chat.py'),
|
|
74
|
+
'fastllm.chat._handle_stop_reason': ('chat.html#_handle_stop_reason', 'fastllm/chat.py'),
|
|
75
|
+
'fastllm.chat._has_cache': ('chat.html#_has_cache', 'fastllm/chat.py'),
|
|
76
|
+
'fastllm.chat._has_search': ('chat.html#_has_search', 'fastllm/chat.py'),
|
|
77
|
+
'fastllm.chat._has_stop': ('chat.html#_has_stop', 'fastllm/chat.py'),
|
|
78
|
+
'fastllm.chat._inject_tool_reminder': ('chat.html#_inject_tool_reminder', 'fastllm/chat.py'),
|
|
79
|
+
'fastllm.chat._lite_call_func': ('chat.html#_lite_call_func', 'fastllm/chat.py'),
|
|
80
|
+
'fastllm.chat._mk_content': ('chat.html#_mk_content', 'fastllm/chat.py'),
|
|
81
|
+
'fastllm.chat._mk_prefill': ('chat.html#_mk_prefill', 'fastllm/chat.py'),
|
|
82
|
+
'fastllm.chat._mk_tool_result': ('chat.html#_mk_tool_result', 'fastllm/chat.py'),
|
|
83
|
+
'fastllm.chat._srv_tc_summary': ('chat.html#_srv_tc_summary', 'fastllm/chat.py'),
|
|
84
|
+
'fastllm.chat._srvtools': ('chat.html#_srvtools', 'fastllm/chat.py'),
|
|
85
|
+
'fastllm.chat._tc_summary': ('chat.html#_tc_summary', 'fastllm/chat.py'),
|
|
86
|
+
'fastllm.chat._think_kw': ('chat.html#_think_kw', 'fastllm/chat.py'),
|
|
87
|
+
'fastllm.chat._trunc_content': ('chat.html#_trunc_content', 'fastllm/chat.py'),
|
|
88
|
+
'fastllm.chat._trunc_param': ('chat.html#_trunc_param', 'fastllm/chat.py'),
|
|
89
|
+
'fastllm.chat._trunc_str': ('chat.html#_trunc_str', 'fastllm/chat.py'),
|
|
90
|
+
'fastllm.chat._usrtools': ('chat.html#_usrtools', 'fastllm/chat.py'),
|
|
91
|
+
'fastllm.chat.add_warning': ('chat.html#add_warning', 'fastllm/chat.py'),
|
|
92
|
+
'fastllm.chat.adisplay_stream': ('chat.html#adisplay_stream', 'fastllm/chat.py'),
|
|
93
|
+
'fastllm.chat.astream_with_complete': ('chat.html#astream_with_complete', 'fastllm/chat.py'),
|
|
94
|
+
'fastllm.chat.cite_footnote': ('chat.html#cite_footnote', 'fastllm/chat.py'),
|
|
95
|
+
'fastllm.chat.contents': ('chat.html#contents', 'fastllm/chat.py'),
|
|
96
|
+
'fastllm.chat.fmt2hist': ('chat.html#fmt2hist', 'fastllm/chat.py'),
|
|
97
|
+
'fastllm.chat.lite_mk_func': ('chat.html#lite_mk_func', 'fastllm/chat.py'),
|
|
98
|
+
'fastllm.chat.mk_msg': ('chat.html#mk_msg', 'fastllm/chat.py'),
|
|
99
|
+
'fastllm.chat.mk_msgs': ('chat.html#mk_msgs', 'fastllm/chat.py'),
|
|
100
|
+
'fastllm.chat.mk_srv_tc_details': ('chat.html#mk_srv_tc_details', 'fastllm/chat.py'),
|
|
101
|
+
'fastllm.chat.mk_tr_details': ('chat.html#mk_tr_details', 'fastllm/chat.py'),
|
|
102
|
+
'fastllm.chat.postproc': ('chat.html#postproc', 'fastllm/chat.py'),
|
|
103
|
+
'fastllm.chat.remove_cache_ckpts': ('chat.html#remove_cache_ckpts', 'fastllm/chat.py'),
|
|
104
|
+
'fastllm.chat.search_count': ('chat.html#search_count', 'fastllm/chat.py'),
|
|
105
|
+
'fastllm.chat.split_tools': ('chat.html#split_tools', 'fastllm/chat.py'),
|
|
106
|
+
'fastllm.chat.stop_reason': ('chat.html#stop_reason', 'fastllm/chat.py'),
|
|
107
|
+
'fastllm.chat.structured': ('chat.html#structured', 'fastllm/chat.py')},
|
|
108
|
+
'fastllm.gemini': { 'fastllm.gemini._gem_filter_sch': ('gemini.html#_gem_filter_sch', 'fastllm/gemini.py'),
|
|
109
|
+
'fastllm.gemini._gem_part_type': ('gemini.html#_gem_part_type', 'fastllm/gemini.py'),
|
|
110
|
+
'fastllm.gemini.acollect_stream': ('gemini.html#acollect_stream', 'fastllm/gemini.py'),
|
|
111
|
+
'fastllm.gemini.cost': ('gemini.html#cost', 'fastllm/gemini.py'),
|
|
112
|
+
'fastllm.gemini.delta_index_fn': ('gemini.html#delta_index_fn', 'fastllm/gemini.py'),
|
|
113
|
+
'fastllm.gemini.denorm_assistant': ('gemini.html#denorm_assistant', 'fastllm/gemini.py'),
|
|
114
|
+
'fastllm.gemini.denorm_audio': ('gemini.html#denorm_audio', 'fastllm/gemini.py'),
|
|
115
|
+
'fastllm.gemini.denorm_file': ('gemini.html#denorm_file', 'fastllm/gemini.py'),
|
|
116
|
+
'fastllm.gemini.denorm_image': ('gemini.html#denorm_image', 'fastllm/gemini.py'),
|
|
117
|
+
'fastllm.gemini.denorm_msgs': ('gemini.html#denorm_msgs', 'fastllm/gemini.py'),
|
|
118
|
+
'fastllm.gemini.denorm_reasoning': ('gemini.html#denorm_reasoning', 'fastllm/gemini.py'),
|
|
119
|
+
'fastllm.gemini.denorm_system': ('gemini.html#denorm_system', 'fastllm/gemini.py'),
|
|
120
|
+
'fastllm.gemini.denorm_tool': ('gemini.html#denorm_tool', 'fastllm/gemini.py'),
|
|
121
|
+
'fastllm.gemini.denorm_tool_choice': ('gemini.html#denorm_tool_choice', 'fastllm/gemini.py'),
|
|
122
|
+
'fastllm.gemini.denorm_tool_result': ('gemini.html#denorm_tool_result', 'fastllm/gemini.py'),
|
|
123
|
+
'fastllm.gemini.denorm_tool_schs': ('gemini.html#denorm_tool_schs', 'fastllm/gemini.py'),
|
|
124
|
+
'fastllm.gemini.denorm_tool_use': ('gemini.html#denorm_tool_use', 'fastllm/gemini.py'),
|
|
125
|
+
'fastllm.gemini.denorm_user': ('gemini.html#denorm_user', 'fastllm/gemini.py'),
|
|
126
|
+
'fastllm.gemini.denorm_video': ('gemini.html#denorm_video', 'fastllm/gemini.py'),
|
|
127
|
+
'fastllm.gemini.denorm_web_search': ('gemini.html#denorm_web_search', 'fastllm/gemini.py'),
|
|
128
|
+
'fastllm.gemini.get_hdrs': ('gemini.html#get_hdrs', 'fastllm/gemini.py'),
|
|
129
|
+
'fastllm.gemini.mk_payload': ('gemini.html#mk_payload', 'fastllm/gemini.py'),
|
|
130
|
+
'fastllm.gemini.norm_finish': ('gemini.html#norm_finish', 'fastllm/gemini.py'),
|
|
131
|
+
'fastllm.gemini.norm_parts': ('gemini.html#norm_parts', 'fastllm/gemini.py'),
|
|
132
|
+
'fastllm.gemini.norm_sse_event': ('gemini.html#norm_sse_event', 'fastllm/gemini.py'),
|
|
133
|
+
'fastllm.gemini.norm_tool_calls': ('gemini.html#norm_tool_calls', 'fastllm/gemini.py'),
|
|
134
|
+
'fastllm.gemini.norm_usage': ('gemini.html#norm_usage', 'fastllm/gemini.py')},
|
|
135
|
+
'fastllm.openai_chat': { 'fastllm.openai_chat.acollect_stream': ('oai_chat.html#acollect_stream', 'fastllm/openai_chat.py'),
|
|
136
|
+
'fastllm.openai_chat.cost': ('oai_chat.html#cost', 'fastllm/openai_chat.py'),
|
|
137
|
+
'fastllm.openai_chat.delta_index_fn': ('oai_chat.html#delta_index_fn', 'fastllm/openai_chat.py'),
|
|
138
|
+
'fastllm.openai_chat.denorm_assistant': ('oai_chat.html#denorm_assistant', 'fastllm/openai_chat.py'),
|
|
139
|
+
'fastllm.openai_chat.denorm_audio': ('oai_chat.html#denorm_audio', 'fastllm/openai_chat.py'),
|
|
140
|
+
'fastllm.openai_chat.denorm_file': ('oai_chat.html#denorm_file', 'fastllm/openai_chat.py'),
|
|
141
|
+
'fastllm.openai_chat.denorm_image': ('oai_chat.html#denorm_image', 'fastllm/openai_chat.py'),
|
|
142
|
+
'fastllm.openai_chat.denorm_msgs': ('oai_chat.html#denorm_msgs', 'fastllm/openai_chat.py'),
|
|
143
|
+
'fastllm.openai_chat.denorm_reasoning': ('oai_chat.html#denorm_reasoning', 'fastllm/openai_chat.py'),
|
|
144
|
+
'fastllm.openai_chat.denorm_system': ('oai_chat.html#denorm_system', 'fastllm/openai_chat.py'),
|
|
145
|
+
'fastllm.openai_chat.denorm_tool': ('oai_chat.html#denorm_tool', 'fastllm/openai_chat.py'),
|
|
146
|
+
'fastllm.openai_chat.denorm_tool_choice': ( 'oai_chat.html#denorm_tool_choice',
|
|
147
|
+
'fastllm/openai_chat.py'),
|
|
148
|
+
'fastllm.openai_chat.denorm_tool_result': ( 'oai_chat.html#denorm_tool_result',
|
|
149
|
+
'fastllm/openai_chat.py'),
|
|
150
|
+
'fastllm.openai_chat.denorm_tool_schs': ('oai_chat.html#denorm_tool_schs', 'fastllm/openai_chat.py'),
|
|
151
|
+
'fastllm.openai_chat.denorm_tool_use': ('oai_chat.html#denorm_tool_use', 'fastllm/openai_chat.py'),
|
|
152
|
+
'fastllm.openai_chat.denorm_user': ('oai_chat.html#denorm_user', 'fastllm/openai_chat.py'),
|
|
153
|
+
'fastllm.openai_chat.denorm_web_search': ('oai_chat.html#denorm_web_search', 'fastllm/openai_chat.py'),
|
|
154
|
+
'fastllm.openai_chat.get_hdrs': ('oai_chat.html#get_hdrs', 'fastllm/openai_chat.py'),
|
|
155
|
+
'fastllm.openai_chat.mk_payload': ('oai_chat.html#mk_payload', 'fastllm/openai_chat.py'),
|
|
156
|
+
'fastllm.openai_chat.norm_finish': ('oai_chat.html#norm_finish', 'fastllm/openai_chat.py'),
|
|
157
|
+
'fastllm.openai_chat.norm_parts': ('oai_chat.html#norm_parts', 'fastllm/openai_chat.py'),
|
|
158
|
+
'fastllm.openai_chat.norm_sse_event': ('oai_chat.html#norm_sse_event', 'fastllm/openai_chat.py'),
|
|
159
|
+
'fastllm.openai_chat.norm_tool_calls': ('oai_chat.html#norm_tool_calls', 'fastllm/openai_chat.py')},
|
|
160
|
+
'fastllm.openai_responses': { 'fastllm.openai_responses.acollect_stream': ( 'oai_responses.html#acollect_stream',
|
|
161
|
+
'fastllm/openai_responses.py'),
|
|
162
|
+
'fastllm.openai_responses.cost': ('oai_responses.html#cost', 'fastllm/openai_responses.py'),
|
|
163
|
+
'fastllm.openai_responses.delta_index_fn': ( 'oai_responses.html#delta_index_fn',
|
|
164
|
+
'fastllm/openai_responses.py'),
|
|
165
|
+
'fastllm.openai_responses.denorm_assistant': ( 'oai_responses.html#denorm_assistant',
|
|
166
|
+
'fastllm/openai_responses.py'),
|
|
167
|
+
'fastllm.openai_responses.denorm_file': ( 'oai_responses.html#denorm_file',
|
|
168
|
+
'fastllm/openai_responses.py'),
|
|
169
|
+
'fastllm.openai_responses.denorm_image': ( 'oai_responses.html#denorm_image',
|
|
170
|
+
'fastllm/openai_responses.py'),
|
|
171
|
+
'fastllm.openai_responses.denorm_msgs': ( 'oai_responses.html#denorm_msgs',
|
|
172
|
+
'fastllm/openai_responses.py'),
|
|
173
|
+
'fastllm.openai_responses.denorm_reasoning': ( 'oai_responses.html#denorm_reasoning',
|
|
174
|
+
'fastllm/openai_responses.py'),
|
|
175
|
+
'fastllm.openai_responses.denorm_system': ( 'oai_responses.html#denorm_system',
|
|
176
|
+
'fastllm/openai_responses.py'),
|
|
177
|
+
'fastllm.openai_responses.denorm_tool': ( 'oai_responses.html#denorm_tool',
|
|
178
|
+
'fastllm/openai_responses.py'),
|
|
179
|
+
'fastllm.openai_responses.denorm_tool_choice': ( 'oai_responses.html#denorm_tool_choice',
|
|
180
|
+
'fastllm/openai_responses.py'),
|
|
181
|
+
'fastllm.openai_responses.denorm_tool_result': ( 'oai_responses.html#denorm_tool_result',
|
|
182
|
+
'fastllm/openai_responses.py'),
|
|
183
|
+
'fastllm.openai_responses.denorm_tool_schs': ( 'oai_responses.html#denorm_tool_schs',
|
|
184
|
+
'fastllm/openai_responses.py'),
|
|
185
|
+
'fastllm.openai_responses.denorm_tool_use': ( 'oai_responses.html#denorm_tool_use',
|
|
186
|
+
'fastllm/openai_responses.py'),
|
|
187
|
+
'fastllm.openai_responses.denorm_user': ( 'oai_responses.html#denorm_user',
|
|
188
|
+
'fastllm/openai_responses.py'),
|
|
189
|
+
'fastllm.openai_responses.denorm_web_search': ( 'oai_responses.html#denorm_web_search',
|
|
190
|
+
'fastllm/openai_responses.py'),
|
|
191
|
+
'fastllm.openai_responses.get_hdrs': ( 'oai_responses.html#get_hdrs',
|
|
192
|
+
'fastllm/openai_responses.py'),
|
|
193
|
+
'fastllm.openai_responses.mk_payload': ( 'oai_responses.html#mk_payload',
|
|
194
|
+
'fastllm/openai_responses.py'),
|
|
195
|
+
'fastllm.openai_responses.norm_finish': ( 'oai_responses.html#norm_finish',
|
|
196
|
+
'fastllm/openai_responses.py'),
|
|
197
|
+
'fastllm.openai_responses.norm_parts': ( 'oai_responses.html#norm_parts',
|
|
198
|
+
'fastllm/openai_responses.py'),
|
|
199
|
+
'fastllm.openai_responses.norm_sse_event': ( 'oai_responses.html#norm_sse_event',
|
|
200
|
+
'fastllm/openai_responses.py'),
|
|
201
|
+
'fastllm.openai_responses.norm_tool_call': ( 'oai_responses.html#norm_tool_call',
|
|
202
|
+
'fastllm/openai_responses.py'),
|
|
203
|
+
'fastllm.openai_responses.norm_tool_calls': ( 'oai_responses.html#norm_tool_calls',
|
|
204
|
+
'fastllm/openai_responses.py'),
|
|
205
|
+
'fastllm.openai_responses.norm_usage': ( 'oai_responses.html#norm_usage',
|
|
206
|
+
'fastllm/openai_responses.py')},
|
|
207
|
+
'fastllm.streaming': { 'fastllm.streaming.Delta': ('streaming.html#delta', 'fastllm/streaming.py'),
|
|
208
|
+
'fastllm.streaming.PartAccum': ('streaming.html#partaccum', 'fastllm/streaming.py'),
|
|
209
|
+
'fastllm.streaming.PartAccum.append': ('streaming.html#partaccum.append', 'fastllm/streaming.py'),
|
|
210
|
+
'fastllm.streaming.PartAccum.finalize': ('streaming.html#partaccum.finalize', 'fastllm/streaming.py'),
|
|
211
|
+
'fastllm.streaming._trim_delta': ('streaming.html#_trim_delta', 'fastllm/streaming.py'),
|
|
212
|
+
'fastllm.streaming.accum_completion': ('streaming.html#accum_completion', 'fastllm/streaming.py'),
|
|
213
|
+
'fastllm.streaming.completion_text': ('streaming.html#completion_text', 'fastllm/streaming.py'),
|
|
214
|
+
'fastllm.streaming.fake_stream': ('streaming.html#fake_stream', 'fastllm/streaming.py'),
|
|
215
|
+
'fastllm.streaming.mk_acollect_stream': ('streaming.html#mk_acollect_stream', 'fastllm/streaming.py'),
|
|
216
|
+
'fastllm.streaming.norm_and_yield': ('streaming.html#norm_and_yield', 'fastllm/streaming.py'),
|
|
217
|
+
'fastllm.streaming.stop_sequences': ('streaming.html#stop_sequences', 'fastllm/streaming.py')},
|
|
218
|
+
'fastllm.types': { 'fastllm.types.APIRegistry': ('types.html#apiregistry', 'fastllm/types.py'),
|
|
219
|
+
'fastllm.types.APIRegistry.__init__': ('types.html#apiregistry.__init__', 'fastllm/types.py'),
|
|
220
|
+
'fastllm.types.APIRegistry.register': ('types.html#apiregistry.register', 'fastllm/types.py'),
|
|
221
|
+
'fastllm.types.Completion': ('types.html#completion', 'fastllm/types.py'),
|
|
222
|
+
'fastllm.types.Completion._repr_markdown_': ('types.html#completion._repr_markdown_', 'fastllm/types.py'),
|
|
223
|
+
'fastllm.types.Completion.cost': ('types.html#completion.cost', 'fastllm/types.py'),
|
|
224
|
+
'fastllm.types.Msg': ('types.html#msg', 'fastllm/types.py'),
|
|
225
|
+
'fastllm.types.Msg._repr_markdown_': ('types.html#msg._repr_markdown_', 'fastllm/types.py'),
|
|
226
|
+
'fastllm.types.Part': ('types.html#part', 'fastllm/types.py'),
|
|
227
|
+
'fastllm.types.Part._repr_markdown_': ('types.html#part._repr_markdown_', 'fastllm/types.py'),
|
|
228
|
+
'fastllm.types.ToolCall': ('types.html#toolcall', 'fastllm/types.py'),
|
|
229
|
+
'fastllm.types.ToolCall._repr_markdown_': ('types.html#toolcall._repr_markdown_', 'fastllm/types.py'),
|
|
230
|
+
'fastllm.types.Usage': ('types.html#usage', 'fastllm/types.py'),
|
|
231
|
+
'fastllm.types._trunc_strs': ('types.html#_trunc_strs', 'fastllm/types.py'),
|
|
232
|
+
'fastllm.types.data_url': ('types.html#data_url', 'fastllm/types.py'),
|
|
233
|
+
'fastllm.types.display_list': ('types.html#display_list', 'fastllm/types.py'),
|
|
234
|
+
'fastllm.types.fn_schema': ('types.html#fn_schema', 'fastllm/types.py'),
|
|
235
|
+
'fastllm.types.get_api_key': ('types.html#get_api_key', 'fastllm/types.py'),
|
|
236
|
+
'fastllm.types.get_model_info': ('types.html#get_model_info', 'fastllm/types.py'),
|
|
237
|
+
'fastllm.types.get_model_meta': ('types.html#get_model_meta', 'fastllm/types.py'),
|
|
238
|
+
'fastllm.types.infer_api_name': ('types.html#infer_api_name', 'fastllm/types.py'),
|
|
239
|
+
'fastllm.types.mk_completion': ('types.html#mk_completion', 'fastllm/types.py'),
|
|
240
|
+
'fastllm.types.mk_tool_res_msg': ('types.html#mk_tool_res_msg', 'fastllm/types.py'),
|
|
241
|
+
'fastllm.types.model_prices_meta': ('types.html#model_prices_meta', 'fastllm/types.py'),
|
|
242
|
+
'fastllm.types.part_txt': ('types.html#part_txt', 'fastllm/types.py'),
|
|
243
|
+
'fastllm.types.payload_kwargs': ('types.html#payload_kwargs', 'fastllm/types.py'),
|
|
244
|
+
'fastllm.types.sys_text': ('types.html#sys_text', 'fastllm/types.py'),
|
|
245
|
+
'fastllm.types.url_mime': ('types.html#url_mime', 'fastllm/types.py')}}}
|
fastllm/acomplete.py
ADDED
|
@@ -0,0 +1,122 @@
|
|
|
1
|
+
"""A high level unified function make api calls"""
|
|
2
|
+
|
|
3
|
+
# AUTOGENERATED! DO NOT EDIT! File to edit: ../nbs/06_acomplete.ipynb.
|
|
4
|
+
|
|
5
|
+
# %% auto #0
|
|
6
|
+
__all__ = ['specs_path', 'ant_spec', 'oai_spec', 'gem_spec', 'vendor_mapping', 'api2spec', 'mk_client',
|
|
7
|
+
'ContextWindowExceededError', 'acomplete']
|
|
8
|
+
|
|
9
|
+
# %% ../nbs/06_acomplete.ipynb #f2f57253
|
|
10
|
+
import json
|
|
11
|
+
from importlib.resources import files
|
|
12
|
+
from fastcore.utils import *
|
|
13
|
+
from fastcore.meta import *
|
|
14
|
+
from fastspec.spec import *
|
|
15
|
+
from fastspec.oapi import *
|
|
16
|
+
from fastspec.errors import APIError
|
|
17
|
+
|
|
18
|
+
from .types import *
|
|
19
|
+
from .streaming import *
|
|
20
|
+
from .openai_responses import *
|
|
21
|
+
from .streaming import stop_sequences as _stop_sequences
|
|
22
|
+
from .openai_chat import *
|
|
23
|
+
from .anthropic import *
|
|
24
|
+
from .gemini import *
|
|
25
|
+
|
|
26
|
+
# %% ../nbs/06_acomplete.ipynb #6d11ac28
# Provider API specs bundled inside the package; parsed once at import time.
specs_path = files('fastllm') / 'specs'  # packaged `fastllm/specs/` resource directory
# Anthropic and OpenAI ship OpenAPI documents; Gemini ships a Google discovery doc,
# hence the different parser entry points.
ant_spec = SpecParser.from_openapi(dict2obj(json.loads((specs_path/'anthropic.json').read_text())))
oai_spec = SpecParser.from_openapi(dict2obj(json.loads((specs_path/'openai.with-code-samples.json').read_text())))
gem_spec = SpecParser.from_discovery(dict2obj(json.loads((specs_path/'gemini.json').read_text())))
|
|
32
|
+
# %% ../nbs/06_acomplete.ipynb #32ee2546
# Auth-file fallback for codex: (path, *nested JSON keys leading to the token);
# consumed by `mk_client` when neither `api_key` nor the env var is set.
_codex_json = '~/.codex/auth.json', 'tokens','access_token'
# vendor name -> (api_name, default base_url, api-key env var[, auth-file fallback]).
# `api_name` selects the request/response dialect ('openai' responses API,
# 'openai_chat' chat-completions API, 'anthropic', 'gemini'); many vendors are
# OpenAI-chat-compatible and only differ in base_url and key env var.
vendor_mapping = {
    "openai": ('openai', 'https://api.openai.com/v1', 'OPENAI_API_KEY'),
    "anthropic": ('anthropic', 'https://api.anthropic.com', 'ANTHROPIC_API_KEY'),
    "gemini": ('gemini', 'https://generativelanguage.googleapis.com/', 'GEMINI_API_KEY'),
    "openai_chat": ('openai_chat', 'https://api.openai.com/v1', 'OPENAI_API_KEY'),
    "codex": ('openai', 'https://chatgpt.com/backend-api/codex', 'CODEX_AUTH_TOKEN', _codex_json),
    "moonshot": ('openai_chat', "https://api.moonshot.ai/v1", "MOONSHOT_API_KEY"),
    "deepseek": ('openai_chat', "https://api.deepseek.com/v1", "DEEPSEEK_API_KEY"),
    "openrouter": ('openai_chat', "https://openrouter.ai/api/v1", "OPENROUTER_API_KEY"),
    "together": ('openai_chat', "https://api.together.xyz/v1", "TOGETHER_API_KEY"),
    "fireworks_ai": ('openai_chat', "https://api.fireworks.ai/inference/v1", "FIREWORKS_API_KEY"),
    "qwen": ('openai_chat', "https://dashscope.aliyuncs.com/compatible-mode/v1", "QWEN_API_KEY")
}
|
|
48
|
+
# %% ../nbs/06_acomplete.ipynb #77d27ea7
# Parsed spec for each API dialect; the responses API and chat API share the OpenAI spec.
api2spec = {'openai':oai_spec, 'openai_chat':oai_spec, 'anthropic':ant_spec, 'gemini':gem_spec}
|
+
|
|
51
|
+
# %% ../nbs/06_acomplete.ipynb #79075d95
@flexicache()
def mk_client(model, vendor_name=None, api_name=None, api_key=None, base_url=None, xtra_hdrs=None):
    """Build (and memoize via `flexicache`) an `OpenAPIClient` for `model`.

    Resolution order: an explicit `vendor_name` wins (looked up in `vendor_mapping`);
    otherwise a fully-custom (`api_name`, `base_url`, `api_key`) triple; otherwise the
    api is inferred from the model name. Returns `(client, api_name, vendor_name)`.
    Raises `ValueError` for an unknown vendor or an unresolvable model.
    """
    err_msg = f"please pass a valid one vendor: {', '.join(list(vendor_mapping))} or pass `api_name`,`base_url` and `api_key`"
    if vendor_name:
        # Explicit membership check rather than try/except KeyError around the whole
        # branch: previously a KeyError raised by `json.loads`/`nested_idx` below
        # would be misreported as "Unknown vendor".
        if vendor_name not in vendor_mapping: raise ValueError(f"Unknown vendor '{vendor_name}', {err_msg}")
        override_base_url = base_url  # caller-supplied base_url overrides the vendor default
        api_name, base_url, env_api_nm, *auth_json = vendor_mapping[vendor_name]
        base_url = override_base_url or base_url
        if auth_json and not api_key and not os.getenv(env_api_nm):
            # Auth-file fallback (e.g. codex's ~/.codex/auth.json): first element is the
            # path, the rest are the nested JSON keys leading to the token.
            # Fix: was `fn,keys = auth_json[0]`, which raised
            # "too many values to unpack" on the 3-tuple `_codex_json`.
            fn, *keys = auth_json[0]
            auth_fn = Path(fn).expanduser()
            if auth_fn.exists(): api_key = nested_idx(json.loads(auth_fn.read_text()), *keys)
        api_key = get_api_key(api_key, env_api_nm)
    elif api_name and base_url and api_key: vendor_name = ifnone(vendor_name, 'custom')
    elif (api_name:=infer_api_name(model)): base_url, vendor_name = None, api_name
    else: raise ValueError(f"Model {model} can't be auto resolved, {err_msg}")
    api = api_registry.apis[api_name]
    spec, hdrs = api2spec[api_name], api.get_hdrs(api_key)
    cli = OpenAPIClient(spec, headers=merge(hdrs, ifnone(xtra_hdrs, {})))
    if base_url is not None:
        # Point every operation at the resolved base_url (vendor override or custom).
        for op in cli.ops: op.base_url = base_url  # pyright: ignore[reportAttributeAccessIssue]
    return cli, api_name, vendor_name
+
|
|
76
|
+
# %% ../nbs/06_acomplete.ipynb #df851a5c
# Specific subclass raised in place of a generic `APIError` when the provider
# reports the prompt exceeded the model's context window (see `_classify_error`).
class ContextWindowExceededError(APIError): pass
79
|
+
def _is_ctx_exceeded(code, msg):
|
|
80
|
+
m = (msg or "").lower()
|
|
81
|
+
if any(x in m for x in ("string_above_max_length", "invalid 'user'")): return False
|
|
82
|
+
if str(code or "").lower() == "context_length_exceeded": return True
|
|
83
|
+
return any(s in m for s in ("exceed context limit", "maximum context length", "maximum context limit",
|
|
84
|
+
"longer than the model's context length", "input tokens exceed the configured limit",
|
|
85
|
+
"exceeds the maximum number of tokens allowed", "prompt is too long"))
|
|
86
|
+
|
|
87
|
+
def _classify_error(exc):
    "Upgrade generic `APIError` to a specific subclass if applicable."
    # Anything that isn't an APIError passes through untouched.
    if not isinstance(exc, APIError): return exc
    if _is_ctx_exceeded(exc.code, exc.message):
        # Rebuild with all original metadata intact so callers can still inspect
        # provider/status/request-id/etc. on the upgraded exception.
        return ContextWindowExceededError(exc.message, provider=exc.provider, model=exc.model,
                                          endpoint=exc.endpoint, status_code=exc.status_code, error_type=exc.error_type,
                                          code=exc.code, request_id=exc.request_id, retryable=exc.retryable, raw=exc.raw)
    return exc
95
|
+
|
|
96
|
+
async def _classify_error_stream(gen):
    "Yield items from async generator `gen`, upgrading any `APIError` raised mid-stream."
    try:
        async for item in gen:
            yield item
    except APIError as err:
        # Re-raise as the most specific subclass, keeping the original as the cause.
        raise _classify_error(err) from err
102
|
+
# %% ../nbs/06_acomplete.ipynb #2379ec94
@delegates(payload_kwargs)
async def acomplete(msgs, model, api_name=None, vendor_name=None, api_key=None, base_url=None, xtra_body=None, xtra_hdrs=None,
                    stream=False, stop_callables=None, stop_sequences=None, **kwargs):
    "Unified completion across different APIs."
    # Resolve client + dialect + vendor (see `mk_client` for resolution order).
    cli, api_name, vendor_name = mk_client(model, vendor_name, api_name, api_key, base_url, xtra_hdrs)
    api = api_registry.apis[api_name]
    # Plain stop strings become an extra stop-callable appended to any caller-provided ones.
    if stop_sequences: stop_callables = L(stop_callables) + [_stop_sequences(stop_sequences)]
    payload = api.mk_payload(msgs, model, stream=stream, stop_callables=stop_callables, **kwargs)
    # Caller-supplied body keys override/extend the generated payload.
    payload = merge(payload, ifnone(xtra_body, {}))
    if vendor_name == 'codex':
        # The codex backend rejects these sampling/limit/metadata params and requires store=False.
        for k in 'temperature max_tokens max_output_tokens max_completion_tokens metadata'.split(): payload.pop(k, None)
        payload['store'] = False
    if nested_idx(payload, 'messages', -1, 'role') == 'assistant':
        # Trailing assistant message => prefill/continuation; flag it per vendor convention.
        # NOTE(review): the 'v4'/'kimi' model-name substring checks look fragile — confirm
        # against each vendor's current prefix-completion docs.
        if vendor_name == 'deepseek' and 'v4' in model: payload['messages'][-1]['prefix'] = True
        if vendor_name == 'moonshot' and 'kimi' in model: payload['messages'][-1]['partial'] = True
    # `api.op_path` maps stream flag -> dotted attribute path of the client operation.
    func = attrgetter(api.op_path[stream])(cli)
    try: resp = await func(**payload)
    except APIError as e: raise _classify_error(e) from e
    # Streaming: return the wrapped async generator; errors raised mid-stream are
    # classified lazily by `_classify_error_stream`.
    if stream: return _classify_error_stream(api.acollect_stream(resp, model=model, vendor_name=vendor_name, stop_callables=stop_callables))
    return mk_completion(resp, model=model, api_name=api_name, vendor_name=vendor_name)
|