ommlds-0.0.0.dev456-py3-none-any.whl → ommlds-0.0.0.dev485-py3-none-any.whl

Files changed (212)
  1. ommlds/.omlish-manifests.json +314 -33
  2. ommlds/__about__.py +15 -9
  3. ommlds/_hacks/__init__.py +4 -0
  4. ommlds/_hacks/funcs.py +110 -0
  5. ommlds/_hacks/names.py +158 -0
  6. ommlds/_hacks/params.py +73 -0
  7. ommlds/_hacks/patches.py +0 -3
  8. ommlds/backends/anthropic/protocol/__init__.py +13 -1
  9. ommlds/backends/anthropic/protocol/_dataclasses.py +1625 -0
  10. ommlds/backends/anthropic/protocol/sse/assemble.py +22 -6
  11. ommlds/backends/anthropic/protocol/sse/events.py +13 -0
  12. ommlds/backends/google/protocol/__init__.py +13 -0
  13. ommlds/backends/google/protocol/_dataclasses.py +5997 -0
  14. ommlds/backends/google/protocol/types.py +5 -1
  15. ommlds/backends/groq/__init__.py +7 -0
  16. ommlds/backends/groq/_dataclasses.py +3901 -0
  17. ommlds/backends/groq/_marshal.py +23 -0
  18. ommlds/backends/groq/protocol.py +249 -0
  19. ommlds/backends/llamacpp/logging.py +4 -1
  20. ommlds/backends/mlx/caching.py +7 -3
  21. ommlds/backends/mlx/cli.py +10 -7
  22. ommlds/backends/mlx/generation.py +18 -16
  23. ommlds/backends/mlx/limits.py +10 -6
  24. ommlds/backends/mlx/loading.py +65 -5
  25. ommlds/backends/ollama/__init__.py +7 -0
  26. ommlds/backends/ollama/_dataclasses.py +3458 -0
  27. ommlds/backends/ollama/protocol.py +170 -0
  28. ommlds/backends/openai/protocol/__init__.py +15 -1
  29. ommlds/backends/openai/protocol/_dataclasses.py +7708 -0
  30. ommlds/backends/tavily/__init__.py +7 -0
  31. ommlds/backends/tavily/_dataclasses.py +1734 -0
  32. ommlds/backends/tavily/protocol.py +301 -0
  33. ommlds/backends/tinygrad/models/llama3/__init__.py +22 -14
  34. ommlds/backends/transformers/__init__.py +14 -0
  35. ommlds/backends/transformers/filecache.py +109 -0
  36. ommlds/backends/transformers/streamers.py +73 -0
  37. ommlds/cli/__init__.py +7 -0
  38. ommlds/cli/_dataclasses.py +2562 -0
  39. ommlds/cli/asyncs.py +30 -0
  40. ommlds/cli/backends/catalog.py +93 -0
  41. ommlds/cli/backends/configs.py +9 -0
  42. ommlds/cli/backends/inject.py +31 -36
  43. ommlds/cli/backends/injection.py +16 -0
  44. ommlds/cli/backends/types.py +46 -0
  45. ommlds/cli/content/messages.py +34 -0
  46. ommlds/cli/content/strings.py +42 -0
  47. ommlds/cli/inject.py +15 -32
  48. ommlds/cli/inputs/__init__.py +0 -0
  49. ommlds/cli/inputs/asyncs.py +32 -0
  50. ommlds/cli/inputs/sync.py +75 -0
  51. ommlds/cli/main.py +267 -128
  52. ommlds/cli/rendering/__init__.py +0 -0
  53. ommlds/cli/rendering/configs.py +9 -0
  54. ommlds/cli/rendering/inject.py +31 -0
  55. ommlds/cli/rendering/markdown.py +52 -0
  56. ommlds/cli/rendering/raw.py +73 -0
  57. ommlds/cli/rendering/types.py +21 -0
  58. ommlds/cli/secrets.py +21 -0
  59. ommlds/cli/sessions/base.py +1 -1
  60. ommlds/cli/sessions/chat/chat/__init__.py +0 -0
  61. ommlds/cli/sessions/chat/chat/ai/__init__.py +0 -0
  62. ommlds/cli/sessions/chat/chat/ai/configs.py +11 -0
  63. ommlds/cli/sessions/chat/chat/ai/inject.py +74 -0
  64. ommlds/cli/sessions/chat/chat/ai/injection.py +14 -0
  65. ommlds/cli/sessions/chat/chat/ai/rendering.py +70 -0
  66. ommlds/cli/sessions/chat/chat/ai/services.py +79 -0
  67. ommlds/cli/sessions/chat/chat/ai/tools.py +44 -0
  68. ommlds/cli/sessions/chat/chat/ai/types.py +28 -0
  69. ommlds/cli/sessions/chat/chat/state/__init__.py +0 -0
  70. ommlds/cli/sessions/chat/chat/state/configs.py +11 -0
  71. ommlds/cli/sessions/chat/chat/state/inject.py +36 -0
  72. ommlds/cli/sessions/chat/chat/state/inmemory.py +33 -0
  73. ommlds/cli/sessions/chat/chat/state/storage.py +52 -0
  74. ommlds/cli/sessions/chat/chat/state/types.py +38 -0
  75. ommlds/cli/sessions/chat/chat/user/__init__.py +0 -0
  76. ommlds/cli/sessions/chat/chat/user/configs.py +17 -0
  77. ommlds/cli/sessions/chat/chat/user/inject.py +62 -0
  78. ommlds/cli/sessions/chat/chat/user/interactive.py +31 -0
  79. ommlds/cli/sessions/chat/chat/user/oneshot.py +25 -0
  80. ommlds/cli/sessions/chat/chat/user/types.py +15 -0
  81. ommlds/cli/sessions/chat/configs.py +27 -0
  82. ommlds/cli/sessions/chat/driver.py +43 -0
  83. ommlds/cli/sessions/chat/inject.py +33 -65
  84. ommlds/cli/sessions/chat/phases/__init__.py +0 -0
  85. ommlds/cli/sessions/chat/phases/inject.py +27 -0
  86. ommlds/cli/sessions/chat/phases/injection.py +14 -0
  87. ommlds/cli/sessions/chat/phases/manager.py +29 -0
  88. ommlds/cli/sessions/chat/phases/types.py +29 -0
  89. ommlds/cli/sessions/chat/session.py +27 -0
  90. ommlds/cli/sessions/chat/tools/__init__.py +0 -0
  91. ommlds/cli/sessions/chat/tools/configs.py +22 -0
  92. ommlds/cli/sessions/chat/tools/confirmation.py +46 -0
  93. ommlds/cli/sessions/chat/tools/execution.py +66 -0
  94. ommlds/cli/sessions/chat/tools/fs/__init__.py +0 -0
  95. ommlds/cli/sessions/chat/tools/fs/configs.py +12 -0
  96. ommlds/cli/sessions/chat/tools/fs/inject.py +35 -0
  97. ommlds/cli/sessions/chat/tools/inject.py +88 -0
  98. ommlds/cli/sessions/chat/tools/injection.py +44 -0
  99. ommlds/cli/sessions/chat/tools/rendering.py +58 -0
  100. ommlds/cli/sessions/chat/tools/todo/__init__.py +0 -0
  101. ommlds/cli/sessions/chat/tools/todo/configs.py +12 -0
  102. ommlds/cli/sessions/chat/tools/todo/inject.py +31 -0
  103. ommlds/cli/sessions/chat/tools/weather/__init__.py +0 -0
  104. ommlds/cli/sessions/chat/tools/weather/configs.py +12 -0
  105. ommlds/cli/sessions/chat/tools/weather/inject.py +22 -0
  106. ommlds/cli/{tools/weather.py → sessions/chat/tools/weather/tools.py} +1 -1
  107. ommlds/cli/sessions/completion/configs.py +21 -0
  108. ommlds/cli/sessions/completion/inject.py +42 -0
  109. ommlds/cli/sessions/completion/session.py +35 -0
  110. ommlds/cli/sessions/embedding/configs.py +21 -0
  111. ommlds/cli/sessions/embedding/inject.py +42 -0
  112. ommlds/cli/sessions/embedding/session.py +33 -0
  113. ommlds/cli/sessions/inject.py +28 -11
  114. ommlds/cli/state/__init__.py +0 -0
  115. ommlds/cli/state/inject.py +28 -0
  116. ommlds/cli/{state.py → state/storage.py} +41 -24
  117. ommlds/minichain/__init__.py +46 -17
  118. ommlds/minichain/_dataclasses.py +15401 -0
  119. ommlds/minichain/backends/catalogs/base.py +20 -1
  120. ommlds/minichain/backends/catalogs/simple.py +2 -2
  121. ommlds/minichain/backends/catalogs/strings.py +10 -8
  122. ommlds/minichain/backends/impls/anthropic/chat.py +31 -65
  123. ommlds/minichain/backends/impls/anthropic/names.py +3 -4
  124. ommlds/minichain/backends/impls/anthropic/protocol.py +109 -0
  125. ommlds/minichain/backends/impls/anthropic/stream.py +53 -31
  126. ommlds/minichain/backends/impls/duckduckgo/search.py +5 -1
  127. ommlds/minichain/backends/impls/dummy/__init__.py +0 -0
  128. ommlds/minichain/backends/impls/dummy/chat.py +69 -0
  129. ommlds/minichain/backends/impls/google/chat.py +9 -2
  130. ommlds/minichain/backends/impls/google/search.py +6 -1
  131. ommlds/minichain/backends/impls/google/stream.py +122 -32
  132. ommlds/minichain/backends/impls/groq/__init__.py +0 -0
  133. ommlds/minichain/backends/impls/groq/chat.py +75 -0
  134. ommlds/minichain/backends/impls/groq/names.py +48 -0
  135. ommlds/minichain/backends/impls/groq/protocol.py +143 -0
  136. ommlds/minichain/backends/impls/groq/stream.py +125 -0
  137. ommlds/minichain/backends/impls/huggingface/repos.py +1 -5
  138. ommlds/minichain/backends/impls/llamacpp/chat.py +15 -3
  139. ommlds/minichain/backends/impls/llamacpp/completion.py +7 -3
  140. ommlds/minichain/backends/impls/llamacpp/stream.py +38 -19
  141. ommlds/minichain/backends/impls/mistral.py +9 -2
  142. ommlds/minichain/backends/impls/mlx/chat.py +100 -23
  143. ommlds/minichain/backends/impls/ollama/__init__.py +0 -0
  144. ommlds/minichain/backends/impls/ollama/chat.py +199 -0
  145. ommlds/minichain/backends/impls/openai/chat.py +14 -7
  146. ommlds/minichain/backends/impls/openai/completion.py +9 -2
  147. ommlds/minichain/backends/impls/openai/embedding.py +9 -2
  148. ommlds/minichain/backends/impls/openai/format.py +115 -109
  149. ommlds/minichain/backends/impls/openai/names.py +31 -5
  150. ommlds/minichain/backends/impls/openai/stream.py +33 -27
  151. ommlds/minichain/backends/impls/sentencepiece/tokens.py +9 -6
  152. ommlds/minichain/backends/impls/tavily.py +66 -0
  153. ommlds/minichain/backends/impls/tinygrad/chat.py +17 -14
  154. ommlds/minichain/backends/impls/tokenizers/tokens.py +9 -6
  155. ommlds/minichain/backends/impls/transformers/sentence.py +5 -2
  156. ommlds/minichain/backends/impls/transformers/tokens.py +10 -7
  157. ommlds/minichain/backends/impls/transformers/transformers.py +139 -20
  158. ommlds/minichain/backends/strings/parsing.py +1 -1
  159. ommlds/minichain/backends/strings/resolving.py +4 -1
  160. ommlds/minichain/chat/choices/stream/__init__.py +0 -0
  161. ommlds/minichain/chat/choices/stream/adapters.py +35 -0
  162. ommlds/minichain/chat/choices/stream/joining.py +31 -0
  163. ommlds/minichain/chat/choices/stream/services.py +45 -0
  164. ommlds/minichain/chat/choices/stream/types.py +43 -0
  165. ommlds/minichain/chat/stream/_marshal.py +4 -4
  166. ommlds/minichain/chat/stream/joining.py +85 -0
  167. ommlds/minichain/chat/stream/services.py +15 -15
  168. ommlds/minichain/chat/stream/types.py +24 -18
  169. ommlds/minichain/llms/types.py +4 -0
  170. ommlds/minichain/registries/globals.py +18 -4
  171. ommlds/minichain/resources.py +28 -3
  172. ommlds/minichain/search.py +1 -1
  173. ommlds/minichain/standard.py +8 -0
  174. ommlds/minichain/stream/services.py +19 -16
  175. ommlds/minichain/tools/reflect.py +5 -1
  176. ommlds/nanochat/LICENSE +21 -0
  177. ommlds/nanochat/__init__.py +0 -0
  178. ommlds/nanochat/rustbpe/LICENSE +21 -0
  179. ommlds/nanochat/tokenizers.py +406 -0
  180. ommlds/specs/__init__.py +0 -0
  181. ommlds/specs/mcp/__init__.py +0 -0
  182. ommlds/specs/mcp/_marshal.py +23 -0
  183. ommlds/specs/mcp/clients.py +146 -0
  184. ommlds/specs/mcp/protocol.py +371 -0
  185. ommlds/tools/git.py +13 -6
  186. ommlds/tools/ocr.py +1 -8
  187. ommlds/wiki/analyze.py +2 -2
  188. ommlds/wiki/text/mfh.py +1 -5
  189. ommlds/wiki/text/wtp.py +1 -3
  190. ommlds/wiki/utils/xml.py +5 -5
  191. {ommlds-0.0.0.dev456.dist-info → ommlds-0.0.0.dev485.dist-info}/METADATA +22 -19
  192. {ommlds-0.0.0.dev456.dist-info → ommlds-0.0.0.dev485.dist-info}/RECORD +198 -95
  193. ommlds/cli/backends/standard.py +0 -20
  194. ommlds/cli/sessions/chat/base.py +0 -42
  195. ommlds/cli/sessions/chat/code.py +0 -129
  196. ommlds/cli/sessions/chat/interactive.py +0 -71
  197. ommlds/cli/sessions/chat/printing.py +0 -97
  198. ommlds/cli/sessions/chat/prompt.py +0 -151
  199. ommlds/cli/sessions/chat/state.py +0 -110
  200. ommlds/cli/sessions/chat/tools.py +0 -100
  201. ommlds/cli/sessions/completion/completion.py +0 -44
  202. ommlds/cli/sessions/embedding/embedding.py +0 -42
  203. ommlds/cli/tools/config.py +0 -14
  204. ommlds/cli/tools/inject.py +0 -75
  205. ommlds/minichain/backends/impls/openai/format2.py +0 -210
  206. ommlds/minichain/chat/stream/adapters.py +0 -80
  207. /ommlds/{huggingface.py → backends/huggingface.py} +0 -0
  208. /ommlds/cli/{tools → content}/__init__.py +0 -0
  209. {ommlds-0.0.0.dev456.dist-info → ommlds-0.0.0.dev485.dist-info}/WHEEL +0 -0
  210. {ommlds-0.0.0.dev456.dist-info → ommlds-0.0.0.dev485.dist-info}/entry_points.txt +0 -0
  211. {ommlds-0.0.0.dev456.dist-info → ommlds-0.0.0.dev485.dist-info}/licenses/LICENSE +0 -0
  212. {ommlds-0.0.0.dev456.dist-info → ommlds-0.0.0.dev485.dist-info}/top_level.txt +0 -0
ommlds/minichain/backends/impls/llamacpp/chat.py

@@ -2,13 +2,10 @@ import contextlib
 import os.path
 import typing as ta

-import llama_cpp as lcc
-
 from omlish import check
 from omlish import lang
 from omlish import typedvalues as tv

-from .....backends import llamacpp as lcu
 from ....chat.choices.services import ChatChoicesRequest
 from ....chat.choices.services import ChatChoicesResponse
 from ....chat.choices.services import static_check_is_chat_choices_service
@@ -27,6 +24,21 @@ from .format import ROLES_MAP
 from .format import get_msg_content


+with lang.auto_proxy_import(globals()):
+    import llama_cpp as lcc
+
+    from .....backends import llamacpp as lcu
+
+
+##
+
+
+# @omlish-manifest $.minichain.backends.strings.manifests.BackendStringsManifest(
+#     ['ChatChoicesService'],
+#     'llamacpp',
+# )
+
+
 ##

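Note: `lang.auto_proxy_import` (used above) defers the heavy `llama_cpp` import until a deferred name is first touched, so importing the backend module stays cheap even when llama-cpp is absent. A rough stand-in for the idea using only the standard library (an illustration of lazy module attributes via PEP 562, not omlish's implementation; the alias mapping is hypothetical):

    import importlib
    import typing as ta

    # hypothetical alias -> module mapping; resolved on first attribute access
    _LAZY_MODULES: ta.Mapping[str, str] = {
        'lcc': 'llama_cpp',
    }


    def __getattr__(name: str) -> ta.Any:
        # called only when `name` is not already a module global
        try:
            return importlib.import_module(_LAZY_MODULES[name])
        except KeyError:
            raise AttributeError(name) from None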
ommlds/minichain/backends/impls/llamacpp/completion.py

@@ -2,11 +2,9 @@ import contextlib
 import os.path
 import typing as ta

-import llama_cpp as lcc
-
+from omlish import lang
 from omlish import typedvalues as tv

-from .....backends import llamacpp as lcu
 from ....completion import CompletionOption
 from ....completion import CompletionRequest
 from ....completion import CompletionResponse
@@ -18,6 +16,12 @@ from ....llms.types import Temperature
 from ....models.configs import ModelPath


+with lang.auto_proxy_import(globals()):
+    import llama_cpp as lcc
+
+    from .....backends import llamacpp as lcu
+
+
 ##

ommlds/minichain/backends/impls/llamacpp/stream.py

@@ -2,20 +2,17 @@ import contextlib
 import threading
 import typing as ta  # noqa

-import llama_cpp as lcc
-
 from omlish import check
 from omlish import lang
 from omlish import typedvalues as tv

-from .....backends import llamacpp as lcu
 from ....chat.choices.services import ChatChoicesOutputs
-from ....chat.stream.services import ChatChoicesStreamRequest
-from ....chat.stream.services import ChatChoicesStreamResponse
-from ....chat.stream.services import static_check_is_chat_choices_stream_service
-from ....chat.stream.types import AiChoiceDeltas
-from ....chat.stream.types import AiChoicesDeltas
-from ....chat.stream.types import ContentAiChoiceDelta
+from ....chat.choices.stream.services import ChatChoicesStreamRequest
+from ....chat.choices.stream.services import ChatChoicesStreamResponse
+from ....chat.choices.stream.services import static_check_is_chat_choices_stream_service
+from ....chat.choices.stream.types import AiChoiceDeltas
+from ....chat.choices.stream.types import AiChoicesDeltas
+from ....chat.stream.types import ContentAiDelta
 from ....configs import Config
 from ....models.configs import ModelPath
 from ....resources import UseResources
@@ -26,6 +23,21 @@ from .format import ROLES_MAP
 from .format import get_msg_content


+with lang.auto_proxy_import(globals()):
+    import llama_cpp as lcc
+
+    from .....backends import llamacpp as lcu
+
+
+##
+
+
+# @omlish-manifest $.minichain.backends.strings.manifests.BackendStringsManifest(
+#     ['ChatChoicesStreamService'],
+#     'llamacpp',
+# )
+
+
 ##


@@ -76,18 +88,25 @@ class LlamacppChatChoicesStreamService(lang.ExitStacked):
         rs.enter_context(lang.defer(close_output))

         async def inner(sink: StreamResponseSink[AiChoicesDeltas]) -> ta.Sequence[ChatChoicesOutputs] | None:
+            last_role: ta.Any = None
+
             for chunk in output:
                 check.state(chunk['object'] == 'chat.completion.chunk')
-                l: list[AiChoiceDeltas] = []
-                for choice in chunk['choices']:
-                    # FIXME: check role is assistant
-                    # FIXME: stop reason
-                    if not (delta := choice.get('delta', {})):
-                        continue
-                    if not (content := delta.get('content', '')):
-                        continue
-                    l.append(AiChoiceDeltas([ContentAiChoiceDelta(content)]))
-                await sink.emit(AiChoicesDeltas(l))
+
+                choice = check.single(chunk['choices'])
+
+                if not (delta := choice.get('delta', {})):
+                    continue
+
+                # FIXME: check role is assistant
+                if (role := delta.get('role')) != last_role:
+                    last_role = role
+
+                # FIXME: stop reason
+
+                if (content := delta.get('content', '')):
+                    await sink.emit(AiChoicesDeltas([AiChoiceDeltas([ContentAiDelta(content)])]))
+
             return None

         return await new_stream_response(rs, inner)
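The rewritten loop above requires exactly one choice per chunk and tracks role announcements instead of silently dropping them. A standalone sketch of the same delta handling, assuming OpenAI-style `chat.completion.chunk` dicts as llama-cpp emits them (function name is illustrative, not the package's API):

    import typing as ta


    def iter_content_deltas(chunks: ta.Iterable[dict]) -> ta.Iterator[str]:
        last_role = None
        for chunk in chunks:
            assert chunk['object'] == 'chat.completion.chunk'
            [choice] = chunk['choices']  # the service checks for exactly one choice
            if not (delta := choice.get('delta', {})):
                continue
            if (role := delta.get('role')) != last_role:
                last_role = role  # role typically arrives on the first delta of a turn
            if (content := delta.get('content', '')):
                yield content


    # Example:
    chunks = [{'object': 'chat.completion.chunk',
               'choices': [{'delta': {'role': 'assistant', 'content': 'Hi'}}]}]
    assert list(iter_content_deltas(chunks)) == ['Hi']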
ommlds/minichain/backends/impls/mistral.py

@@ -40,10 +40,16 @@ class MistralChatChoicesService:
         AiMessage: 'assistant',
     }

-    def __init__(self, *, api_key: str | None = None) -> None:
+    def __init__(
+            self,
+            *,
+            api_key: str | None = None,
+            http_client: http.AsyncHttpClient | None = None,
+    ) -> None:
         super().__init__()

         self._api_key = api_key
+        self._http_client = http_client

     def _get_msg_content(self, m: Message) -> str | None:
         if isinstance(m, AiMessage):
@@ -73,7 +79,7 @@ class MistralChatChoicesService:
             ],
         }

-        resp = http.request(
+        resp = await http.async_request(
             'https://api.mistral.ai/v1/chat/completions',
             method='POST',
             data=json.dumps_compact(req_dct).encode('utf-8'),
@@ -82,6 +88,7 @@ class MistralChatChoicesService:
                 'Accept': 'application/json',
                 'Authorization': f'Bearer {key}',
             },
+            client=self._http_client,
         )

         if resp.status == 429:
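The same optional `http_client` keyword is threaded through most backends in this release, alongside the move from synchronous `http.request` to `await http.async_request(..., client=...)`. A minimal sketch of the constructor pattern with a hypothetical stand-in protocol (injection enables test doubles and shared connection pooling; `None` falls back to the library default at call time):

    import typing as ta


    class AsyncHttpClient(ta.Protocol):  # hypothetical stand-in, not omlish's type
        async def request(self, url: str, **kwargs: ta.Any) -> ta.Any: ...


    class SomeApiService:
        def __init__(
                self,
                *,
                api_key: str | None = None,
                http_client: AsyncHttpClient | None = None,  # None -> default client
        ) -> None:
            super().__init__()

            self._api_key = api_key
            self._http_client = http_client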
ommlds/minichain/backends/impls/mlx/chat.py

@@ -1,32 +1,46 @@
+import contextlib
 import typing as ta

 from omlish import check
 from omlish import lang
 from omlish import typedvalues as tv

-from .....backends import mlx as mlxu
+from ....chat.choices.services import ChatChoicesOutputs
 from ....chat.choices.services import ChatChoicesRequest
 from ....chat.choices.services import ChatChoicesResponse
 from ....chat.choices.services import static_check_is_chat_choices_service
+from ....chat.choices.stream.services import ChatChoicesStreamRequest
+from ....chat.choices.stream.services import ChatChoicesStreamResponse
+from ....chat.choices.stream.services import static_check_is_chat_choices_stream_service
+from ....chat.choices.stream.types import AiChoiceDeltas
+from ....chat.choices.stream.types import AiChoicesDeltas
 from ....chat.choices.types import AiChoice
 from ....chat.choices.types import ChatChoicesOptions
 from ....chat.messages import AiMessage
 from ....chat.messages import Message
 from ....chat.messages import SystemMessage
 from ....chat.messages import UserMessage
+from ....chat.stream.types import ContentAiDelta
 from ....configs import Config
 from ....llms.types import MaxTokens
 from ....models.configs import ModelPath
 from ....models.configs import ModelRepo
 from ....models.configs import ModelSpecifier
+from ....resources import UseResources
 from ....standard import DefaultOptions
+from ....stream.services import StreamResponseSink
+from ....stream.services import new_stream_response
+
+
+with lang.auto_proxy_import(globals()):
+    from .....backends import mlx as mlxu


 ##


 # @omlish-manifest $.minichain.backends.strings.manifests.BackendStringsManifest(
-#     ['ChatChoicesService'],
+#     ['ChatChoicesService', 'ChatChoicesStreamService'],
 #     'mlx',
 # )

@@ -34,12 +48,7 @@ from ....standard import DefaultOptions
 ##


-# @omlish-manifest $.minichain.registries.manifests.RegistryManifest(
-#     name='mlx',
-#     type='ChatChoicesService',
-# )
-@static_check_is_chat_choices_service
-class MlxChatChoicesService(lang.ExitStacked):
+class BaseMlxChatChoicesService(lang.ExitStacked):
     DEFAULT_MODEL: ta.ClassVar[ModelSpecifier] = (
         # 'mlx-community/DeepSeek-Coder-V2-Lite-Instruct-8bit'
         # 'mlx-community/Llama-3.3-70B-Instruct-4bit'
@@ -52,8 +61,8 @@ class MlxChatChoicesService(lang.ExitStacked):
         # 'mlx-community/Qwen2.5-0.5B-4bit'
         # 'mlx-community/Qwen2.5-32B-Instruct-8bit'
         # 'mlx-community/Qwen2.5-Coder-32B-Instruct-8bit'
-        # 'mlx-community/mamba-2.8b-hf-f16'
         # 'mlx-community/Qwen3-30B-A3B-6bit'
+        # 'mlx-community/mamba-2.8b-hf-f16'
     )

     def __init__(self, *configs: Config) -> None:
@@ -70,17 +79,14 @@ class MlxChatChoicesService(lang.ExitStacked):
     }

     def _get_msg_content(self, m: Message) -> str | None:
-        if isinstance(m, AiMessage):
-            return check.isinstance(m.c, str)
-
-        elif isinstance(m, (SystemMessage, UserMessage)):
+        if isinstance(m, (AiMessage, SystemMessage, UserMessage)):
             return check.isinstance(m.c, str)

         else:
             raise TypeError(m)

     @lang.cached_function(transient=True)
-    def _load_model(self) -> mlxu.LoadedModel:
+    def _load_model(self) -> 'mlxu.LoadedModel':
         # FIXME: walk state, find all mx.arrays, dealloc/set to empty
         check.not_none(self._exit_stack)

@@ -96,10 +102,9 @@ class MlxChatChoicesService(lang.ExitStacked):
         max_tokens=MaxTokens,
     )

-    async def invoke(self, request: ChatChoicesRequest) -> ChatChoicesResponse:
-        loaded_model = self._load_model()
-
-        tokenizer = loaded_model.tokenization.tokenizer
+    @lang.cached_function(transient=True)
+    def _get_tokenizer(self) -> 'mlxu.tokenization.Tokenizer':
+        tokenizer = self._load_model().tokenization.tokenizer

         if not (
             hasattr(tokenizer, 'apply_chat_template') and
@@ -107,26 +112,44 @@ class MlxChatChoicesService(lang.ExitStacked):
         ):
             raise RuntimeError(tokenizer)

-        prompt = tokenizer.apply_chat_template(
+        return tokenizer
+
+    def _build_prompt(self, messages: ta.Sequence[Message]) -> str:
+        return check.isinstance(self._get_tokenizer().apply_chat_template(
             [  # type: ignore[arg-type]
                 dict(
                     role=self.ROLES_MAP[type(m)],
                     content=self._get_msg_content(m),
                 )
-                for m in request.v
+                for m in messages
             ],
             tokenize=False,
             add_generation_prompt=True,
-        )
+        ), str)
+
+    def _build_kwargs(self, oc: tv.TypedValuesConsumer) -> dict[str, ta.Any]:
+        kwargs: dict[str, ta.Any] = {}
+        kwargs.update(oc.pop_scalar_kwargs(**self._OPTION_KWARG_NAMES_MAP))
+        return kwargs

-        kwargs = dict()
+
+# @omlish-manifest $.minichain.registries.manifests.RegistryManifest(
+#     name='mlx',
+#     type='ChatChoicesService',
+# )
+@static_check_is_chat_choices_service
+class MlxChatChoicesService(BaseMlxChatChoicesService):
+    async def invoke(self, request: ChatChoicesRequest) -> ChatChoicesResponse:
+        loaded_model = self._load_model()
+
+        prompt = self._build_prompt(request.v)

         with tv.consume(
             *self._default_options,
             *request.options,
             override=True,
         ) as oc:
-            kwargs.update(oc.pop_scalar_kwargs(**self._OPTION_KWARG_NAMES_MAP))
+            kwargs = self._build_kwargs(oc)

         response = mlxu.generate(
             loaded_model.model,
@@ -139,3 +162,57 @@ class MlxChatChoicesService(lang.ExitStacked):
         return ChatChoicesResponse([
             AiChoice([AiMessage(response)])  # noqa
         ])
+
+
+# @omlish-manifest $.minichain.registries.manifests.RegistryManifest(
+#     name='mlx',
+#     type='ChatChoicesStreamService',
+# )
+@static_check_is_chat_choices_stream_service
+class MlxChatChoicesStreamService(BaseMlxChatChoicesService):
+    def __init__(self, *configs: Config) -> None:
+        super().__init__()
+
+        with tv.consume(*configs) as cc:
+            self._model = cc.pop(MlxChatChoicesService.DEFAULT_MODEL)
+            self._default_options: tv.TypedValues = DefaultOptions.pop(cc)
+
+    READ_CHUNK_SIZE = 64 * 1024
+
+    async def invoke(
+            self,
+            request: ChatChoicesStreamRequest,
+            *,
+            max_tokens: int = 4096,  # FIXME: ChatOption
+    ) -> ChatChoicesStreamResponse:
+        loaded_model = self._load_model()
+
+        prompt = self._build_prompt(request.v)
+
+        with tv.consume(
+            *self._default_options,
+            *request.options,
+            override=True,
+        ) as oc:
+            oc.pop(UseResources, None)
+            kwargs = self._build_kwargs(oc)
+
+        async with UseResources.or_new(request.options) as rs:
+            gen: ta.Iterator[mlxu.GenerationOutput] = rs.enter_context(contextlib.closing(mlxu.stream_generate(
+                loaded_model.model,
+                loaded_model.tokenization,
+                check.isinstance(prompt, str),
+                mlxu.GenerationParams(**kwargs),
+                # verbose=True,
+            )))
+
+            async def inner(sink: StreamResponseSink[AiChoicesDeltas]) -> ta.Sequence[ChatChoicesOutputs]:
+                for go in gen:
+                    if go.text:
+                        await sink.emit(AiChoicesDeltas([AiChoiceDeltas([
+                            ContentAiDelta(go.text),
+                        ])]))
+
+                return []
+
+            return await new_stream_response(rs, inner)
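`new_stream_response` and `StreamResponseSink` are minichain internals; conceptually, `inner` is a callback that pushes deltas into a sink owned by the stream response. A simplified asyncio model of that shape, under the assumption that the sink is queue-backed (a sketch, not the real API):

    import asyncio
    import typing as ta


    class Sink:
        def __init__(self) -> None:
            self.q: asyncio.Queue[str | None] = asyncio.Queue()

        async def emit(self, delta: str) -> None:
            await self.q.put(delta)


    async def new_stream_response(inner: ta.Callable[[Sink], ta.Awaitable[None]]) -> ta.AsyncIterator[str]:
        # runs `inner`, draining its emitted deltas to the consumer
        sink = Sink()

        async def run() -> None:
            await inner(sink)
            await sink.q.put(None)  # sentinel: stream finished

        task = asyncio.create_task(run())
        while (d := await sink.q.get()) is not None:
            yield d
        await task


    async def demo() -> None:
        async def inner(sink: Sink) -> None:
            for text in ('he', 'llo'):  # stands in for a token generator
                await sink.emit(text)

        print(''.join([d async for d in new_stream_response(inner)]))  # prints 'hello'


    asyncio.run(demo())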
File without changes
ommlds/minichain/backends/impls/ollama/chat.py (new file)

@@ -0,0 +1,199 @@
+import typing as ta
+
+from omlish import check
+from omlish import lang
+from omlish import marshal as msh
+from omlish import typedvalues as tv
+from omlish.formats import json
+from omlish.http import all as http
+from omlish.io.buffers import DelimitingBuffer
+
+from .....backends.ollama import protocol as pt
+from ....chat.choices.services import ChatChoicesOutputs
+from ....chat.choices.services import ChatChoicesRequest
+from ....chat.choices.services import ChatChoicesResponse
+from ....chat.choices.services import static_check_is_chat_choices_service
+from ....chat.choices.stream.services import ChatChoicesStreamRequest
+from ....chat.choices.stream.services import ChatChoicesStreamResponse
+from ....chat.choices.stream.services import static_check_is_chat_choices_stream_service
+from ....chat.choices.stream.types import AiChoiceDeltas
+from ....chat.choices.stream.types import AiChoicesDeltas
+from ....chat.choices.types import AiChoice
+from ....chat.messages import AiMessage
+from ....chat.messages import AnyAiMessage
+from ....chat.messages import Message
+from ....chat.messages import SystemMessage
+from ....chat.messages import UserMessage
+from ....chat.stream.types import ContentAiDelta
+from ....models.configs import ModelName
+from ....resources import UseResources
+from ....standard import ApiUrl
+from ....stream.services import StreamResponseSink
+from ....stream.services import new_stream_response
+
+
+##
+
+
+# @omlish-manifest $.minichain.backends.strings.manifests.BackendStringsManifest(
+#     [
+#         'ChatChoicesService',
+#         'ChatChoicesStreamService',
+#     ],
+#     'ollama',
+# )
+
+
+##
+
+
+class BaseOllamaChatChoicesService(lang.Abstract):
+    DEFAULT_API_URL: ta.ClassVar[ApiUrl] = ApiUrl('http://localhost:11434/api')
+    DEFAULT_MODEL_NAME: ta.ClassVar[ModelName] = ModelName('llama3.2')
+
+    def __init__(
+            self,
+            *configs: ApiUrl | ModelName,
+            http_client: http.AsyncHttpClient | None = None,
+    ) -> None:
+        super().__init__()
+
+        self._http_client = http_client
+
+        with tv.consume(*configs) as cc:
+            self._api_url = cc.pop(self.DEFAULT_API_URL)
+            self._model_name = cc.pop(self.DEFAULT_MODEL_NAME)
+
+    #
+
+    ROLE_MAP: ta.ClassVar[ta.Mapping[type[Message], pt.Role]] = {  # noqa
+        SystemMessage: 'system',
+        UserMessage: 'user',
+        AiMessage: 'assistant',
+    }
+
+    @classmethod
+    def _get_message_content(cls, m: Message) -> str | None:
+        if isinstance(m, (AiMessage, UserMessage, SystemMessage)):
+            return check.isinstance(m.c, str)
+        else:
+            raise TypeError(m)
+
+    @classmethod
+    def _build_request_messages(cls, mc_msgs: ta.Iterable[Message]) -> ta.Sequence[pt.Message]:
+        messages: list[pt.Message] = []
+        for m in mc_msgs:
+            messages.append(pt.Message(
+                role=cls.ROLE_MAP[type(m)],
+                content=cls._get_message_content(m),
+            ))
+        return messages
+
+
+##
+
+
+# @omlish-manifest $.minichain.registries.manifests.RegistryManifest(
+#     name='ollama',
+#     type='ChatChoicesService',
+# )
+@static_check_is_chat_choices_service
+class OllamaChatChoicesService(BaseOllamaChatChoicesService):
+    async def invoke(
+            self,
+            request: ChatChoicesRequest,
+    ) -> ChatChoicesResponse:
+        messages = self._build_request_messages(request.v)
+
+        a_req = pt.ChatRequest(
+            model=self._model_name.v,
+            messages=messages,
+            # tools=tools or None,
+            stream=False,
+        )
+
+        raw_request = msh.marshal(a_req)
+
+        async with http.manage_async_client(self._http_client) as http_client:
+            raw_response = await http_client.request(http.HttpRequest(
+                self._api_url.v.removesuffix('/') + '/chat',
+                data=json.dumps(raw_request).encode('utf-8'),
+            ))
+
+        json_response = json.loads(check.not_none(raw_response.data).decode('utf-8'))
+
+        resp = msh.unmarshal(json_response, pt.ChatResponse)
+
+        out: list[AnyAiMessage] = []
+        if resp.message.role == 'assistant':
+            out.append(AiMessage(
+                check.not_none(resp.message.content),
+            ))
+        else:
+            raise TypeError(resp.message.role)
+
+        return ChatChoicesResponse([
+            AiChoice(out),
+        ])
+
+
+##
+
+
+# @omlish-manifest $.minichain.registries.manifests.RegistryManifest(
+#     name='ollama',
+#     type='ChatChoicesStreamService',
+# )
+@static_check_is_chat_choices_stream_service
+class OllamaChatChoicesStreamService(BaseOllamaChatChoicesService):
+    READ_CHUNK_SIZE: ta.ClassVar[int] = -1
+
+    async def invoke(
+            self,
+            request: ChatChoicesStreamRequest,
+    ) -> ChatChoicesStreamResponse:
+        messages = self._build_request_messages(request.v)
+
+        a_req = pt.ChatRequest(
+            model=self._model_name.v,
+            messages=messages,
+            # tools=tools or None,
+            stream=True,
+        )
+
+        raw_request = msh.marshal(a_req)
+
+        http_request = http.HttpRequest(
+            self._api_url.v.removesuffix('/') + '/chat',
+            data=json.dumps(raw_request).encode('utf-8'),
+        )
+
+        async with UseResources.or_new(request.options) as rs:
+            http_client = await rs.enter_async_context(http.manage_async_client(self._http_client))
+            http_response = await rs.enter_async_context(await http_client.stream_request(http_request))
+
+            async def inner(sink: StreamResponseSink[AiChoicesDeltas]) -> ta.Sequence[ChatChoicesOutputs] | None:
+                db = DelimitingBuffer([b'\r', b'\n', b'\r\n'])
+                while True:
+                    b = await http_response.stream.read1(self.READ_CHUNK_SIZE)
+                    for l in db.feed(b):
+                        if isinstance(l, DelimitingBuffer.Incomplete):
+                            # FIXME: handle
+                            return []
+
+                        lj = json.loads(l.decode('utf-8'))
+                        lp: pt.ChatResponse = msh.unmarshal(lj, pt.ChatResponse)
+
+                        check.state(lp.message.role == 'assistant')
+                        check.none(lp.message.tool_name)
+                        check.state(not lp.message.tool_calls)
+
+                        if (c := lp.message.content):
+                            await sink.emit(AiChoicesDeltas([AiChoiceDeltas([ContentAiDelta(
+                                c,
+                            )])]))
+
+                    if not b:
+                        return []
+
+            return await new_stream_response(rs, inner)
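Ollama's streaming /api/chat endpoint responds with newline-delimited JSON objects, which the `DelimitingBuffer` loop above reassembles across arbitrary read boundaries. A dependency-free sketch of the same splitting (a hypothetical helper, not the package's code):

    import json


    def parse_ndjson_chunks(chunks):
        """Yield parsed JSON objects from byte chunks, splitting on CR/LF."""
        buf = b''
        for chunk in chunks:
            buf += chunk
            *lines, buf = buf.replace(b'\r\n', b'\n').replace(b'\r', b'\n').split(b'\n')
            for line in lines:
                if line:
                    yield json.loads(line.decode('utf-8'))
        if buf:  # trailing bytes with no delimiter ("Incomplete" in the diff)
            yield json.loads(buf.decode('utf-8'))


    # Example: a message split across two reads still parses cleanly.
    chunks = [b'{"message": {"role": "assistant", "content": "Hi"}}\n{"done"',
              b': true}\n']
    m1, m2 = parse_ndjson_chunks(chunks)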
ommlds/minichain/backends/impls/openai/chat.py

@@ -26,9 +26,9 @@ from ....chat.choices.services import static_check_is_chat_choices_service
 from ....models.configs import ModelName
 from ....standard import ApiKey
 from ....standard import DefaultOptions
-from .format2 import OpenaiChatRequestHandler
-from .format2 import build_mc_choices_response
-from .names import MODEL_NAMES
+from .format import OpenaiChatRequestHandler
+from .format import build_mc_choices_response
+from .names import CHAT_MODEL_NAMES


 ##
@@ -40,11 +40,17 @@ from .names import MODEL_NAMES
 # )
 @static_check_is_chat_choices_service
 class OpenaiChatChoicesService:
-    DEFAULT_MODEL_NAME: ta.ClassVar[ModelName] = ModelName(check.not_none(MODEL_NAMES.default))
+    DEFAULT_MODEL_NAME: ta.ClassVar[ModelName] = ModelName(check.not_none(CHAT_MODEL_NAMES.default))

-    def __init__(self, *configs: ApiKey | ModelName | DefaultOptions) -> None:
+    def __init__(
+            self,
+            *configs: ApiKey | ModelName | DefaultOptions,
+            http_client: http.AsyncHttpClient | None = None,
+    ) -> None:
         super().__init__()

+        self._http_client = http_client
+
         with tv.consume(*configs) as cc:
             self._model_name = cc.pop(self.DEFAULT_MODEL_NAME)
             self._api_key = ApiKey.pop_secret(cc, env='OPENAI_API_KEY')
@@ -60,7 +66,7 @@ class OpenaiChatChoicesService:
                 *request.options,
                 override=True,
             ),
-            model=MODEL_NAMES.resolve(self._model_name.v),
+            model=CHAT_MODEL_NAMES.resolve(self._model_name.v),
             mandatory_kwargs=dict(
                 stream=False,
             ),
@@ -68,13 +74,14 @@

         raw_request = msh.marshal(rh.oai_request())

-        http_response = http.request(
+        http_response = await http.async_request(
             'https://api.openai.com/v1/chat/completions',
             headers={
                 http.consts.HEADER_CONTENT_TYPE: http.consts.CONTENT_TYPE_JSON,
                 http.consts.HEADER_AUTH: http.consts.format_bearer_auth_header(check.not_none(self._api_key).reveal()),
             },
             data=json.dumps(raw_request).encode('utf-8'),
+            client=self._http_client,
         )

         raw_response = json.loads(check.not_none(http_response.data).decode('utf-8'))
ommlds/minichain/backends/impls/openai/completion.py

@@ -23,9 +23,15 @@ from ....standard import ApiKey
 class OpenaiCompletionService:
     DEFAULT_MODEL_NAME: ta.ClassVar[str] = 'gpt-3.5-turbo-instruct'

-    def __init__(self, *configs: Config) -> None:
+    def __init__(
+            self,
+            *configs: Config,
+            http_client: http.AsyncHttpClient | None = None,
+    ) -> None:
         super().__init__()

+        self._http_client = http_client
+
         with tv.consume(*configs) as cc:
             self._api_key = ApiKey.pop_secret(cc, env='OPENAI_API_KEY')
@@ -41,13 +47,14 @@
             stream=False,
         )

-        raw_response = http.request(
+        raw_response = await http.async_request(
             'https://api.openai.com/v1/completions',
             headers={
                 http.consts.HEADER_CONTENT_TYPE: http.consts.CONTENT_TYPE_JSON,
                 http.consts.HEADER_AUTH: http.consts.format_bearer_auth_header(check.not_none(self._api_key).reveal()),
             },
             data=json.dumps(raw_request).encode('utf-8'),
+            client=self._http_client,
         )

         response = json.loads(check.not_none(raw_response.data).decode('utf-8'))