ommlds 0.0.0.dev440__py3-none-any.whl → 0.0.0.dev480__py3-none-any.whl

This diff compares the contents of two publicly released versions of the package as published to a supported registry. It is provided for informational purposes only and reflects the package versions as they appear in that public registry.
Files changed (271)
  1. ommlds/.omlish-manifests.json +332 -35
  2. ommlds/__about__.py +15 -9
  3. ommlds/_hacks/__init__.py +4 -0
  4. ommlds/_hacks/funcs.py +110 -0
  5. ommlds/_hacks/names.py +158 -0
  6. ommlds/_hacks/params.py +73 -0
  7. ommlds/_hacks/patches.py +0 -3
  8. ommlds/backends/anthropic/protocol/_marshal.py +2 -2
  9. ommlds/backends/anthropic/protocol/sse/_marshal.py +1 -1
  10. ommlds/backends/anthropic/protocol/sse/assemble.py +23 -7
  11. ommlds/backends/anthropic/protocol/sse/events.py +13 -0
  12. ommlds/backends/anthropic/protocol/types.py +30 -9
  13. ommlds/backends/google/protocol/__init__.py +3 -0
  14. ommlds/backends/google/protocol/_marshal.py +16 -0
  15. ommlds/backends/google/protocol/types.py +626 -0
  16. ommlds/backends/groq/_marshal.py +23 -0
  17. ommlds/backends/groq/protocol.py +249 -0
  18. ommlds/backends/mlx/generation.py +1 -1
  19. ommlds/backends/mlx/loading.py +58 -1
  20. ommlds/backends/ollama/__init__.py +0 -0
  21. ommlds/backends/ollama/protocol.py +170 -0
  22. ommlds/backends/openai/protocol/__init__.py +9 -28
  23. ommlds/backends/openai/protocol/_common.py +18 -0
  24. ommlds/backends/openai/protocol/_marshal.py +27 -0
  25. ommlds/backends/openai/protocol/chatcompletion/chunk.py +58 -31
  26. ommlds/backends/openai/protocol/chatcompletion/contentpart.py +49 -44
  27. ommlds/backends/openai/protocol/chatcompletion/message.py +55 -43
  28. ommlds/backends/openai/protocol/chatcompletion/request.py +114 -66
  29. ommlds/backends/openai/protocol/chatcompletion/response.py +71 -45
  30. ommlds/backends/openai/protocol/chatcompletion/responseformat.py +27 -20
  31. ommlds/backends/openai/protocol/chatcompletion/tokenlogprob.py +16 -7
  32. ommlds/backends/openai/protocol/completionusage.py +24 -15
  33. ommlds/backends/tavily/__init__.py +0 -0
  34. ommlds/backends/tavily/protocol.py +301 -0
  35. ommlds/backends/tinygrad/models/llama3/__init__.py +22 -14
  36. ommlds/backends/transformers/__init__.py +0 -0
  37. ommlds/backends/transformers/filecache.py +109 -0
  38. ommlds/backends/transformers/streamers.py +73 -0
  39. ommlds/cli/asyncs.py +30 -0
  40. ommlds/cli/backends/catalog.py +93 -0
  41. ommlds/cli/backends/configs.py +9 -0
  42. ommlds/cli/backends/inject.py +31 -36
  43. ommlds/cli/backends/injection.py +16 -0
  44. ommlds/cli/backends/types.py +46 -0
  45. ommlds/cli/content/__init__.py +0 -0
  46. ommlds/cli/content/messages.py +34 -0
  47. ommlds/cli/content/strings.py +42 -0
  48. ommlds/cli/inject.py +15 -32
  49. ommlds/cli/inputs/__init__.py +0 -0
  50. ommlds/cli/inputs/asyncs.py +32 -0
  51. ommlds/cli/inputs/sync.py +75 -0
  52. ommlds/cli/main.py +270 -110
  53. ommlds/cli/rendering/__init__.py +0 -0
  54. ommlds/cli/rendering/configs.py +9 -0
  55. ommlds/cli/rendering/inject.py +31 -0
  56. ommlds/cli/rendering/markdown.py +52 -0
  57. ommlds/cli/rendering/raw.py +73 -0
  58. ommlds/cli/rendering/types.py +21 -0
  59. ommlds/cli/secrets.py +21 -0
  60. ommlds/cli/sessions/base.py +1 -1
  61. ommlds/cli/sessions/chat/chat/__init__.py +0 -0
  62. ommlds/cli/sessions/chat/chat/ai/__init__.py +0 -0
  63. ommlds/cli/sessions/chat/chat/ai/configs.py +11 -0
  64. ommlds/cli/sessions/chat/chat/ai/inject.py +74 -0
  65. ommlds/cli/sessions/chat/chat/ai/injection.py +14 -0
  66. ommlds/cli/sessions/chat/chat/ai/rendering.py +70 -0
  67. ommlds/cli/sessions/chat/chat/ai/services.py +79 -0
  68. ommlds/cli/sessions/chat/chat/ai/tools.py +44 -0
  69. ommlds/cli/sessions/chat/chat/ai/types.py +28 -0
  70. ommlds/cli/sessions/chat/chat/state/__init__.py +0 -0
  71. ommlds/cli/sessions/chat/chat/state/configs.py +11 -0
  72. ommlds/cli/sessions/chat/chat/state/inject.py +36 -0
  73. ommlds/cli/sessions/chat/chat/state/inmemory.py +33 -0
  74. ommlds/cli/sessions/chat/chat/state/storage.py +52 -0
  75. ommlds/cli/sessions/chat/chat/state/types.py +38 -0
  76. ommlds/cli/sessions/chat/chat/user/__init__.py +0 -0
  77. ommlds/cli/sessions/chat/chat/user/configs.py +17 -0
  78. ommlds/cli/sessions/chat/chat/user/inject.py +62 -0
  79. ommlds/cli/sessions/chat/chat/user/interactive.py +31 -0
  80. ommlds/cli/sessions/chat/chat/user/oneshot.py +25 -0
  81. ommlds/cli/sessions/chat/chat/user/types.py +15 -0
  82. ommlds/cli/sessions/chat/configs.py +27 -0
  83. ommlds/cli/sessions/chat/driver.py +43 -0
  84. ommlds/cli/sessions/chat/inject.py +33 -65
  85. ommlds/cli/sessions/chat/phases/__init__.py +0 -0
  86. ommlds/cli/sessions/chat/phases/inject.py +27 -0
  87. ommlds/cli/sessions/chat/phases/injection.py +14 -0
  88. ommlds/cli/sessions/chat/phases/manager.py +29 -0
  89. ommlds/cli/sessions/chat/phases/types.py +29 -0
  90. ommlds/cli/sessions/chat/session.py +27 -0
  91. ommlds/cli/sessions/chat/tools/__init__.py +0 -0
  92. ommlds/cli/sessions/chat/tools/configs.py +22 -0
  93. ommlds/cli/sessions/chat/tools/confirmation.py +46 -0
  94. ommlds/cli/sessions/chat/tools/execution.py +66 -0
  95. ommlds/cli/sessions/chat/tools/fs/__init__.py +0 -0
  96. ommlds/cli/sessions/chat/tools/fs/configs.py +12 -0
  97. ommlds/cli/sessions/chat/tools/fs/inject.py +35 -0
  98. ommlds/cli/sessions/chat/tools/inject.py +88 -0
  99. ommlds/cli/sessions/chat/tools/injection.py +44 -0
  100. ommlds/cli/sessions/chat/tools/rendering.py +58 -0
  101. ommlds/cli/sessions/chat/tools/todo/__init__.py +0 -0
  102. ommlds/cli/sessions/chat/tools/todo/configs.py +12 -0
  103. ommlds/cli/sessions/chat/tools/todo/inject.py +31 -0
  104. ommlds/cli/sessions/chat/tools/weather/__init__.py +0 -0
  105. ommlds/cli/sessions/chat/tools/weather/configs.py +12 -0
  106. ommlds/cli/sessions/chat/tools/weather/inject.py +22 -0
  107. ommlds/cli/{tools/weather.py → sessions/chat/tools/weather/tools.py} +1 -1
  108. ommlds/cli/sessions/completion/configs.py +21 -0
  109. ommlds/cli/sessions/completion/inject.py +42 -0
  110. ommlds/cli/sessions/completion/session.py +35 -0
  111. ommlds/cli/sessions/embedding/configs.py +21 -0
  112. ommlds/cli/sessions/embedding/inject.py +42 -0
  113. ommlds/cli/sessions/embedding/session.py +33 -0
  114. ommlds/cli/sessions/inject.py +28 -11
  115. ommlds/cli/state/__init__.py +0 -0
  116. ommlds/cli/state/inject.py +28 -0
  117. ommlds/cli/{state.py → state/storage.py} +41 -24
  118. ommlds/minichain/__init__.py +84 -24
  119. ommlds/minichain/_marshal.py +49 -9
  120. ommlds/minichain/_typedvalues.py +2 -4
  121. ommlds/minichain/backends/catalogs/base.py +20 -1
  122. ommlds/minichain/backends/catalogs/simple.py +2 -2
  123. ommlds/minichain/backends/catalogs/strings.py +10 -8
  124. ommlds/minichain/backends/impls/anthropic/chat.py +65 -27
  125. ommlds/minichain/backends/impls/anthropic/names.py +10 -8
  126. ommlds/minichain/backends/impls/anthropic/protocol.py +109 -0
  127. ommlds/minichain/backends/impls/anthropic/stream.py +111 -43
  128. ommlds/minichain/backends/impls/duckduckgo/search.py +1 -1
  129. ommlds/minichain/backends/impls/dummy/__init__.py +0 -0
  130. ommlds/minichain/backends/impls/dummy/chat.py +69 -0
  131. ommlds/minichain/backends/impls/google/chat.py +114 -22
  132. ommlds/minichain/backends/impls/google/search.py +7 -2
  133. ommlds/minichain/backends/impls/google/stream.py +219 -0
  134. ommlds/minichain/backends/impls/google/tools.py +149 -0
  135. ommlds/minichain/backends/impls/groq/__init__.py +0 -0
  136. ommlds/minichain/backends/impls/groq/chat.py +75 -0
  137. ommlds/minichain/backends/impls/groq/names.py +48 -0
  138. ommlds/minichain/backends/impls/groq/protocol.py +143 -0
  139. ommlds/minichain/backends/impls/groq/stream.py +125 -0
  140. ommlds/minichain/backends/impls/llamacpp/chat.py +33 -18
  141. ommlds/minichain/backends/impls/llamacpp/completion.py +1 -1
  142. ommlds/minichain/backends/impls/llamacpp/format.py +4 -2
  143. ommlds/minichain/backends/impls/llamacpp/stream.py +37 -20
  144. ommlds/minichain/backends/impls/mistral.py +20 -5
  145. ommlds/minichain/backends/impls/mlx/chat.py +96 -22
  146. ommlds/minichain/backends/impls/ollama/__init__.py +0 -0
  147. ommlds/minichain/backends/impls/ollama/chat.py +199 -0
  148. ommlds/minichain/backends/impls/openai/chat.py +18 -8
  149. ommlds/minichain/backends/impls/openai/completion.py +10 -3
  150. ommlds/minichain/backends/impls/openai/embedding.py +10 -3
  151. ommlds/minichain/backends/impls/openai/format.py +131 -106
  152. ommlds/minichain/backends/impls/openai/names.py +31 -5
  153. ommlds/minichain/backends/impls/openai/stream.py +43 -25
  154. ommlds/minichain/backends/impls/tavily.py +66 -0
  155. ommlds/minichain/backends/impls/tinygrad/chat.py +23 -16
  156. ommlds/minichain/backends/impls/transformers/sentence.py +1 -1
  157. ommlds/minichain/backends/impls/transformers/tokens.py +1 -1
  158. ommlds/minichain/backends/impls/transformers/transformers.py +155 -34
  159. ommlds/minichain/backends/strings/parsing.py +1 -1
  160. ommlds/minichain/backends/strings/resolving.py +4 -1
  161. ommlds/minichain/chat/_marshal.py +16 -9
  162. ommlds/minichain/chat/choices/adapters.py +4 -4
  163. ommlds/minichain/chat/choices/services.py +1 -1
  164. ommlds/minichain/chat/choices/stream/__init__.py +0 -0
  165. ommlds/minichain/chat/choices/stream/adapters.py +35 -0
  166. ommlds/minichain/chat/choices/stream/joining.py +31 -0
  167. ommlds/minichain/chat/choices/stream/services.py +45 -0
  168. ommlds/minichain/chat/choices/stream/types.py +43 -0
  169. ommlds/minichain/chat/choices/types.py +2 -2
  170. ommlds/minichain/chat/history.py +3 -3
  171. ommlds/minichain/chat/messages.py +55 -19
  172. ommlds/minichain/chat/services.py +3 -3
  173. ommlds/minichain/chat/stream/_marshal.py +16 -0
  174. ommlds/minichain/chat/stream/joining.py +85 -0
  175. ommlds/minichain/chat/stream/services.py +15 -21
  176. ommlds/minichain/chat/stream/types.py +32 -19
  177. ommlds/minichain/chat/tools/execution.py +8 -7
  178. ommlds/minichain/chat/tools/ids.py +9 -15
  179. ommlds/minichain/chat/tools/parsing.py +17 -26
  180. ommlds/minichain/chat/transforms/base.py +29 -38
  181. ommlds/minichain/chat/transforms/metadata.py +30 -4
  182. ommlds/minichain/chat/transforms/services.py +9 -11
  183. ommlds/minichain/content/_marshal.py +44 -20
  184. ommlds/minichain/content/json.py +13 -0
  185. ommlds/minichain/content/materialize.py +14 -21
  186. ommlds/minichain/content/prepare.py +4 -0
  187. ommlds/minichain/content/transforms/interleave.py +1 -1
  188. ommlds/minichain/content/transforms/squeeze.py +1 -1
  189. ommlds/minichain/content/transforms/stringify.py +1 -1
  190. ommlds/minichain/json.py +20 -0
  191. ommlds/minichain/lib/code/__init__.py +0 -0
  192. ommlds/minichain/lib/code/prompts.py +6 -0
  193. ommlds/minichain/lib/fs/binfiles.py +108 -0
  194. ommlds/minichain/lib/fs/context.py +126 -0
  195. ommlds/minichain/lib/fs/errors.py +101 -0
  196. ommlds/minichain/lib/fs/suggestions.py +36 -0
  197. ommlds/minichain/lib/fs/tools/__init__.py +0 -0
  198. ommlds/minichain/lib/fs/tools/edit.py +104 -0
  199. ommlds/minichain/lib/fs/tools/ls.py +38 -0
  200. ommlds/minichain/lib/fs/tools/read.py +115 -0
  201. ommlds/minichain/lib/fs/tools/recursivels/__init__.py +0 -0
  202. ommlds/minichain/lib/fs/tools/recursivels/execution.py +40 -0
  203. ommlds/minichain/lib/todo/__init__.py +0 -0
  204. ommlds/minichain/lib/todo/context.py +54 -0
  205. ommlds/minichain/lib/todo/tools/__init__.py +0 -0
  206. ommlds/minichain/lib/todo/tools/read.py +44 -0
  207. ommlds/minichain/lib/todo/tools/write.py +335 -0
  208. ommlds/minichain/lib/todo/types.py +60 -0
  209. ommlds/minichain/llms/_marshal.py +25 -17
  210. ommlds/minichain/llms/types.py +4 -0
  211. ommlds/minichain/registries/globals.py +18 -4
  212. ommlds/minichain/resources.py +66 -43
  213. ommlds/minichain/search.py +1 -1
  214. ommlds/minichain/services/_marshal.py +46 -39
  215. ommlds/minichain/services/facades.py +3 -3
  216. ommlds/minichain/services/services.py +1 -1
  217. ommlds/minichain/standard.py +8 -0
  218. ommlds/minichain/stream/services.py +152 -38
  219. ommlds/minichain/stream/wrap.py +22 -24
  220. ommlds/minichain/tools/_marshal.py +1 -1
  221. ommlds/minichain/tools/execution/catalog.py +2 -1
  222. ommlds/minichain/tools/execution/context.py +34 -14
  223. ommlds/minichain/tools/execution/errors.py +15 -0
  224. ommlds/minichain/tools/execution/executors.py +8 -3
  225. ommlds/minichain/tools/execution/reflect.py +40 -5
  226. ommlds/minichain/tools/fns.py +46 -9
  227. ommlds/minichain/tools/jsonschema.py +14 -5
  228. ommlds/minichain/tools/reflect.py +54 -18
  229. ommlds/minichain/tools/types.py +33 -1
  230. ommlds/minichain/utils.py +27 -0
  231. ommlds/minichain/vectors/_marshal.py +11 -10
  232. ommlds/nanochat/LICENSE +21 -0
  233. ommlds/nanochat/__init__.py +0 -0
  234. ommlds/nanochat/rustbpe/LICENSE +21 -0
  235. ommlds/nanochat/tokenizers.py +406 -0
  236. ommlds/server/server.py +3 -3
  237. ommlds/specs/__init__.py +0 -0
  238. ommlds/specs/mcp/__init__.py +0 -0
  239. ommlds/specs/mcp/_marshal.py +23 -0
  240. ommlds/specs/mcp/protocol.py +266 -0
  241. ommlds/tools/git.py +27 -10
  242. ommlds/tools/ocr.py +8 -9
  243. ommlds/wiki/analyze.py +2 -2
  244. ommlds/wiki/text/mfh.py +1 -5
  245. ommlds/wiki/text/wtp.py +1 -3
  246. ommlds/wiki/utils/xml.py +5 -5
  247. {ommlds-0.0.0.dev440.dist-info → ommlds-0.0.0.dev480.dist-info}/METADATA +24 -21
  248. ommlds-0.0.0.dev480.dist-info/RECORD +427 -0
  249. ommlds/cli/backends/standard.py +0 -20
  250. ommlds/cli/sessions/chat/base.py +0 -42
  251. ommlds/cli/sessions/chat/interactive.py +0 -73
  252. ommlds/cli/sessions/chat/printing.py +0 -96
  253. ommlds/cli/sessions/chat/prompt.py +0 -143
  254. ommlds/cli/sessions/chat/state.py +0 -109
  255. ommlds/cli/sessions/chat/tools.py +0 -91
  256. ommlds/cli/sessions/completion/completion.py +0 -44
  257. ommlds/cli/sessions/embedding/embedding.py +0 -42
  258. ommlds/cli/tools/config.py +0 -13
  259. ommlds/cli/tools/inject.py +0 -64
  260. ommlds/minichain/chat/stream/adapters.py +0 -69
  261. ommlds/minichain/lib/fs/ls/execution.py +0 -32
  262. ommlds-0.0.0.dev440.dist-info/RECORD +0 -303
  263. /ommlds/{cli/tools → backends/google}/__init__.py +0 -0
  264. /ommlds/{minichain/lib/fs/ls → backends/groq}/__init__.py +0 -0
  265. /ommlds/{huggingface.py → backends/huggingface.py} +0 -0
  266. /ommlds/minichain/lib/fs/{ls → tools/recursivels}/rendering.py +0 -0
  267. /ommlds/minichain/lib/fs/{ls → tools/recursivels}/running.py +0 -0
  268. {ommlds-0.0.0.dev440.dist-info → ommlds-0.0.0.dev480.dist-info}/WHEEL +0 -0
  269. {ommlds-0.0.0.dev440.dist-info → ommlds-0.0.0.dev480.dist-info}/entry_points.txt +0 -0
  270. {ommlds-0.0.0.dev440.dist-info → ommlds-0.0.0.dev480.dist-info}/licenses/LICENSE +0 -0
  271. {ommlds-0.0.0.dev440.dist-info → ommlds-0.0.0.dev480.dist-info}/top_level.txt +0 -0
ommlds/minichain/backends/impls/anthropic/stream.py

@@ -1,26 +1,33 @@
 import typing as ta
 
 from omlish import check
-from omlish import lang
+from omlish import marshal as msh
 from omlish import typedvalues as tv
 from omlish.formats import json
 from omlish.http import all as http
 from omlish.http import sse
 from omlish.io.buffers import DelimitingBuffer
 
+from .....backends.anthropic.protocol import types as pt
+from .....backends.anthropic.protocol.sse.events import AnthropicSseDecoderEvents
 from ....chat.choices.services import ChatChoicesOutputs
-from ....chat.messages import SystemMessage
-from ....chat.stream.services import ChatChoicesStreamRequest
-from ....chat.stream.services import ChatChoicesStreamResponse
-from ....chat.stream.services import static_check_is_chat_choices_stream_service
-from ....chat.stream.types import AiChoiceDelta
-from ....chat.stream.types import AiChoiceDeltas
+from ....chat.choices.stream.services import ChatChoicesStreamRequest
+from ....chat.choices.stream.services import ChatChoicesStreamResponse
+from ....chat.choices.stream.services import static_check_is_chat_choices_stream_service
+from ....chat.choices.stream.types import AiChoiceDeltas
+from ....chat.choices.stream.types import AiChoicesDeltas
+from ....chat.stream.types import ContentAiDelta
+from ....chat.stream.types import PartialToolUseAiDelta
+from ....chat.tools.types import Tool
 from ....configs import Config
 from ....resources import UseResources
 from ....standard import ApiKey
+from ....stream.services import StreamResponseSink
 from ....stream.services import new_stream_response
 from .chat import AnthropicChatChoicesService
 from .names import MODEL_NAMES
+from .protocol import build_protocol_chat_messages
+from .protocol import build_protocol_tool
 
 
 ##
@@ -32,42 +39,46 @@ from .names import MODEL_NAMES
 # )
 @static_check_is_chat_choices_stream_service
 class AnthropicChatChoicesStreamService:
-    def __init__(self, *configs: Config) -> None:
+    def __init__(
+            self,
+            *configs: Config,
+            http_client: http.AsyncHttpClient | None = None,
+    ) -> None:
         super().__init__()
 
+        self._http_client = http_client
+
         with tv.consume(*configs) as cc:
             self._model_name = cc.pop(AnthropicChatChoicesService.DEFAULT_MODEL_NAME)
             self._api_key = check.not_none(ApiKey.pop_secret(cc, env='ANTHROPIC_API_KEY'))
 
-    READ_CHUNK_SIZE = 64 * 1024
+    READ_CHUNK_SIZE: ta.ClassVar[int] = -1
 
-    def invoke(
+    async def invoke(
             self,
             request: ChatChoicesStreamRequest,
             *,
             max_tokens: int = 4096,  # FIXME: ChatOption
     ) -> ChatChoicesStreamResponse:
-        messages = []
-        system: str | None = None
-        for i, m in enumerate(request.v):
-            if isinstance(m, SystemMessage):
-                if i != 0 or system is not None:
-                    raise Exception('Only supports one system message and must be first')
-                system = AnthropicChatChoicesService._get_msg_content(m)  # noqa
-            else:
-                messages.append(dict(
-                    role=AnthropicChatChoicesService.ROLES_MAP[type(m)],  # noqa
-                    content=check.isinstance(AnthropicChatChoicesService._get_msg_content(m), str),  # noqa
-                ))
-
-        raw_request = dict(
+        messages, system = build_protocol_chat_messages(request.v)
+
+        tools: list[pt.ToolSpec] = []
+        with tv.TypedValues(*request.options).consume() as oc:
+            t: Tool
+            for t in oc.pop(Tool, []):
+                tools.append(build_protocol_tool(t))
+
+        a_req = pt.MessagesRequest(
             model=MODEL_NAMES.resolve(self._model_name.v),
-            **lang.opt_kw(system=system),
+            system=system,
             messages=messages,
+            tools=tools or None,
             max_tokens=max_tokens,
             stream=True,
         )
 
+        raw_request = msh.marshal(a_req)
+
         http_request = http.HttpRequest(
             'https://api.anthropic.com/v1/messages',
             headers={
@@ -78,16 +89,19 @@ class AnthropicChatChoicesStreamService:
             data=json.dumps(raw_request).encode('utf-8'),
         )
 
-        with UseResources.or_new(request.options) as rs:
-            http_client = rs.enter_context(http.client())
-            http_response = rs.enter_context(http_client.stream_request(http_request))
+        async with UseResources.or_new(request.options) as rs:
+            http_client = await rs.enter_async_context(http.manage_async_client(self._http_client))
+            http_response = await rs.enter_async_context(await http_client.stream_request(http_request))
+
+            async def inner(sink: StreamResponseSink[AiChoicesDeltas]) -> ta.Sequence[ChatChoicesOutputs] | None:
+                msg_start: AnthropicSseDecoderEvents.MessageStart | None = None
+                cbk_start: AnthropicSseDecoderEvents.ContentBlockStart | None = None
+                msg_stop: AnthropicSseDecoderEvents.MessageStop | None = None
 
-            def yield_choices() -> ta.Generator[AiChoiceDeltas, None, ta.Sequence[ChatChoicesOutputs] | None]:
                 db = DelimitingBuffer([b'\r', b'\n', b'\r\n'])
                 sd = sse.SseDecoder()
                 while True:
-                    # FIXME: read1 not on response stream protocol
-                    b = http_response.stream.read1(self.READ_CHUNK_SIZE)  # type: ignore[attr-defined]
+                    b = await http_response.stream.read1(self.READ_CHUNK_SIZE)
                     for l in db.feed(b):
                         if isinstance(l, DelimitingBuffer.Incomplete):
                             # FIXME: handle
@@ -95,29 +109,83 @@ class AnthropicChatChoicesStreamService:
 
                         # FIXME: https://docs.anthropic.com/en/docs/build-with-claude/streaming
                         for so in sd.process_line(l):
-                            # FIXME: AnthropicSseMessageAssembler lol
-                            if isinstance(so, sse.SseEvent) and so.type == b'message':
+                            if isinstance(so, sse.SseEvent):
                                 ss = so.data.decode('utf-8')
                                 if ss == '[DONE]':
                                     return []
 
-                                sj = json.loads(ss)  # ChatCompletionChunk
+                                dct = json.loads(ss)
+                                check.equal(dct['type'], so.type.decode('utf-8'))
+                                ae = msh.unmarshal(dct, AnthropicSseDecoderEvents.Event)
+
+                                match ae:
+                                    case AnthropicSseDecoderEvents.MessageStart():
+                                        check.none(msg_start)
+                                        msg_start = ae
+                                        if msg_start.message.content:
+                                            raise NotImplementedError
+
+                                    case AnthropicSseDecoderEvents.ContentBlockStart():
+                                        check.not_none(msg_start)
+                                        check.none(cbk_start)
+                                        cbk_start = ae
+
+                                        if isinstance(ae.content_block, AnthropicSseDecoderEvents.ContentBlockStart.Text):  # noqa
+                                            await sink.emit(AiChoicesDeltas([AiChoiceDeltas([ContentAiDelta(
+                                                ae.content_block.text,
+                                            )])]))
+
+                                        elif isinstance(ae.content_block, AnthropicSseDecoderEvents.ContentBlockStart.ToolUse):  # noqa
+                                            await sink.emit(AiChoicesDeltas([AiChoiceDeltas([PartialToolUseAiDelta(  # noqa
+                                                id=ae.content_block.id,
+                                                name=ae.content_block.name,
+                                                raw_args=ae.content_block.input,
+                                            )])]))
+
+                                        else:
+                                            raise TypeError(ae.content_block)
+
+                                    case AnthropicSseDecoderEvents.ContentBlockDelta():
+                                        check.not_none(cbk_start)
+
+                                        if isinstance(ae.delta, AnthropicSseDecoderEvents.ContentBlockDelta.TextDelta):
+                                            await sink.emit(AiChoicesDeltas([AiChoiceDeltas([ContentAiDelta(
+                                                ae.delta.text,
+                                            )])]))
+
+                                        elif isinstance(ae.delta, AnthropicSseDecoderEvents.ContentBlockDelta.InputJsonDelta):  # noqa
+                                            await sink.emit(AiChoicesDeltas([AiChoiceDeltas([PartialToolUseAiDelta(  # noqa
+                                                raw_args=ae.delta.partial_json,
+                                            )])]))
+
+                                        else:
+                                            raise TypeError(ae.delta)
+
+                                    case AnthropicSseDecoderEvents.ContentBlockStop():
+                                        check.not_none(cbk_start)
+                                        cbk_start = None
+
+                                    case AnthropicSseDecoderEvents.MessageDelta():
+                                        check.not_none(msg_start)
+                                        check.none(cbk_start)
 
-                                check.state(sj['object'] == 'chat.completion.chunk')
+                                    case AnthropicSseDecoderEvents.MessageStop():
+                                        check.not_none(msg_start)
+                                        check.none(msg_stop)
+                                        msg_stop = ae
 
-                                # FIXME: stop reason
-                                if not sj['choices']:
-                                    continue
+                                    case AnthropicSseDecoderEvents.Ping():
+                                        pass
 
-                                yield [
-                                    AiChoiceDelta(choice['delta'])
-                                    for choice in sj['choices']
-                                ]
+                                    case _:
+                                        raise TypeError(ae)
 
                     if not b:
+                        check.not_none(msg_stop)
+                        check.none(cbk_start)
                         return []
 
             # raw_response = json.loads(check.not_none(http_response.data).decode('utf-8'))
             # return rh.build_response(raw_response)
 
-            return new_stream_response(rs, yield_choices())
+            return await new_stream_response(rs, inner)
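Note: the streaming backend now assembles its HTTP body from typed protocol objects and marshals them instead of hand-building a dict, and it produces deltas by emitting into the sink handed to the callback passed to new_stream_response. A minimal sketch of the request-building half, assuming only the pt.MessagesRequest fields visible above; the helper name and standalone shape below are illustrative, not the package's API:

import typing as ta

from omlish import marshal as msh
from omlish.formats import json

from ommlds.backends.anthropic.protocol import types as pt


def build_request_body(
        messages: ta.Sequence[ta.Any],
        system: ta.Any,
        tools: ta.Sequence[pt.ToolSpec],
        model: str,
        max_tokens: int = 4096,
) -> bytes:
    # Assemble the typed request the same way the service above does.
    a_req = pt.MessagesRequest(
        model=model,
        system=system,
        messages=messages,
        tools=list(tools) or None,
        max_tokens=max_tokens,
        stream=True,
    )
    # Marshal to plain data and JSON-encode it for the POST body, replacing
    # the previously hand-assembled dict.
    return json.dumps(msh.marshal(a_req)).encode('utf-8')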
ommlds/minichain/backends/impls/duckduckgo/search.py

@@ -17,7 +17,7 @@ from ....search import static_check_is_search_service
 # )
 @static_check_is_search_service
 class DuckduckgoSearchService:
-    def invoke(self, request: SearchRequest) -> SearchResponse:
+    async def invoke(self, request: SearchRequest) -> SearchResponse:
         dsch = ddgs.DDGS()
         res = dsch.text(request.v)
         return SearchResponse(SearchHits(
ommlds/minichain/backends/impls/dummy/chat.py

@@ -0,0 +1,69 @@
+# ruff: noqa: PERF402
+import typing as ta
+
+from omlish.text.lorem import LOREM
+
+from ....chat.choices.services import ChatChoicesRequest
+from ....chat.choices.services import ChatChoicesResponse
+from ....chat.choices.services import static_check_is_chat_choices_service
+from ....chat.choices.stream.services import ChatChoicesStreamRequest
+from ....chat.choices.stream.services import ChatChoicesStreamResponse
+from ....chat.choices.stream.services import static_check_is_chat_choices_stream_service
+from ....chat.choices.stream.types import AiChoiceDeltas
+from ....chat.choices.stream.types import AiChoicesDeltas
+from ....chat.choices.types import AiChoice
+from ....chat.choices.types import ChatChoicesOutputs
+from ....chat.messages import AiMessage
+from ....chat.stream.types import ContentAiDelta
+from ....resources import UseResources
+from ....stream.services import StreamResponseSink
+from ....stream.services import new_stream_response
+
+
+##
+
+
+# @omlish-manifest $.minichain.registries.manifests.RegistryManifest(
+#     name='dummy',
+#     type='ChatChoicesService',
+# )
+@static_check_is_chat_choices_service
+class DummyChatChoicesService:
+    async def invoke(self, request: ChatChoicesRequest) -> ChatChoicesResponse:
+        return ChatChoicesResponse([AiChoice([AiMessage(LOREM)])])
+
+
+##
+
+
+# @omlish-manifest $.minichain.registries.manifests.RegistryManifest(
+#     name='dummy',
+#     type='ChatChoicesStreamService',
+# )
+@static_check_is_chat_choices_stream_service
+class DummyChatChoicesStreamService:
+    async def invoke(self, request: ChatChoicesStreamRequest) -> ChatChoicesStreamResponse:
+        async with UseResources.or_new(request.options) as rs:
+            async def inner(sink: StreamResponseSink[AiChoicesDeltas]) -> ta.Sequence[ChatChoicesOutputs]:
+                for s in LOREM:
+                    await sink.emit(AiChoicesDeltas([
+                        AiChoiceDeltas([
+                            ContentAiDelta(s),
+                        ]),
+                    ]))
+
+                return []
+
+            return await new_stream_response(rs, inner)
+
+
+##
+
+
+# @omlish-manifest $.minichain.backends.strings.manifests.BackendStringsManifest(
+#     [
+#         'ChatChoicesService',
+#         'ChatChoicesStreamService',
+#     ],
+#     'dummy',
+# )
ommlds/minichain/backends/impls/google/chat.py

@@ -4,21 +4,29 @@ https://cloud.google.com/vertex-ai/generative-ai/docs/learn/models
 import typing as ta
 
 from omlish import check
+from omlish import marshal as msh
 from omlish import typedvalues as tv
 from omlish.formats import json
 from omlish.http import all as http
 
+from .....backends.google.protocol import types as pt
 from ....chat.choices.services import ChatChoicesRequest
 from ....chat.choices.services import ChatChoicesResponse
 from ....chat.choices.services import static_check_is_chat_choices_service
 from ....chat.choices.types import AiChoice
 from ....chat.messages import AiMessage
+from ....chat.messages import AnyAiMessage
 from ....chat.messages import Message
 from ....chat.messages import SystemMessage
+from ....chat.messages import ToolUseMessage
+from ....chat.messages import ToolUseResultMessage
 from ....chat.messages import UserMessage
+from ....chat.tools.types import Tool
 from ....models.configs import ModelName
 from ....standard import ApiKey
+from ....tools.types import ToolUse
 from .names import MODEL_NAMES
+from .tools import build_tool_spec_schema
 
 
 ##
@@ -32,9 +40,15 @@ from .names import MODEL_NAMES
 class GoogleChatChoicesService:
     DEFAULT_MODEL_NAME: ta.ClassVar[ModelName] = ModelName(check.not_none(MODEL_NAMES.default))
 
-    def __init__(self, *configs: ApiKey | ModelName) -> None:
+    def __init__(
+            self,
+            *configs: ApiKey | ModelName,
+            http_client: http.AsyncHttpClient | None = None,
+    ) -> None:
         super().__init__()
 
+        self._http_client = http_client
+
         with tv.consume(*configs) as cc:
             self._model_name = cc.pop(self.DEFAULT_MODEL_NAME)
             self._api_key = ApiKey.pop_secret(cc, env='GEMINI_API_KEY')
@@ -52,43 +66,121 @@ class GoogleChatChoicesService:
     BASE_URL: ta.ClassVar[str] = 'https://generativelanguage.googleapis.com/v1beta/models'
 
     ROLES_MAP: ta.ClassVar[ta.Mapping[type[Message], str]] = {
-        SystemMessage: 'system',
         UserMessage: 'user',
-        AiMessage: 'assistant',
+        AiMessage: 'model',
+        ToolUseMessage: 'model',
     }
 
-    def invoke(
+    async def invoke(
            self,
            request: ChatChoicesRequest,
    ) -> ChatChoicesResponse:
        key = check.not_none(self._api_key).reveal()
 
-        req_dct = {
-            'contents': [
-                {
-                    'role': self.ROLES_MAP[type(m)],
-                    'parts': [
-                        {
-                            'text': self._get_msg_content(m),
-                        },
-                    ],
-                }
-                for m in request.v
-            ],
-        }
+        g_sys_content: pt.Content | None = None
+        g_contents: list[pt.Content] = []
+        for i, m in enumerate(request.v):
+            if isinstance(m, SystemMessage):
+                check.arg(i == 0)
+                check.none(g_sys_content)
+                g_sys_content = pt.Content(
+                    parts=[pt.Part(
+                        text=check.not_none(self._get_msg_content(m)),
+                    )],
+                )
+
+            elif isinstance(m, ToolUseResultMessage):
+                tr_resp_val: pt.Value
+                if m.tur.c is None:
+                    tr_resp_val = pt.NullValue()  # type: ignore[unreachable]
+                elif isinstance(m.tur.c, str):
+                    tr_resp_val = pt.StringValue(m.tur.c)
+                else:
+                    raise TypeError(m.tur.c)
+                g_contents.append(pt.Content(
+                    parts=[pt.Part(
+                        function_response=pt.FunctionResponse(
+                            id=m.tur.id,
+                            name=m.tur.name,
+                            response={
+                                'value': tr_resp_val,
+                            },
+                        ),
+                    )],
+                ))
+
+            elif isinstance(m, AiMessage):
+                g_contents.append(pt.Content(
+                    parts=[pt.Part(
+                        text=check.not_none(self._get_msg_content(m)),
+                    )],
+                    role='model',
+                ))
+
+            elif isinstance(m, ToolUseMessage):
+                g_contents.append(pt.Content(
+                    parts=[pt.Part(
+                        function_call=pt.FunctionCall(
+                            id=m.tu.id,
+                            name=m.tu.name,
+                            args=m.tu.args,
+                        ),
+                    )],
+                    role='model',
+                ))
+
+            else:
+                g_contents.append(pt.Content(
+                    parts=[pt.Part(
+                        text=check.not_none(self._get_msg_content(m)),
+                    )],
+                    role=self.ROLES_MAP[type(m)],  # type: ignore[arg-type]
+                ))
+
+        g_tools: list[pt.Tool] = []
+        with tv.TypedValues(*request.options).consume() as oc:
+            t: Tool
+            for t in oc.pop(Tool, []):
+                g_tools.append(pt.Tool(
+                    function_declarations=[build_tool_spec_schema(t.spec)],
+                ))
+
+        g_req = pt.GenerateContentRequest(
+            contents=g_contents or None,
+            tools=g_tools or None,
+            system_instruction=g_sys_content,
+        )
+
+        req_dct = msh.marshal(g_req)
 
         model_name = MODEL_NAMES.resolve(self._model_name.v)
 
-        resp = http.request(
+        resp = await http.async_request(
            f'{self.BASE_URL.rstrip("/")}/{model_name}:generateContent?key={key}',
            headers={'Content-Type': 'application/json'},
            data=json.dumps_compact(req_dct).encode('utf-8'),
            method='POST',
+            client=self._http_client,
        )
 
        resp_dct = json.loads(check.not_none(resp.data).decode('utf-8'))
 
-        return ChatChoicesResponse([
-            AiChoice(AiMessage(c['content']['parts'][0]['text']))
-            for c in resp_dct['candidates']
-        ])
+        g_resp = msh.unmarshal(resp_dct, pt.GenerateContentResponse)
+
+        ai_choices: list[AiChoice] = []
+        for c in g_resp.candidates or []:
+            out: list[AnyAiMessage] = []
+            for g_resp_part in check.not_none(check.not_none(c.content).parts):
+                if (g_txt := g_resp_part.text) is not None:
+                    out.append(AiMessage(g_txt))
+                elif (g_fc := g_resp_part.function_call) is not None:
+                    out.append(ToolUseMessage(ToolUse(
+                        id=g_fc.id,
+                        name=g_fc.name,
+                        args=g_fc.args or {},
+                    )))
+                else:
+                    raise TypeError(g_resp_part)
+            ai_choices.append(AiChoice(out))
+
+        return ChatChoicesResponse(ai_choices)
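Note: the Google backend likewise now round-trips through the new typed protocol module (ommlds/backends/google/protocol/types.py), marshaling a GenerateContentRequest and unmarshaling the GenerateContentResponse. A minimal single-turn request sketch, using only the pt.* fields visible above; the helper itself is illustrative rather than part of the package:

import typing as ta

from omlish import marshal as msh

from ommlds.backends.google.protocol import types as pt


def build_single_turn_request(user_text: str) -> ta.Any:
    # One user turn, no tools and no system instruction.
    g_req = pt.GenerateContentRequest(
        contents=[pt.Content(
            parts=[pt.Part(text=user_text)],
            role='user',
        )],
        tools=None,
        system_instruction=None,
    )
    # Marshaled to plain data, ready to be JSON-encoded into the POST body of
    # .../models/{model}:generateContent?key=... as done above.
    return msh.marshal(g_req)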
ommlds/minichain/backends/impls/google/search.py

@@ -82,13 +82,17 @@ class CseSearchService:
             self,
             cse_id: str | None = None,
             cse_api_key: str | None = None,
+            *,
+            http_client: http.AsyncHttpClient | None = None,
     ) -> None:
         super().__init__()
 
         self._cse_id = cse_id
         self._cse_api_key = cse_api_key
 
-    def invoke(
+        self._http_client = http_client
+
+    async def invoke(
             self,
             request: SearchRequest,
     ) -> SearchResponse:
@@ -97,8 +101,9 @@ class CseSearchService:
             cx=check.non_empty_str(self._cse_id),
             q=request.v,
         ))
-        resp = http.request(
+        resp = await http.async_request(
             f'https://www.googleapis.com/customsearch/v1?{qs}',
+            client=self._http_client,
         )
         out = check.not_none(resp.data)
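Note: as with the chat backends, CseSearchService now takes an optional keyword-only async HTTP client, so a caller can share one client across services. A hedged usage sketch; the import paths are assumed from the package layout listed above, and SearchRequest(query) is assumed by analogy with the other minichain request wrappers:

from omlish.http import all as http

from ommlds.minichain.backends.impls.google.search import CseSearchService
from ommlds.minichain.search import SearchRequest


async def run_cse_search(client: http.AsyncHttpClient, cse_id: str, cse_api_key: str, query: str):
    # Inject a shared async client rather than letting the service fall back
    # to its default behavior (http_client=None).
    svc = CseSearchService(cse_id, cse_api_key, http_client=client)
    return await svc.invoke(SearchRequest(query))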