PyPI - llm-gemini - Versions diffs - 0.13a0__py3-none-any.whl → 0.14__py3-none-any.whl - Mend

llm-gemini 0.13a0__py3-none-any.whl → 0.14__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (8) hide show

{llm_gemini-0.13a0.dist-info → llm_gemini-0.14.dist-info}/METADATA RENAMED Viewed

@@ -1,6 +1,6 @@
 Metadata-Version: 2.2
 Name: llm-gemini
-Version: 0.13a0
+Version: 0.14
 Summary: LLM plugin to access Google's Gemini family of models
 Author: Simon Willison
 License: Apache-2.0
@@ -11,12 +11,13 @@ Project-URL: CI, https://github.com/simonw/llm-gemini/actions
 Classifier: License :: OSI Approved :: Apache Software License
 Description-Content-Type: text/markdown
 License-File: LICENSE
-Requires-Dist: llm>=0.23a0
+Requires-Dist: llm>=0.23
 Requires-Dist: httpx
 Requires-Dist: ijson
 Provides-Extra: test
 Requires-Dist: pytest; extra == "test"
 Requires-Dist: pytest-recording; extra == "test"
+Requires-Dist: pytest-asyncio; extra == "test"
 Requires-Dist: nest-asyncio; extra == "test"
 # llm-gemini
@@ -145,7 +146,7 @@ llm chat -m gemini-1.5-pro-latest
 ## Embeddings
-The plugin also adds support for the `text-embedding-004` embedding model.
+The plugin also adds support for the `gemini-embedding-exp-03-07` and `text-embedding-004` embedding models.
 Run that against a single string like this:
 ```bash
@@ -153,10 +154,20 @@ llm embed -m text-embedding-004 -c 'hello world'
 ```
 This returns a JSON array of 768 numbers.
+The `gemini-embedding-exp-03-07` model is larger, returning 3072 numbers. You can also use variants of it that are truncated down to smaller sizes:
+- `gemini-embedding-exp-03-07` - 3072 numbers
+- `gemini-embedding-exp-03-07-2048` - 2048 numbers
+- `gemini-embedding-exp-03-07-1024` - 1024 numbers
+- `gemini-embedding-exp-03-07-512` - 512 numbers
+- `gemini-embedding-exp-03-07-256` - 256 numbers
+- `gemini-embedding-exp-03-07-128` - 128 numbers
 This command will embed every `README.md` file in child directories of the current directory and store the results in a SQLite database called `embed.db` in a collection called `readmes`:
 ```bash
-llm embed-multi readmes --files . '*/README.md' -d embed.db -m text-embedding-004
+llm embed-multi readmes -d embed.db -m gemini-embedding-exp-03-07-128 \
+  --files . '*/README.md'
 ```
 You can then run similarity searches against that collection like this:
 ```bash

llm_gemini-0.14.dist-info/RECORD ADDED Viewed

@@ -0,0 +1,7 @@
+llm_gemini.py,sha256=KgiKMPY6q-GkAMzH0gfQWp0cjBBKizNhlnZ3nX5pXWY,14917
+llm_gemini-0.14.dist-info/LICENSE,sha256=xx0jnfkXJvxRnG63LTGOxlggYnIysveWIZ6H3PNdCrQ,11357
+llm_gemini-0.14.dist-info/METADATA,sha256=J8oA7hZmNrFsRyH3_s4oesSjWNEaK8pWcT2p-_quPTA,7556
+llm_gemini-0.14.dist-info/WHEEL,sha256=jB7zZ3N9hIM9adW7qlTAyycLYW9npaWKLRzaoVcLKcM,91
+llm_gemini-0.14.dist-info/entry_points.txt,sha256=n544bpgUPIBc5l_cnwsTxPc3gMGJHPtAyqBNp-CkMWk,26
+llm_gemini-0.14.dist-info/top_level.txt,sha256=WUQmG6_2QKbT_8W4HH93qyKl_0SUteL4Ra6_PhyNGKU,11
+llm_gemini-0.14.dist-info/RECORD,,

llm_gemini.py CHANGED Viewed

@@ -65,8 +65,16 @@ def register_models(register):
     ]:
         can_google_search = model_id in GOOGLE_SEARCH_MODELS
         register(
-            GeminiPro(model_id, can_google_search=can_google_search),
-            AsyncGeminiPro(model_id, can_google_search=can_google_search),
+            GeminiPro(
+                model_id,
+                can_google_search=can_google_search,
+                can_schema="flash-thinking" not in model_id,
+            ),
+            AsyncGeminiPro(
+                model_id,
+                can_google_search=can_google_search,
+                can_schema="flash-thinking" not in model_id,
+            ),
         )
@@ -82,7 +90,7 @@ def resolve_type(attachment):
 def cleanup_schema(schema):
     "Gemini supports only a subset of JSON schema"
-    keys_to_remove = ("$schema", "additionalProperties")
+    keys_to_remove = ("$schema", "additionalProperties", "title")
     # Recursively remove them
     if isinstance(schema, dict):
         for key in keys_to_remove:
@@ -186,9 +194,10 @@ class _SharedGemini:
             default=None,
         )
-    def __init__(self, model_id, can_google_search=False):
+    def __init__(self, model_id, can_google_search=False, can_schema=False):
         self.model_id = model_id
         self.can_google_search = can_google_search
+        self.supports_schema = can_schema
         if can_google_search:
             self.Options = self.OptionsWithGoogleSearch
@@ -279,9 +288,17 @@ class _SharedGemini:
             return f'```\n{part["codeExecutionResult"]["output"].strip()}\n```\n'
         return ""
+    def process_candidates(self, candidates):
+        # We only use the first candidate
+        for part in candidates[0]["content"]["parts"]:
+            yield self.process_part(part)
     def set_usage(self, response):
         try:
-            usage = response.response_json[-1].pop("usageMetadata")
+            # Don't record the "content" key from that last candidate
+            for candidate in response.response_json["candidates"]:
+                candidate.pop("content", None)
+            usage = response.response_json.pop("usageMetadata")
             input_tokens = usage.pop("promptTokenCount", None)
             output_tokens = usage.pop("candidatesTokenCount", None)
             usage.pop("totalTokenCount", None)
@@ -311,17 +328,16 @@ class GeminiPro(_SharedGemini, llm.KeyModel):
             for chunk in http_response.iter_bytes():
                 coro.send(chunk)
                 if events:
-                    event = events[0]
-                    if isinstance(event, dict) and "error" in event:
-                        raise llm.ModelError(event["error"]["message"])
-                    try:
-                        part = event["candidates"][0]["content"]["parts"][0]
-                        yield self.process_part(part)
-                    except KeyError:
-                        yield ""
-                    gathered.append(event)
+                    for event in events:
+                        if isinstance(event, dict) and "error" in event:
+                            raise llm.ModelError(event["error"]["message"])
+                        try:
+                            yield from self.process_candidates(event["candidates"])
+                        except KeyError:
+                            yield ""
+                        gathered.append(event)
                     events.clear()
-        response.response_json = gathered
+        response.response_json = gathered[-1]
         self.set_usage(response)
@@ -344,25 +360,37 @@ class AsyncGeminiPro(_SharedGemini, llm.AsyncKeyModel):
                 async for chunk in http_response.aiter_bytes():
                     coro.send(chunk)
                     if events:
-                        event = events[0]
-                        if isinstance(event, dict) and "error" in event:
-                            raise llm.ModelError(event["error"]["message"])
-                        try:
-                            part = event["candidates"][0]["content"]["parts"][0]
-                            yield self.process_part(part)
-                        except KeyError:
-                            yield ""
-                        gathered.append(event)
+                        for event in events:
+                            if isinstance(event, dict) and "error" in event:
+                                raise llm.ModelError(event["error"]["message"])
+                            try:
+                                for chunk in self.process_candidates(
+                                    event["candidates"]
+                                ):
+                                    yield chunk
+                            except KeyError:
+                                yield ""
+                            gathered.append(event)
                         events.clear()
-        response.response_json = gathered
+        response.response_json = gathered[-1]
         self.set_usage(response)
 @llm.hookimpl
 def register_embedding_models(register):
+    register(GeminiEmbeddingModel("text-embedding-004", "text-embedding-004"))
+    # gemini-embedding-exp-03-07 in different truncation sizes
     register(
-        GeminiEmbeddingModel("text-embedding-004", "text-embedding-004"),
+        GeminiEmbeddingModel(
+            "gemini-embedding-exp-03-07", "gemini-embedding-exp-03-07"
+        ),
     )
+    for i in (128, 256, 512, 1024, 2048):
+        register(
+            GeminiEmbeddingModel(
+                f"gemini-embedding-exp-03-07-{i}", f"gemini-embedding-exp-03-07", i
+            ),
+        )
 class GeminiEmbeddingModel(llm.EmbeddingModel):
@@ -370,9 +398,10 @@ class GeminiEmbeddingModel(llm.EmbeddingModel):
     key_env_var = "LLM_GEMINI_KEY"
     batch_size = 20
-    def __init__(self, model_id, gemini_model_id):
+    def __init__(self, model_id, gemini_model_id, truncate=None):
         self.model_id = model_id
         self.gemini_model_id = gemini_model_id
+        self.truncate = truncate
     def embed_batch(self, items):
         headers = {
@@ -398,4 +427,7 @@ class GeminiEmbeddingModel(llm.EmbeddingModel):
             )
         response.raise_for_status()
-        return [item["values"] for item in response.json()["embeddings"]]
+        values = [item["values"] for item in response.json()["embeddings"]]
+        if self.truncate:
+            values = [value[: self.truncate] for value in values]
+        return values

llm_gemini-0.13a0.dist-info/RECORD DELETED Viewed

@@ -1,7 +0,0 @@
-llm_gemini.py,sha256=M4_OIzaF3ytfrCdQ_md9sS6ViDN38JlP9aaykY5Ct0E,13634
-llm_gemini-0.13a0.dist-info/LICENSE,sha256=xx0jnfkXJvxRnG63LTGOxlggYnIysveWIZ6H3PNdCrQ,11357
-llm_gemini-0.13a0.dist-info/METADATA,sha256=_SbfjPGKz4M4Wfvd6p8zyx37qOF99R-aTBxGQ0lnGHY,7018
-llm_gemini-0.13a0.dist-info/WHEEL,sha256=jB7zZ3N9hIM9adW7qlTAyycLYW9npaWKLRzaoVcLKcM,91
-llm_gemini-0.13a0.dist-info/entry_points.txt,sha256=n544bpgUPIBc5l_cnwsTxPc3gMGJHPtAyqBNp-CkMWk,26
-llm_gemini-0.13a0.dist-info/top_level.txt,sha256=WUQmG6_2QKbT_8W4HH93qyKl_0SUteL4Ra6_PhyNGKU,11
-llm_gemini-0.13a0.dist-info/RECORD,,

{llm_gemini-0.13a0.dist-info → llm_gemini-0.14.dist-info}/LICENSE RENAMED Viewed

File without changes

{llm_gemini-0.13a0.dist-info → llm_gemini-0.14.dist-info}/WHEEL RENAMED Viewed

File without changes

{llm_gemini-0.13a0.dist-info → llm_gemini-0.14.dist-info}/entry_points.txt RENAMED Viewed

File without changes

{llm_gemini-0.13a0.dist-info → llm_gemini-0.14.dist-info}/top_level.txt RENAMED Viewed

File without changes

llm-gemini 0.13a0__py3-none-any.whl → 0.14__py3-none-any.whl

llm-gemini 0.13a0__py3-none-any.whl → 0.14__py3-none-any.whl