PyPI - vision-agent - Versions diffs - 0.2.117__py3-none-any.whl → 0.2.119__py3-none-any.whl - Mend

vision-agent 0.2.117__py3-none-any.whl → 0.2.119__py3-none-any.whl

Files changed (17) hide show

vision_agent/agent/agent.py +1 -1
vision_agent/agent/vision_agent.py +107 -49
vision_agent/agent/vision_agent_coder.py +46 -23
vision_agent/agent/vision_agent_prompts.py +43 -22
vision_agent/clients/landing_public_api.py +2 -2
vision_agent/lmm/lmm.py +15 -6
vision_agent/lmm/types.py +3 -1
vision_agent/tools/__init__.py +2 -2
vision_agent/tools/meta_tools.py +281 -273
vision_agent/tools/tools.py +36 -14
vision_agent/tools/tools_types.py +3 -3
vision_agent/utils/execute.py +69 -22
vision_agent/utils/image_utils.py +2 -2
{vision_agent-0.2.117.dist-info → vision_agent-0.2.119.dist-info}/METADATA +12 -8
{vision_agent-0.2.117.dist-info → vision_agent-0.2.119.dist-info}/RECORD +17 -17
{vision_agent-0.2.117.dist-info → vision_agent-0.2.119.dist-info}/LICENSE +0 -0
{vision_agent-0.2.117.dist-info → vision_agent-0.2.119.dist-info}/WHEEL +0 -0

vision_agent/tools/tools.py CHANGED Viewed

@@ -1,7 +1,9 @@
 import io
 import json
 import logging
+import os
 import tempfile
+import urllib.request
 from importlib import resources
 from pathlib import Path
 from typing import Any, Dict, List, Optional, Tuple, Union, cast
@@ -760,10 +762,10 @@ def florence2_image_caption(image: np.ndarray, detail_caption: bool = True) -> s
     return answer[task]  # type: ignore
-def florence2_object_detection(prompt: str, image: np.ndarray) -> List[Dict[str, Any]]:
-    """'florencev2_object_detection' is a tool that can detect and count multiple
-    objects given a text prompt such as category names or referring expressions. You
-    can optionally separate the categories in the text with commas. It returns a list
+def florence2_phrase_grounding(prompt: str, image: np.ndarray) -> List[Dict[str, Any]]:
+    """'florence2_phrase_grounding' is a tool that can detect multiple
+    objects given a text prompt which can be object names or caption. You
+    can optionally separate the object names in the text with commas. It returns a list
     of bounding boxes with normalized coordinates, label names and associated
     probability scores of 1.0.
@@ -780,7 +782,7 @@ def florence2_object_detection(prompt: str, image: np.ndarray) -> List[Dict[str,
     Example
     -------
-        >>> florence2_object_detection('person looking at a coyote', image)
+        >>> florence2_phrase_grounding('person looking at a coyote', image)
         [
             {'score': 1.0, 'label': 'person', 'bbox': [0.1, 0.11, 0.35, 0.4]},
             {'score': 1.0, 'label': 'coyote', 'bbox': [0.34, 0.21, 0.85, 0.5},
@@ -792,7 +794,7 @@ def florence2_object_detection(prompt: str, image: np.ndarray) -> List[Dict[str,
         "image": image_b64,
         "task": "<CAPTION_TO_PHRASE_GROUNDING>",
         "prompt": prompt,
-        "function_name": "florence2_object_detection",
+        "function_name": "florence2_phrase_grounding",
     }
     detections = send_inference_request(data, "florence2", v2=True)
@@ -1220,6 +1222,13 @@ def extract_frames(
             video_file_path = video.download(output_path=temp_dir)
             return extract_frames_from_video(video_file_path, fps)
+    elif str(video_uri).startswith(("http", "https")):
+        _, image_suffix = os.path.splitext(video_uri)
+        with tempfile.NamedTemporaryFile(delete=False, suffix=image_suffix) as tmp_file:
+            # Download the video and save it to the temporary file
+            with urllib.request.urlopen(str(video_uri)) as response:
+                tmp_file.write(response.read())
+            return extract_frames_from_video(tmp_file.name, fps)
     return extract_frames_from_video(str(video_uri), fps)
@@ -1250,10 +1259,10 @@ def save_json(data: Any, file_path: str) -> None:
 def load_image(image_path: str) -> np.ndarray:
-    """'load_image' is a utility function that loads an image from the given file path string.
+    """'load_image' is a utility function that loads an image from the given file path string or an URL.
     Parameters:
-        image_path (str): The path to the image.
+        image_path (str): The path or URL to the image.
     Returns:
         np.ndarray: The image as a NumPy array.
@@ -1265,6 +1274,13 @@ def load_image(image_path: str) -> np.ndarray:
     # NOTE: sometimes the generated code pass in a NumPy array
     if isinstance(image_path, np.ndarray):
         return image_path
+    if image_path.startswith(("http", "https")):
+        _, image_suffix = os.path.splitext(image_path)
+        with tempfile.NamedTemporaryFile(delete=False, suffix=image_suffix) as tmp_file:
+            # Download the image and save it to the temporary file
+            with urllib.request.urlopen(image_path) as response:
+                tmp_file.write(response.read())
+            image_path = tmp_file.name
     image = Image.open(image_path).convert("RGB")
     return np.array(image)
@@ -1316,7 +1332,7 @@ def save_video(
         video.write_videofile(f.name, codec="libx264")
         f.close()
         _save_video_to_result(f.name)
-        return f.name
+    return f.name
 def _save_video_to_result(video_uri: str) -> None:
@@ -1418,6 +1434,7 @@ def overlay_segmentation_masks(
     medias: Union[np.ndarray, List[np.ndarray]],
     masks: Union[List[Dict[str, Any]], List[List[Dict[str, Any]]]],
     draw_label: bool = True,
+    secondary_label_key: str = "tracking_label",
 ) -> Union[np.ndarray, List[np.ndarray]]:
     """'overlay_segmentation_masks' is a utility function that displays segmentation
     masks.
@@ -1426,7 +1443,10 @@ def overlay_segmentation_masks(
         medias (Union[np.ndarray, List[np.ndarray]]): The image or frames to display
             the masks on.
         masks (Union[List[Dict[str, Any]], List[List[Dict[str, Any]]]]): A list of
-            dictionaries containing the masks.
+            dictionaries containing the masks, labels and scores.
+        draw_label (bool, optional): If True, the labels will be displayed on the image.
+        secondary_label_key (str, optional): The key to use for the secondary
+            tracking label which is needed in videos to display tracking information.
     Returns:
         np.ndarray: The image with the masks displayed.
@@ -1471,6 +1491,7 @@ def overlay_segmentation_masks(
         for elt in masks_int[i]:
             mask = elt["mask"]
             label = elt["label"]
+            tracking_lbl = elt.get(secondary_label_key, None)
             np_mask = np.zeros((pil_image.size[1], pil_image.size[0], 4))
             np_mask[mask > 0, :] = color[label] + (255 * 0.5,)
             mask_img = Image.fromarray(np_mask.astype(np.uint8))
@@ -1478,16 +1499,17 @@ def overlay_segmentation_masks(
             if draw_label:
                 draw = ImageDraw.Draw(pil_image)
-                text_box = draw.textbbox((0, 0), text=label, font=font)
+                text = tracking_lbl if tracking_lbl else label
+                text_box = draw.textbbox((0, 0), text=text, font=font)
                 x, y = _get_text_coords_from_mask(
                     mask,
                     v_gap=(text_box[3] - text_box[1]) + 10,
                     h_gap=(text_box[2] - text_box[0]) // 2,
                 )
                 if x != 0 and y != 0:
-                    text_box = draw.textbbox((x, y), text=label, font=font)
+                    text_box = draw.textbbox((x, y), text=text, font=font)
                     draw.rectangle((x, y, text_box[2], text_box[3]), fill=color[label])
-                    draw.text((x, y), label, fill="black", font=font)
+                    draw.text((x, y), text, fill="black", font=font)
         frame_out.append(np.array(pil_image))
     return frame_out[0] if len(frame_out) == 1 else frame_out
@@ -1663,7 +1685,7 @@ FUNCTION_TOOLS = [
     florence2_ocr,
     florence2_sam2_image,
     florence2_sam2_video,
-    florence2_object_detection,
+    florence2_phrase_grounding,
     ixc25_image_vqa,
     ixc25_video_vqa,
     detr_segmentation,

vision_agent/tools/tools_types.py CHANGED Viewed

@@ -1,8 +1,8 @@
-from uuid import UUID
 from enum import Enum
-from typing import List, Tuple, Optional
+from typing import List, Optional, Tuple
+from uuid import UUID
-from pydantic import BaseModel, ConfigDict, Field, field_serializer, SerializationInfo
+from pydantic import BaseModel, ConfigDict, Field, SerializationInfo, field_serializer
 class BboxInput(BaseModel):

vision_agent/utils/execute.py CHANGED Viewed

@@ -5,7 +5,6 @@ import os
 import platform
 import re
 import sys
-import tempfile
 import traceback
 import warnings
 from enum import Enum
@@ -40,6 +39,7 @@ from vision_agent.utils.exceptions import (
 load_dotenv()
 _LOGGER = logging.getLogger(__name__)
 _SESSION_TIMEOUT = 600  # 10 minutes
+WORKSPACE = Path(os.getenv("WORKSPACE", ""))
 class MimeType(str, Enum):
@@ -384,8 +384,15 @@ class Execution(BaseModel):
 class CodeInterpreter(abc.ABC):
     """Code interpreter interface."""
-    def __init__(self, timeout: int, *args: Any, **kwargs: Any) -> None:
+    def __init__(
+        self,
+        timeout: int,
+        remote_path: Optional[Union[str, Path]] = None,
+        *args: Any,
+        **kwargs: Any,
+    ) -> None:
         self.timeout = timeout
+        self.remote_path = Path(remote_path if remote_path is not None else WORKSPACE)
     def __enter__(self) -> Self:
         return self
@@ -406,17 +413,21 @@ class CodeInterpreter(abc.ABC):
         self.restart_kernel()
         return self.exec_cell(code)
-    def upload_file(self, file: Union[str, Path]) -> str:
+    def upload_file(self, file: Union[str, Path]) -> Path:
         # Default behavior is a no-op (for local code interpreter)
-        return str(file)
+        return Path(file)
-    def download_file(self, file_path: str) -> Path:
+    def download_file(
+        self, remote_file_path: Union[str, Path], local_file_path: Union[str, Path]
+    ) -> Path:
         # Default behavior is a no-op (for local code interpreter)
-        return Path(file_path)
+        return Path(local_file_path)
 class E2BCodeInterpreter(CodeInterpreter):
-    def __init__(self, *args: Any, **kwargs: Any) -> None:
+    def __init__(
+        self, remote_path: Optional[Union[str, Path]] = None, *args: Any, **kwargs: Any
+    ) -> None:
         super().__init__(*args, **kwargs)
         assert os.getenv("E2B_API_KEY"), "E2B_API_KEY environment variable must be set"
         try:
@@ -443,6 +454,9 @@ print(f"Vision Agent version: {va_version}")"""
         _LOGGER.info(
             f"E2BCodeInterpreter (sandbox id: {self.interpreter.sandbox_id}) initialized:\n{sys_versions}"
         )
+        self.remote_path = Path(
+            remote_path if remote_path is not None else "/home/user"
+        )
     def close(self, *args: Any, **kwargs: Any) -> None:
         try:
@@ -516,19 +530,22 @@ print(f"Vision Agent version: {va_version}")"""
         before_sleep=tenacity.before_sleep_log(_LOGGER, logging.INFO),
         after=tenacity.after_log(_LOGGER, logging.INFO),
     )
-    def upload_file(self, file: Union[str, Path]) -> str:
+    def upload_file(self, file: Union[str, Path]) -> Path:
         file_name = Path(file).name
-        remote_path = f"/home/user/{file_name}"
         with open(file, "rb") as f:
-            self.interpreter.files.write(path=remote_path, data=f)
-            _LOGGER.info(f"File ({file}) is uploaded to: {remote_path}")
-            return remote_path
-    def download_file(self, file_path: str) -> Path:
-        with tempfile.NamedTemporaryFile(mode="w+b", delete=False) as file:
-            file.write(self.interpreter.files.read(path=file_path, format="bytes"))
-            _LOGGER.info(f"File ({file_path}) is downloaded to: {file.name}")
-            return Path(file.name)
+            self.interpreter.files.write(path=str(self.remote_path / file_name), data=f)
+        _LOGGER.info(f"File ({file}) is uploaded to: {str(self.remote_path)}")
+        return self.remote_path / file_name
+    def download_file(
+        self, remote_file_path: Union[str, Path], local_file_path: Union[str, Path]
+    ) -> Path:
+        with open(local_file_path, "w+b") as f:
+            f.write(
+                self.interpreter.files.read(path=str(remote_file_path), format="bytes")
+            )
+        _LOGGER.info(f"File ({remote_file_path}) is downloaded to: {local_file_path}")
+        return Path(local_file_path)
     @staticmethod
     def _new_e2b_interpreter_impl(*args, **kwargs) -> E2BCodeInterpreterImpl:  # type: ignore
@@ -540,7 +557,11 @@ print(f"Vision Agent version: {va_version}")"""
 class LocalCodeInterpreter(CodeInterpreter):
-    def __init__(self, timeout: int = _SESSION_TIMEOUT) -> None:
+    def __init__(
+        self,
+        timeout: int = _SESSION_TIMEOUT,
+        remote_path: Optional[Union[str, Path]] = None,
+    ) -> None:
         super().__init__(timeout=timeout)
         self.nb = nbformat.v4.new_notebook()
         self.nb_client = NotebookClient(self.nb, timeout=self.timeout)
@@ -554,6 +575,7 @@ Timeout: {self.timeout}"""
         )
         sleep(1)
         self._new_kernel()
+        self.remote_path = Path(remote_path if remote_path is not None else WORKSPACE)
     def _new_kernel(self) -> None:
         if self.nb_client.kc is None or not run_sync(self.nb_client.kc.is_alive)():  # type: ignore
@@ -607,6 +629,25 @@ Timeout: {self.timeout}"""
             traceback_raw = traceback.format_exc().splitlines()
             return Execution.from_exception(e, traceback_raw)
+    def upload_file(self, file_path: Union[str, Path]) -> Path:
+        with open(file_path, "rb") as f:
+            contents = f.read()
+        with open(self.remote_path / Path(file_path).name, "wb") as f:
+            f.write(contents)
+        _LOGGER.info(f"File ({file_path}) is uploaded to: {str(self.remote_path)}")
+        return Path(self.remote_path / file_path)
+    def download_file(
+        self, remote_file_path: Union[str, Path], local_file_path: Union[str, Path]
+    ) -> Path:
+        with open(self.remote_path / remote_file_path, "rb") as f:
+            contents = f.read()
+        with open(local_file_path, "wb") as f:
+            f.write(contents)
+        _LOGGER.info(f"File ({remote_file_path}) is downloaded to: {local_file_path}")
+        return Path(local_file_path)
 class CodeInterpreterFactory:
     """Factory class for creating code interpreters.
@@ -630,13 +671,19 @@ class CodeInterpreterFactory:
         return instance
     @staticmethod
-    def new_instance(code_sandbox_runtime: Optional[str] = None) -> CodeInterpreter:
+    def new_instance(
+        code_sandbox_runtime: Optional[str] = None, remote_path: Optional[str] = None
+    ) -> CodeInterpreter:
         if not code_sandbox_runtime:
             code_sandbox_runtime = os.getenv("CODE_SANDBOX_RUNTIME", "local")
         if code_sandbox_runtime == "e2b":
-            instance: CodeInterpreter = E2BCodeInterpreter(timeout=_SESSION_TIMEOUT)
+            instance: CodeInterpreter = E2BCodeInterpreter(
+                timeout=_SESSION_TIMEOUT, remote_path=remote_path
+            )
         elif code_sandbox_runtime == "local":
-            instance = LocalCodeInterpreter(timeout=_SESSION_TIMEOUT)
+            instance = LocalCodeInterpreter(
+                timeout=_SESSION_TIMEOUT, remote_path=remote_path
+            )
         else:
             raise ValueError(
                 f"Unsupported code sandbox runtime: {code_sandbox_runtime}. Supported runtimes: e2b, local"

vision_agent/utils/image_utils.py CHANGED Viewed

@@ -70,7 +70,7 @@ def rle_decode_array(rle: Dict[str, List[int]]) -> np.ndarray:
     r"""Decode a run-length encoded mask. Returns numpy array, 1 - mask, 0 - background.
     Parameters:
-        mask: The mask in run-length encoded as an array.
+        rle: The run-length encoded mask.
     """
     size = rle["size"]
     counts = rle["counts"]
@@ -100,7 +100,7 @@ def frames_to_bytes(
     """
     with tempfile.NamedTemporaryFile(delete=True) as temp_file:
         clip = ImageSequenceClip(frames, fps=fps)
-        clip.write_videofile(temp_file.name + f".{file_ext}", fps=fps)
+        clip.write_videofile(temp_file.name + f".{file_ext}", fps=fps, codec="libx264")
         with open(temp_file.name + f".{file_ext}", "rb") as f:
             buffer_bytes = f.read()
     return buffer_bytes

{vision_agent-0.2.117.dist-info → vision_agent-0.2.119.dist-info}/METADATA RENAMED Viewed

@@ -1,6 +1,6 @@
 Metadata-Version: 2.1
 Name: vision-agent
-Version: 0.2.117
+Version: 0.2.119
 Summary: Toolset for Vision Agent
 Author: Landing AI
 Author-email: dev@landing.ai
@@ -81,15 +81,15 @@ export OPENAI_API_KEY="your-api-key"
 ```
 ### Vision Agent
-There are two agents that you can use. Vision Agent is a conversational agent that has
+There are two agents that you can use. `VisionAgent` is a conversational agent that has
 access to tools that allow it to write an navigate python code and file systems. It can
-converse with the user in natural language. VisionAgentCoder is an agent that can write
-code for vision tasks, such as counting people in an image. However, it cannot converse
-and can only respond with code. VisionAgent can call VisionAgentCoder to write vision
-code.
+converse with the user in natural language. `VisionAgentCoder` is an agent specifically
+for writing code for vision tasks, such as counting people in an image. However, it
+cannot chat with you and can only respond with code. `VisionAgent` can call
+`VisionAgentCoder` to write vision code.
 #### Basic Usage
-To run the streamlit app locally to chat with Vision Agent, you can run the following
+To run the streamlit app locally to chat with `VisionAgent`, you can run the following
 command:
 ```bash
@@ -186,7 +186,7 @@ the code and having it update. You just need to add the code as a response from
 assistant:
 ```python
-agent = va.agent.VisionAgent(verbosity=2)
+agent = va.agent.VisionAgentCoder(verbosity=2)
 conv = [
     {
         "role": "user",
@@ -252,6 +252,10 @@ function. Make sure the documentation is in the same format above with descripti
 `Parameters:`, `Returns:`, and `Example\n-------`. You can find an example use case
 [here](examples/custom_tools/) as this is what the agent uses to pick and use the tool.
+Can't find the tool you need and want add it to `VisionAgent`? Check out our
+[vision-agent-tools](https://github.com/landing-ai/vision-agent-tools) repository where
+we add the source code for all the tools used in `VisionAgent`.
 ## Additional Backends
 ### Ollama
 We also provide a `VisionAgentCoder` that uses Ollama. To get started you must download

{vision_agent-0.2.117.dist-info → vision_agent-0.2.119.dist-info}/RECORD RENAMED Viewed

@@ -1,33 +1,33 @@
 vision_agent/__init__.py,sha256=EAb4-f9iyuEYkBrX4ag1syM8Syx8118_t0R6_C34M9w,57
 vision_agent/agent/__init__.py,sha256=FRwiux1FGvGccetyUCtY46KP01fQteqorm-JtFepovI,176
-vision_agent/agent/agent.py,sha256=Bt8yhjCFXuRdZaHxKEesG40V09nWRt45sZluri1R3AA,575
+vision_agent/agent/agent.py,sha256=2cjIOxEuSJrqbfPXYoV0qER5ihXsPFCoEFJa4jpqan0,597
 vision_agent/agent/agent_utils.py,sha256=22LiPhkJlS5mVeo2dIi259pc2NgA7PGHRpcbnrtKo78,1930
-vision_agent/agent/vision_agent.py,sha256=5rgO-pScVOS3t4sWnLBnGYYkGftGgF4U0FpZzFVrDAY,8447
-vision_agent/agent/vision_agent_coder.py,sha256=qRSv_krY6-uHJC8exo3Nw0dPJ81jSzhKw2WTCHw1XVE,33733
+vision_agent/agent/vision_agent.py,sha256=IEyXT_JPCuWmBHdEnM1Wrsj7hmCe5pKLf0gnZFJTddI,11046
+vision_agent/agent/vision_agent_coder.py,sha256=DOTmDdGPxcI06Jp6yx4ekRMP0vhiVaK9B9Dl8UyJHeo,34396
 vision_agent/agent/vision_agent_coder_prompts.py,sha256=xIya1txRZM8qoQHAWTEkEFCL8L3iZD7QD09t3ZtdxSE,11305
-vision_agent/agent/vision_agent_prompts.py,sha256=ydUU_Wvw-jqdL_vObSUr-VCQvjSwA5Fd74TbbhUzyxk,6112
+vision_agent/agent/vision_agent_prompts.py,sha256=0GliXFtBf32aPu2ClU63FI5ii5CTxWYsvrsmnnDp-gs,7134
 vision_agent/clients/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
 vision_agent/clients/http.py,sha256=k883i6M_4nl7zwwHSI-yP5sAgQZIDPM1nrKD6YFJ3Xs,2009
-vision_agent/clients/landing_public_api.py,sha256=6L15zh5lP5JHCpGnYpHMREgrrKiJin_OYdf2vT9HHZQ,1507
+vision_agent/clients/landing_public_api.py,sha256=rGtACkr8o5egDuMHQ5MBO4NuvsgPTp9Ew3rbq4R-vs0,1507
 vision_agent/fonts/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
 vision_agent/fonts/default_font_ch_en.ttf,sha256=1YM0Z3XqLDjSNbF7ihQFSAIUdjF9m1rtHiNC_6QosTE,1594400
 vision_agent/lmm/__init__.py,sha256=YuUZRsMHdn8cMOv6iBU8yUqlIOLrbZQqZl9KPnofsHQ,103
-vision_agent/lmm/lmm.py,sha256=cuXtfFb7kJwVTyHTeK_t1bYItPiNjmDI2gF8vJs4gsM,20231
-vision_agent/lmm/types.py,sha256=8TSRoTbXyCKVJiH-wHXI2OiGOMSkYv1vLGYeAXtNpOQ,153
-vision_agent/tools/__init__.py,sha256=Y6Y7McmdC8cm6UsJgExBLEPi4StBkqfY4y8_Mp7LlWU,2190
-vision_agent/tools/meta_tools.py,sha256=q6h7hZarZrsWRloVE6PbTZwW8J2N1uUM9Ac-XxsT6hk,13365
+vision_agent/lmm/lmm.py,sha256=AYrZNdhghG293wd3aKZ1jK1lUm2NLWwALktbM4wNais,20862
+vision_agent/lmm/types.py,sha256=ZEXR_ptBL0ZwDMTDYkgxUCmSZFmBYPQd2jreNzr_8UY,221
+vision_agent/tools/__init__.py,sha256=i7JOLxRaLdcY7-vCNOGAeOFMBfiAUIwWhnT32FO97VE,2201
+vision_agent/tools/meta_tools.py,sha256=Vu9WnKicGhafx9dPzDbQjQdcIzRCYYFPF68o79hDP-8,14616
 vision_agent/tools/prompts.py,sha256=V1z4YJLXZuUl_iZ5rY0M5hHc_2tmMEUKr0WocXKGt4E,1430
 vision_agent/tools/tool_utils.py,sha256=qMsb9d8QtpXGgF9rpPO2dA390BewKdYO68oWKDu-TGg,6504
-vision_agent/tools/tools.py,sha256=JscejDn05jpYW6psPkRDesegPtZJshNWCncGFPOpI7c,58626
-vision_agent/tools/tools_types.py,sha256=z6_XtUhWgh201yM7Z0CYtiLBEGdHPc_QUydMDHZ84EA,2216
+vision_agent/tools/tools.py,sha256=kbbMToAaHxl42dDEvyz9Mvtpqts0l0hGoC5YQQyozr8,59953
+vision_agent/tools/tools_types.py,sha256=iLWSirheC87fKQolIhx_O4Jk8Lv7DRiLuE8PJqLGiVQ,2216
 vision_agent/utils/__init__.py,sha256=pWk0ktvR4aUEhuEIzSLM9kSgW4WDVqptdvOTeGLkJ6M,230
 vision_agent/utils/exceptions.py,sha256=booSPSuoULF7OXRr_YbC4dtKt6gM_HyiFQHBuaW86C4,2052
-vision_agent/utils/execute.py,sha256=1_pyu16WRlFD81W8Uy_Sv7_jD_qkrkxHdUNeFstBzaA,25082
-vision_agent/utils/image_utils.py,sha256=c1LrmaHD331za8DbA1myJpgUmWoDzePaOK6-dsdpZQo,9847
+vision_agent/utils/execute.py,sha256=Ap8Yx80spQq5f2QtKGx1MK03BR45mJKhlp1kfh-rIao,26751
+vision_agent/utils/image_utils.py,sha256=eNghu_2L8624jEXy8ZZS9OX46Mv0DT9bcvLForujwTs,9848
 vision_agent/utils/sim.py,sha256=ebE9Cs00pVEDI1HMjAzUBk88tQQmc2U-yAzIDinnekU,5572
 vision_agent/utils/type_defs.py,sha256=BE12s3JNQy36QvauXHjwyeffVh5enfcvd4vTzSwvEZI,1384
 vision_agent/utils/video.py,sha256=rNmU9KEIkZB5-EztZNlUiKYN0mm_55A_2VGUM0QpqLA,8779
-vision_agent-0.2.117.dist-info/LICENSE,sha256=xx0jnfkXJvxRnG63LTGOxlggYnIysveWIZ6H3PNdCrQ,11357
-vision_agent-0.2.117.dist-info/METADATA,sha256=GxjyDhGf-9M3VAM5T2A1DHuR4A4KbceN4q-wGDw8Vhw,11997
-vision_agent-0.2.117.dist-info/WHEEL,sha256=7Z8_27uaHI_UZAc4Uox4PpBhQ9Y5_modZXWMxtUi4NU,88
-vision_agent-0.2.117.dist-info/RECORD,,
+vision_agent-0.2.119.dist-info/LICENSE,sha256=xx0jnfkXJvxRnG63LTGOxlggYnIysveWIZ6H3PNdCrQ,11357
+vision_agent-0.2.119.dist-info/METADATA,sha256=ag8Cf800dZJtJqJtwEcf4gqf7Qjf-K1JMoeisDI7RWQ,12255
+vision_agent-0.2.119.dist-info/WHEEL,sha256=7Z8_27uaHI_UZAc4Uox4PpBhQ9Y5_modZXWMxtUi4NU,88
+vision_agent-0.2.119.dist-info/RECORD,,

{vision_agent-0.2.117.dist-info → vision_agent-0.2.119.dist-info}/LICENSE RENAMED Viewed

File without changes

{vision_agent-0.2.117.dist-info → vision_agent-0.2.119.dist-info}/WHEEL RENAMED Viewed

File without changes

vision-agent 0.2.117__py3-none-any.whl → 0.2.119__py3-none-any.whl

vision-agent 0.2.117__py3-none-any.whl → 0.2.119__py3-none-any.whl