vision-agent 0.2.229__py3-none-any.whl → 0.2.231__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
@@ -222,7 +222,7 @@ def sam2(
     ret = _sam2(image, detections, image_size)
     _display_tool_trace(
         sam2.__name__,
-        {},
+        {"detections": detections},
        ret["display_data"],
        ret["files"],
    )
@@ -314,18 +314,29 @@ def od_sam2_video_tracking(
 
     # Process each segment and collect detections
     detections_per_segment: List[Any] = []
-    for segment_index, segment in enumerate(segments):
-        segment_detections = process_segment(
-            segment_frames=segment,
-            od_model=od_model,
-            prompt=prompt,
-            fine_tune_id=fine_tune_id,
-            chunk_length=chunk_length,
-            image_size=image_size,
-            segment_index=segment_index,
-            object_detection_tool=_apply_object_detection,
-        )
-        detections_per_segment.append(segment_detections)
+    with ThreadPoolExecutor() as executor:
+        futures = {
+            executor.submit(
+                process_segment,
+                segment_frames=segment,
+                od_model=od_model,
+                prompt=prompt,
+                fine_tune_id=fine_tune_id,
+                chunk_length=chunk_length,
+                image_size=image_size,
+                segment_index=segment_index,
+                object_detection_tool=_apply_object_detection,
+            ): segment_index
+            for segment_index, segment in enumerate(segments)
+        }
+
+        for future in as_completed(futures):
+            segment_index = futures[future]
+            detections_per_segment.append((segment_index, future.result()))
+
+    detections_per_segment = [
+        x[1] for x in sorted(detections_per_segment, key=lambda x: x[0])
+    ]
 
     merged_detections = merge_segments(detections_per_segment)
     post_processed = post_process(merged_detections, image_size)
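The new version of `od_sam2_video_tracking` submits each segment to a thread pool and then sorts the completed results back into segment order before merging. A minimal sketch of that pattern, with a hypothetical `work` function standing in for `process_segment`:

```python
from concurrent.futures import ThreadPoolExecutor, as_completed

def work(segment_index: int, segment: list) -> str:
    # stand-in for the real per-segment detection call
    return f"detections for segment {segment_index} ({len(segment)} frames)"

segments = [["f0", "f1"], ["f2", "f3"], ["f4"]]

results = []
with ThreadPoolExecutor() as executor:
    # map each future back to the index of the segment it processes
    futures = {executor.submit(work, i, seg): i for i, seg in enumerate(segments)}
    for future in as_completed(futures):
        # futures finish in arbitrary order, so keep the index with the result
        results.append((futures[future], future.result()))

# restore the original segment order before merging downstream
ordered = [r for _, r in sorted(results, key=lambda x: x[0])]
print(ordered)
```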
@@ -390,7 +401,7 @@ def _owlv2_object_detection(
         {
             "label": bbox["label"],
             "bbox": normalize_bbox(bbox["bounding_box"], image_size),
-            "score": bbox["score"],
+            "score": round(bbox["score"], 2),
         }
         for bbox in bboxes
     ]
@@ -398,7 +409,7 @@ def _owlv2_object_detection(
         {
             "label": bbox["label"],
             "bbox": bbox["bounding_box"],
-            "score": bbox["score"],
+            "score": round(bbox["score"], 2),
         }
         for bbox in bboxes
     ]
@@ -582,7 +593,7 @@ def owlv2_sam2_video_tracking(
     )
     _display_tool_trace(
         owlv2_sam2_video_tracking.__name__,
-        {},
+        {"prompt": prompt, "chunk_length": chunk_length},
        ret["display_data"],
        ret["files"],
    )
@@ -595,14 +606,14 @@ def owlv2_sam2_video_tracking(
 def florence2_object_detection(
     prompt: str, image: np.ndarray, fine_tune_id: Optional[str] = None
 ) -> List[Dict[str, Any]]:
-    """'florence2_object_detection' is a tool that can detect multiple
-    objects given a text prompt which can be object names or caption. You
-    can optionally separate the object names in the text with commas. It returns a list
-    of bounding boxes with normalized coordinates, label names and associated
-    confidence scores of 1.0.
+    """'florence2_object_detection' is a tool that can detect multiple objects given a
+    text prompt which can be object names or caption. You can optionally separate the
+    object names in the text with commas. It returns a list of bounding boxes with
+    normalized coordinates, label names and associated confidence scores of 1.0.
 
     Parameters:
-        prompt (str): The prompt to ground to the image.
+        prompt (str): The prompt to ground to the image. Use exclusive categories that
+            do not overlap such as 'person, car' and NOT 'person, athlete'.
         image (np.ndarray): The image to used to detect objects
         fine_tune_id (Optional[str]): If you have a fine-tuned model, you can pass the
             fine-tuned model ID here to use it.
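The added docstring guidance asks callers to use mutually exclusive category names in the prompt. A hypothetical call following that guidance (the image path is illustrative, and this assumes `florence2_object_detection` is importable from `vision_agent.tools` the same way the README imports other tools):

```python
import vision_agent.tools as T

image = T.load_image("street.png")
# exclusive categories: each object should match at most one label
dets = T.florence2_object_detection("person, car, bicycle", image)
# avoid overlapping labels like "person, athlete", which can label the same object twice
print(dets)
```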
@@ -681,7 +692,8 @@ def florence2_sam2_instance_segmentation(
     1.0.
 
     Parameters:
-        prompt (str): The prompt to ground to the image.
+        prompt (str): The prompt to ground to the image. Use exclusive categories that
+            do not overlap such as 'person, car' and NOT 'person, athlete'.
         image (np.ndarray): The image to ground the prompt to.
         fine_tune_id (Optional[str]): If you have a fine-tuned model, you can pass the
             fine-tuned model ID here to use it.
@@ -769,7 +781,8 @@ def florence2_sam2_video_tracking(
     is useful for tracking and counting without duplicating counts.
 
     Parameters:
-        prompt (str): The prompt to ground to the video.
+        prompt (str): The prompt to ground to the image. Use exclusive categories that
+            do not overlap such as 'person, car' and NOT 'person, athlete'.
         frames (List[np.ndarray]): The list of frames to ground the prompt to.
         chunk_length (Optional[int]): The number of frames to re-run florence2 to find
             new objects.
@@ -1679,7 +1692,7 @@ def video_temporal_localization(
     prompt: str,
     frames: List[np.ndarray],
     model: str = "qwen2vl",
-    chunk_length_frames: Optional[int] = 2,
+    chunk_length_frames: int = 2,
 ) -> List[float]:
     """'video_temporal_localization' will run qwen2vl on each chunk_length_frames
     value selected for the video. It can detect multiple objects independently per
@@ -1693,7 +1706,7 @@ def video_temporal_localization(
         frames (List[np.ndarray]): The reference frames used for the question
         model (str): The model to use for the inference. Valid values are
             'qwen2vl', 'gpt4o'.
-        chunk_length_frames (Optional[int]): length of each chunk in frames
+        chunk_length_frames (int): length of each chunk in frames
 
     Returns:
         List[float]: A list of floats with a value of 1.0 if the objects to be found
@@ -1712,8 +1725,7 @@ def video_temporal_localization(
         "model": model,
         "function_name": "video_temporal_localization",
     }
-    if chunk_length_frames is not None:
-        payload["chunk_length_frames"] = chunk_length_frames
+    payload["chunk_length_frames"] = chunk_length_frames
 
     data = send_inference_request(
         payload, "video-temporal-localization", files=files, v2=True
@@ -1724,7 +1736,13 @@ def video_temporal_localization(
         data,
         files,
     )
-    return [cast(float, value) for value in data]
+    chunked_data = [cast(float, value) for value in data]
+
+    full_data = []
+    for value in chunked_data:
+        full_data.extend([value] * chunk_length_frames)
+
+    return full_data[: len(frames)]
 
 
 def vit_image_classification(image: np.ndarray) -> Dict[str, Any]:
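`video_temporal_localization` now expands each chunk-level score to every frame in that chunk and truncates to the number of input frames, so the returned list lines up one-to-one with `frames`. A small worked example of that expansion (the scores and frame count are illustrative):

```python
chunk_length_frames = 2
frames = list(range(5))          # pretend we have 5 frames
chunked_data = [1.0, 0.0, 1.0]   # one score per chunk from the model

full_data = []
for value in chunked_data:
    # repeat the chunk score for every frame covered by that chunk
    full_data.extend([value] * chunk_length_frames)

# trim any overshoot from the last partial chunk
print(full_data[: len(frames)])  # [1.0, 1.0, 0.0, 0.0, 1.0]
```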
@@ -2148,7 +2166,7 @@ def siglip_classification(image: np.ndarray, labels: List[str]) -> Dict[str, Any
     return response
 
 
-# agentic od tools
+# Agentic OD Tools
 
 
 def _agentic_object_detection(
@@ -2644,7 +2662,7 @@ def save_image(image: np.ndarray, file_path: str) -> None:
 
 
 def save_video(
-    frames: List[np.ndarray], output_video_path: Optional[str] = None, fps: float = 1
+    frames: List[np.ndarray], output_video_path: Optional[str] = None, fps: float = 5
 ) -> str:
     """'save_video' is a utility function that saves a list of frames as a mp4 video file on disk.
 
vision_agent/utils/sim.py CHANGED
@@ -98,10 +98,12 @@ class Sim:
             raise ValueError("key is required if no column 'embs' is present.")
 
         if sim_key is not None:
-            self.df["embs"] = self.df[sim_key].apply(
-                lambda x: get_embedding(
-                    self.emb_call,
-                    x,
+            self.df = self.df.assign(
+                embs=self.df[sim_key].apply(
+                    lambda x: get_embedding(
+                        self.emb_call,
+                        x,
+                    )
                 )
             )
 
@@ -141,7 +143,9 @@ class Sim:
 
         df_load = pd.read_csv(load_dir / "df.csv")
         if platform.system() == "Windows":
-            df_load["doc"] = df_load["doc"].apply(lambda x: x.replace("\r", ""))
+            df_load = df_load.assign(
+                doc=df_load.doc.apply(lambda x: x.replace("\r", ""))
+            )
         return df.equals(df_load)  # type: ignore
 
     @lru_cache(maxsize=256)
@@ -166,7 +170,9 @@ class Sim:
             self.emb_call,
             query,
         )
-        self.df["sim"] = self.df.embs.apply(lambda x: 1 - cosine(x, embedding))
+        self.df = self.df.assign(
+            sim=self.df.embs.apply(lambda x: 1 - cosine(x, embedding))
+        )
         res = self.df.sort_values("sim", ascending=False).head(k)
         if thresh is not None:
             res = res[res.sim > thresh]
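These `sim.py` changes swap direct column assignment (`df["col"] = ...`) for `DataFrame.assign`, which returns a new frame instead of mutating one in place (a pattern that sidesteps pandas SettingWithCopyWarning when the frame is derived from another). A minimal sketch of the two styles on toy data:

```python
import pandas as pd

df = pd.DataFrame({"doc": ["alpha", "beta"]})

# in-place column assignment mutates df directly
df["doc_len"] = df["doc"].apply(len)

# assign returns a new DataFrame with the added column; rebinding the name
# keeps the update without touching whatever df was derived from
df = df.assign(doc_upper=df["doc"].apply(str.upper))
print(df)
```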
@@ -214,8 +220,13 @@ class AzureSim(Sim):
             raise ValueError("key is required if no column 'embs' is present.")
 
         if sim_key is not None:
-            self.df["embs"] = self.df[sim_key].apply(
-                lambda x: get_embedding(self.emb_call, x)
+            self.df = self.df.assign(
+                embs=self.df[sim_key].apply(
+                    lambda x: get_embedding(
+                        self.emb_call,
+                        x,
+                    )
+                )
             )
 
 
@@ -245,8 +256,13 @@ class OllamaSim(Sim):
             raise ValueError("key is required if no column 'embs' is present.")
 
         if sim_key is not None:
-            self.df["embs"] = self.df[sim_key].apply(
-                lambda x: get_embedding(emb_call, x)
+            self.df = self.df.assign(
+                embs=self.df[sim_key].apply(
+                    lambda x: get_embedding(
+                        self.emb_call,
+                        x,
+                    )
+                )
             )
 
 
@@ -267,8 +283,13 @@ class StellaSim(Sim):
             raise ValueError("key is required if no column 'embs' is present.")
 
         if sim_key is not None:
-            self.df["embs"] = self.df[sim_key].apply(
-                lambda x: get_embedding(emb_call, x)
+            self.df = self.df.assign(
+                embs=self.df[sim_key].apply(
+                    lambda x: get_embedding(
+                        self.emb_call,
+                        x,
+                    )
+                )
             )
 
     @staticmethod
vision_agent-0.2.231.dist-info/METADATA ADDED
@@ -0,0 +1,148 @@
+Metadata-Version: 2.1
+Name: vision-agent
+Version: 0.2.231
+Summary: Toolset for Vision Agent
+Author: Landing AI
+Author-email: dev@landing.ai
+Requires-Python: >=3.9,<4.0
+Classifier: Programming Language :: Python :: 3
+Classifier: Programming Language :: Python :: 3.9
+Classifier: Programming Language :: Python :: 3.10
+Classifier: Programming Language :: Python :: 3.11
+Requires-Dist: anthropic (>=0.31.0,<0.32.0)
+Requires-Dist: av (>=11.0.0,<12.0.0)
+Requires-Dist: e2b (>=0.17.2a50,<0.18.0)
+Requires-Dist: e2b-code-interpreter (==0.0.11a37)
+Requires-Dist: flake8 (>=7.0.0,<8.0.0)
+Requires-Dist: ipykernel (>=6.29.4,<7.0.0)
+Requires-Dist: langsmith (>=0.1.58,<0.2.0)
+Requires-Dist: libcst (>=1.5.0,<2.0.0)
+Requires-Dist: matplotlib (>=3.9.2,<4.0.0)
+Requires-Dist: nbclient (>=0.10.0,<0.11.0)
+Requires-Dist: nbformat (>=5.10.4,<6.0.0)
+Requires-Dist: numpy (>=1.21.0,<2.0.0)
+Requires-Dist: openai (>=1.0.0,<2.0.0)
+Requires-Dist: opencv-python (>=4.0.0,<5.0.0)
+Requires-Dist: opentelemetry-api (>=1.29.0,<2.0.0)
+Requires-Dist: pandas (>=2.0.0,<3.0.0)
+Requires-Dist: pillow (>=10.0.0,<11.0.0)
+Requires-Dist: pillow-heif (>=0.16.0,<0.17.0)
+Requires-Dist: pydantic (==2.7.4)
+Requires-Dist: pydantic-settings (>=2.2.1,<3.0.0)
+Requires-Dist: pytube (==15.0.0)
+Requires-Dist: requests (>=2.0.0,<3.0.0)
+Requires-Dist: rich (>=13.7.1,<14.0.0)
+Requires-Dist: scikit-learn (>=1.5.2,<2.0.0)
+Requires-Dist: scipy (>=1.13.0,<1.14.0)
+Requires-Dist: tabulate (>=0.9.0,<0.10.0)
+Requires-Dist: tenacity (>=8.3.0,<9.0.0)
+Requires-Dist: tqdm (>=4.64.0,<5.0.0)
+Requires-Dist: typing_extensions (>=4.0.0,<5.0.0)
+Project-URL: Homepage, https://landing.ai
+Project-URL: documentation, https://github.com/landing-ai/vision-agent
+Project-URL: repository, https://github.com/landing-ai/vision-agent
+Description-Content-Type: text/markdown
+
+<div align="center">
+<picture>
+<source media="(prefers-color-scheme: dark)" srcset="https://github.com/landing-ai/vision-agent/blob/main/assets/logo_light.svg?raw=true">
+<source media="(prefers-color-scheme: light)" srcset="https://github.com/landing-ai/vision-agent/blob/main/assets/logo_dark.svg?raw=true">
+<img alt="VisionAgent" height="200px" src="https://github.com/landing-ai/vision-agent/blob/main/assets/logo_light.svg?raw=true">
+</picture>
+
+[![](https://dcbadge.vercel.app/api/server/wPdN8RCYew?compact=true&style=flat)](https://discord.gg/wPdN8RCYew)
+![ci_status](https://github.com/landing-ai/vision-agent/actions/workflows/ci_cd.yml/badge.svg)
+[![PyPI version](https://badge.fury.io/py/vision-agent.svg)](https://badge.fury.io/py/vision-agent)
+![version](https://img.shields.io/pypi/pyversions/vision-agent)
+</div>
+
+## VisionAgent
+VisionAgent is a library that helps you utilize agent frameworks to generate code to
+solve your vision task. Check out our discord for updates and roadmaps! The fastest
+way to test out VisionAgent is to use our web application which you can find [here](https://va.landing.ai/).
+
+## Installation
+```bash
+pip install vision-agent
+```
+
+```bash
+export ANTHROPIC_API_KEY="your-api-key"
+export OPENAI_API_KEY="your-api-key"
+```
+
+> **_NOTE:_** We found using both Anthropic Claude-3.5 and OpenAI o1 to be provide the best performance for VisionAgent. If you want to use a different LLM provider or only one, see 'Using Other LLM Providers' below.
+
+## Documentation
+
+[VisionAgent Library Docs](https://landing-ai.github.io/vision-agent/)
+
+## Examples
+### Counting cans in an image
+You can run VisionAgent in a local Jupyter Notebook [Counting cans in an image](https://github.com/landing-ai/vision-agent/blob/main/examples/notebooks/counting_cans.ipynb)
+
+### Generating code
+You can use VisionAgent to generate code to count the number of people in an image:
+```python
+from vision_agent.agent import VisionAgentCoderV2
+from vision_agent.agent.types import AgentMessage
+
+agent = VisionAgentCoderV2(verbose=True)
+code_context = agent.generate_code(
+    [
+        AgentMessage(
+            role="user",
+            content="Count the number of people in this image",
+            media=["people.png"]
+        )
+    ]
+)
+
+with open("generated_code.py", "w") as f:
+    f.write(code_context.code + "\n" + code_context.test)
+```
+
+### Using the tools directly
+VisionAgent produces code that utilizes our tools. You can also use the tools directly.
+For example if you wanted to detect people in an image and visualize the results:
+```python
+import vision_agent.tools as T
+import matplotlib.pyplot as plt
+
+image = T.load_image("people.png")
+dets = T.countgd_object_detection("person", image)
+# visualize the countgd bounding boxes on the image
+viz = T.overlay_bounding_boxes(image, dets)
+
+# save the visualization to a file
+T.save_image(viz, "people_detected.png")
+
+# display the visualization
+plt.imshow(viz)
+plt.show()
+```
+
+You can also use the tools for running on video files:
+```python
+import vision_agent.tools as T
+
+frames_and_ts = T.extract_frames_and_timestamps("people.mp4")
+# extract the frames from the frames_and_ts list
+frames = [f["frame"] for f in frames_and_ts]
+
+# run the countgd tracking on the frames
+tracks = T.countgd_sam2_video_tracking("person", frames)
+# visualize the countgd tracking results on the frames and save the video
+viz = T.overlay_segmentation_masks(frames, tracks)
+T.save_video(viz, "people_detected.mp4")
+```
+
+## Using Other LLM Providers
+You can use other LLM providers by changing `config.py` in the `vision_agent/configs`
+directory. For example to change to Anthropic simply just run:
+```bash
+cp vision_agent/configs/anthropic_config.py vision_agent/configs/config.py
+```
+
+> **_NOTE:_** VisionAgent moves fast and we are constantly updating and changing the library. If you have any questions or need help, please reach out to us on our discord channel.
+
vision_agent-0.2.231.dist-info/RECORD ADDED
@@ -0,0 +1,52 @@
+vision_agent/.sim_tools/df.csv,sha256=XdcgkjC7CjF_CoJnXmFkYOPUBwHemiwsauh62b1eh1M,42472
+vision_agent/.sim_tools/embs.npy,sha256=YJe8EcKVNmeX_75CS2T1sbY-sUS_1HQAMT-34zc18a0,254080
+vision_agent/__init__.py,sha256=EAb4-f9iyuEYkBrX4ag1syM8Syx8118_t0R6_C34M9w,57
+vision_agent/agent/README.md,sha256=Q4w7FWw38qaWosQYAZ7NqWx8Q5XzuWrlv7nLhjUd1-8,5527
+vision_agent/agent/__init__.py,sha256=M8CffavdIh8Zh-skznLHIaQkYGCGK7vk4dq1FaVkbs4,617
+vision_agent/agent/agent.py,sha256=_1tHWAs7Jm5tqDzEcPfCRvJV3uRRveyh4n9_9pd6I1w,1565
+vision_agent/agent/agent_utils.py,sha256=IXxN9XruaeNTreUrdztb3kWJhimpsdH6hjv6xT4jg1Q,14062
+vision_agent/agent/types.py,sha256=dIdxATH_PP76pD5Wfo0oofWt6iPQh0vpf48QbEQSzhs,2472
+vision_agent/agent/vision_agent.py,sha256=fH9NOLk7twL1fPr9vLSqkaYhah-gfDWfTOVF2FfMyzI,23461
+vision_agent/agent/vision_agent_coder.py,sha256=flUxOibyGZK19BCSK5mhaD3HjCxHw6c6FtKom6N2q1E,27359
+vision_agent/agent/vision_agent_coder_prompts.py,sha256=_kkPLezUVnBXieNPlxMQab_6J6P7F-aa6ItF5NhZZsM,12281
+vision_agent/agent/vision_agent_coder_prompts_v2.py,sha256=idmSMfxebPULqqvllz3gqRzGDchEvS5dkGngvBs4PGo,4872
+vision_agent/agent/vision_agent_coder_v2.py,sha256=ZR2PQoMqNM6yK3vn_0rrCJf_EplRKye7t7bVjyl51ls,16476
+vision_agent/agent/vision_agent_planner.py,sha256=fFzjNkZBKkh8Y_oS06ATI4qz31xmIJvixb_tV1kX8KA,18590
+vision_agent/agent/vision_agent_planner_prompts.py,sha256=rYRdJthc-sQN57VgCBKrF09Sd73BSxcBdjNe6C4WNZ8,6837
+vision_agent/agent/vision_agent_planner_prompts_v2.py,sha256=5xTx93lNpoyT4eAD9jicwDyDAkuW7eQqicr17zCjrQw,33337
+vision_agent/agent/vision_agent_planner_v2.py,sha256=7hBQdg9y4oCLDiQ54Kh12_uIMywedKKNPWiKPRA01cQ,20568
+vision_agent/agent/vision_agent_prompts.py,sha256=KaJwYPUP7_GvQsCPPs6Fdawmi3AQWmWajBUuzj7gTG4,13812
+vision_agent/agent/vision_agent_prompts_v2.py,sha256=AW_bW1boGiCLyLFd3h4GQenfDACttQagDHwpBkSW4Xo,2518
+vision_agent/agent/vision_agent_v2.py,sha256=335VT0hk0jkB14y4W3cJo5ueEu1wY_jjN-R_m2xaQ30,10752
+vision_agent/clients/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
+vision_agent/clients/http.py,sha256=k883i6M_4nl7zwwHSI-yP5sAgQZIDPM1nrKD6YFJ3Xs,2009
+vision_agent/clients/landing_public_api.py,sha256=lU2ev6E8NICmR8DMUljuGcVFy5VNJQ4WQkWC8WnnJEc,1503
+vision_agent/configs/__init__.py,sha256=Iu75-w9_nlPmnB_qKA7nYaaaHf7xtTrDmK8N4v2WV34,27
+vision_agent/configs/anthropic_config.py,sha256=T1UuESgiY8913A6wA42P7-cg8FTk9-LkJpyywo7OnIQ,4298
+vision_agent/configs/anthropic_openai_config.py,sha256=YQjFxmlxppn5L55dJjK_v1myBJQ_V5J4q25pmUtwTOU,4310
+vision_agent/configs/config.py,sha256=YQjFxmlxppn5L55dJjK_v1myBJQ_V5J4q25pmUtwTOU,4310
+vision_agent/configs/openai_config.py,sha256=v2_AIY89d7LKWn4uqA2G047U2IdmnqZrGH2Iww9gRIw,4498
+vision_agent/fonts/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
+vision_agent/fonts/default_font_ch_en.ttf,sha256=1YM0Z3XqLDjSNbF7ihQFSAIUdjF9m1rtHiNC_6QosTE,1594400
+vision_agent/lmm/__init__.py,sha256=xk2Rn8Zgpy2xwYaOGHzy4tXxnxo2aj6SkpNjeJ8yxcY,111
+vision_agent/lmm/lmm.py,sha256=arwfYPWme_RxCxSpEQ0ZkpHO22GFPCwVeoSvXqLPOAk,19288
+vision_agent/lmm/types.py,sha256=ZEXR_ptBL0ZwDMTDYkgxUCmSZFmBYPQd2jreNzr_8UY,221
+vision_agent/tools/__init__.py,sha256=zopUrANPx7p0NGy6BxmEaYhDrj8DX8w7BLfgmCbz-mU,2897
+vision_agent/tools/meta_tools.py,sha256=TPeS7QWnc_PmmU_ndiDT03dXbQ5yDSP33E7U8cSj7Ls,28660
+vision_agent/tools/planner_tools.py,sha256=Mk3N-I-Qs4ezeyv8EL9BxdxmJG5oWiH5bFkvgwJKB0s,14660
+vision_agent/tools/prompts.py,sha256=V1z4YJLXZuUl_iZ5rY0M5hHc_2tmMEUKr0WocXKGt4E,1430
+vision_agent/tools/tool_utils.py,sha256=xJRWF96Ge9RvhhVHrOtifjUYoc4HIJ2y7c2VOQ2Lp8s,10152
+vision_agent/tools/tools.py,sha256=3B3xWFVA3qfAO6ySSQ2yUPUAiTrgJomL48hLO_VP6RQ,106015
+vision_agent/tools/tools_types.py,sha256=8hYf2OZhI58gvf65KGaeGkt4EQ56nwLFqIQDPHioOBc,2339
+vision_agent/utils/__init__.py,sha256=QKk4zVjMwGxQI0MQ-aZZA50N-qItxRY4EB9CwQkZ2HY,185
+vision_agent/utils/exceptions.py,sha256=booSPSuoULF7OXRr_YbC4dtKt6gM_HyiFQHBuaW86C4,2052
+vision_agent/utils/execute.py,sha256=vOEP5Ys7S2lc0_7pOJbgk7OaWi85hrCNu9_8Bo3zk6I,29356
+vision_agent/utils/image_utils.py,sha256=z_ONgcza125B10NkoGwPOzXnL470bpTWZbkB16NeeH0,12188
+vision_agent/utils/sim.py,sha256=DYya76dYVtifFyXilMLxBzGgyfyeqhEwU4RJ4894lCI,9796
+vision_agent/utils/type_defs.py,sha256=BE12s3JNQy36QvauXHjwyeffVh5enfcvd4vTzSwvEZI,1384
+vision_agent/utils/video.py,sha256=e1VwKhXzzlC5LcFMyrcQYrPnpnX4wxDpnQ-76sB4jgM,6001
+vision_agent/utils/video_tracking.py,sha256=wK5dOutqV2t2aeaxedstCBa7xy-NNQE0-QZqKu1QUds,9498
+vision_agent-0.2.231.dist-info/LICENSE,sha256=xx0jnfkXJvxRnG63LTGOxlggYnIysveWIZ6H3PNdCrQ,11357
+vision_agent-0.2.231.dist-info/METADATA,sha256=N8t9F4hZ4bgyZeDhrVepMZzO5dtRmzRB8VI6fq1fFAA,5760
+vision_agent-0.2.231.dist-info/WHEEL,sha256=7Z8_27uaHI_UZAc4Uox4PpBhQ9Y5_modZXWMxtUi4NU,88
+vision_agent-0.2.231.dist-info/RECORD,,