vision-agent 0.2.104__tar.gz → 0.2.106__tar.gz
Sign up to get free protection for your applications and to get access to all the features.
- {vision_agent-0.2.104 → vision_agent-0.2.106}/PKG-INFO +1 -1
- {vision_agent-0.2.104 → vision_agent-0.2.106}/pyproject.toml +1 -1
- {vision_agent-0.2.104 → vision_agent-0.2.106}/vision_agent/tools/tools.py +5 -4
- {vision_agent-0.2.104 → vision_agent-0.2.106}/LICENSE +0 -0
- {vision_agent-0.2.104 → vision_agent-0.2.106}/README.md +0 -0
- {vision_agent-0.2.104 → vision_agent-0.2.106}/vision_agent/__init__.py +0 -0
- {vision_agent-0.2.104 → vision_agent-0.2.106}/vision_agent/agent/__init__.py +0 -0
- {vision_agent-0.2.104 → vision_agent-0.2.106}/vision_agent/agent/agent.py +0 -0
- {vision_agent-0.2.104 → vision_agent-0.2.106}/vision_agent/agent/agent_utils.py +0 -0
- {vision_agent-0.2.104 → vision_agent-0.2.106}/vision_agent/agent/vision_agent.py +0 -0
- {vision_agent-0.2.104 → vision_agent-0.2.106}/vision_agent/agent/vision_agent_coder.py +0 -0
- {vision_agent-0.2.104 → vision_agent-0.2.106}/vision_agent/agent/vision_agent_coder_prompts.py +0 -0
- {vision_agent-0.2.104 → vision_agent-0.2.106}/vision_agent/agent/vision_agent_prompts.py +0 -0
- {vision_agent-0.2.104 → vision_agent-0.2.106}/vision_agent/clients/__init__.py +0 -0
- {vision_agent-0.2.104 → vision_agent-0.2.106}/vision_agent/clients/http.py +0 -0
- {vision_agent-0.2.104 → vision_agent-0.2.106}/vision_agent/clients/landing_public_api.py +0 -0
- {vision_agent-0.2.104 → vision_agent-0.2.106}/vision_agent/fonts/__init__.py +0 -0
- {vision_agent-0.2.104 → vision_agent-0.2.106}/vision_agent/fonts/default_font_ch_en.ttf +0 -0
- {vision_agent-0.2.104 → vision_agent-0.2.106}/vision_agent/lmm/__init__.py +0 -0
- {vision_agent-0.2.104 → vision_agent-0.2.106}/vision_agent/lmm/lmm.py +0 -0
- {vision_agent-0.2.104 → vision_agent-0.2.106}/vision_agent/lmm/types.py +0 -0
- {vision_agent-0.2.104 → vision_agent-0.2.106}/vision_agent/tools/__init__.py +0 -0
- {vision_agent-0.2.104 → vision_agent-0.2.106}/vision_agent/tools/meta_tools.py +0 -0
- {vision_agent-0.2.104 → vision_agent-0.2.106}/vision_agent/tools/meta_tools_types.py +0 -0
- {vision_agent-0.2.104 → vision_agent-0.2.106}/vision_agent/tools/prompts.py +0 -0
- {vision_agent-0.2.104 → vision_agent-0.2.106}/vision_agent/tools/tool_utils.py +0 -0
- {vision_agent-0.2.104 → vision_agent-0.2.106}/vision_agent/utils/__init__.py +0 -0
- {vision_agent-0.2.104 → vision_agent-0.2.106}/vision_agent/utils/exceptions.py +0 -0
- {vision_agent-0.2.104 → vision_agent-0.2.106}/vision_agent/utils/execute.py +0 -0
- {vision_agent-0.2.104 → vision_agent-0.2.106}/vision_agent/utils/image_utils.py +0 -0
- {vision_agent-0.2.104 → vision_agent-0.2.106}/vision_agent/utils/sim.py +0 -0
- {vision_agent-0.2.104 → vision_agent-0.2.106}/vision_agent/utils/type_defs.py +0 -0
- {vision_agent-0.2.104 → vision_agent-0.2.106}/vision_agent/utils/video.py +0 -0
@@ -148,7 +148,7 @@ def owl_v2(
|
|
148
148
|
|
149
149
|
Example
|
150
150
|
-------
|
151
|
-
>>> owl_v2("car
|
151
|
+
>>> owl_v2("car, dinosaur", image)
|
152
152
|
[
|
153
153
|
{'score': 0.99, 'label': 'dinosaur', 'bbox': [0.1, 0.11, 0.35, 0.4]},
|
154
154
|
{'score': 0.98, 'label': 'car', 'bbox': [0.2, 0.21, 0.45, 0.5]},
|
@@ -157,7 +157,7 @@ def owl_v2(
|
|
157
157
|
image_size = image.shape[:2]
|
158
158
|
image_b64 = convert_to_b64(image)
|
159
159
|
request_data = {
|
160
|
-
"prompts": prompt.split("
|
160
|
+
"prompts": prompt.split(","),
|
161
161
|
"image": image_b64,
|
162
162
|
"confidence": box_threshold,
|
163
163
|
"function_name": "owl_v2",
|
@@ -607,12 +607,13 @@ def florencev2_image_caption(image: np.ndarray, detail_caption: bool = True) ->
|
|
607
607
|
return answer[task] # type: ignore
|
608
608
|
|
609
609
|
|
610
|
-
def florencev2_object_detection(image: np.ndarray
|
610
|
+
def florencev2_object_detection(prompt: str, image: np.ndarray) -> List[Dict[str, Any]]:
|
611
611
|
"""'florencev2_object_detection' is a tool that can detect objects given a text
|
612
612
|
prompt such as a phrase or class names separated by commas. It returns a list of
|
613
613
|
detected objects as labels and their location as bounding boxes with score of 1.0.
|
614
614
|
|
615
615
|
Parameters:
|
616
|
+
prompt (str): The prompt to ground to the image.
|
616
617
|
image (np.ndarray): The image used to detect objects.
|
617
618
|
|
618
619
|
Returns:
|
@@ -624,7 +625,7 @@ def florencev2_object_detection(image: np.ndarray, prompt: str) -> List[Dict[str
|
|
624
625
|
|
625
626
|
Example
|
626
627
|
-------
|
627
|
-
>>> florencev2_object_detection(
|
628
|
+
>>> florencev2_object_detection('person looking at a coyote', image)
|
628
629
|
[
|
629
630
|
{'score': 1.0, 'label': 'person', 'bbox': [0.1, 0.11, 0.35, 0.4]},
|
630
631
|
{'score': 1.0, 'label': 'coyote', 'bbox': [0.34, 0.21, 0.85, 0.5]},
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
{vision_agent-0.2.104 → vision_agent-0.2.106}/vision_agent/agent/vision_agent_coder_prompts.py
RENAMED
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|