vision-agent 0.2.104__tar.gz → 0.2.106__tar.gz

Sign up to get free protection for your applications and to get access to all the features.
Files changed (33) hide show
  1. {vision_agent-0.2.104 → vision_agent-0.2.106}/PKG-INFO +1 -1
  2. {vision_agent-0.2.104 → vision_agent-0.2.106}/pyproject.toml +1 -1
  3. {vision_agent-0.2.104 → vision_agent-0.2.106}/vision_agent/tools/tools.py +5 -4
  4. {vision_agent-0.2.104 → vision_agent-0.2.106}/LICENSE +0 -0
  5. {vision_agent-0.2.104 → vision_agent-0.2.106}/README.md +0 -0
  6. {vision_agent-0.2.104 → vision_agent-0.2.106}/vision_agent/__init__.py +0 -0
  7. {vision_agent-0.2.104 → vision_agent-0.2.106}/vision_agent/agent/__init__.py +0 -0
  8. {vision_agent-0.2.104 → vision_agent-0.2.106}/vision_agent/agent/agent.py +0 -0
  9. {vision_agent-0.2.104 → vision_agent-0.2.106}/vision_agent/agent/agent_utils.py +0 -0
  10. {vision_agent-0.2.104 → vision_agent-0.2.106}/vision_agent/agent/vision_agent.py +0 -0
  11. {vision_agent-0.2.104 → vision_agent-0.2.106}/vision_agent/agent/vision_agent_coder.py +0 -0
  12. {vision_agent-0.2.104 → vision_agent-0.2.106}/vision_agent/agent/vision_agent_coder_prompts.py +0 -0
  13. {vision_agent-0.2.104 → vision_agent-0.2.106}/vision_agent/agent/vision_agent_prompts.py +0 -0
  14. {vision_agent-0.2.104 → vision_agent-0.2.106}/vision_agent/clients/__init__.py +0 -0
  15. {vision_agent-0.2.104 → vision_agent-0.2.106}/vision_agent/clients/http.py +0 -0
  16. {vision_agent-0.2.104 → vision_agent-0.2.106}/vision_agent/clients/landing_public_api.py +0 -0
  17. {vision_agent-0.2.104 → vision_agent-0.2.106}/vision_agent/fonts/__init__.py +0 -0
  18. {vision_agent-0.2.104 → vision_agent-0.2.106}/vision_agent/fonts/default_font_ch_en.ttf +0 -0
  19. {vision_agent-0.2.104 → vision_agent-0.2.106}/vision_agent/lmm/__init__.py +0 -0
  20. {vision_agent-0.2.104 → vision_agent-0.2.106}/vision_agent/lmm/lmm.py +0 -0
  21. {vision_agent-0.2.104 → vision_agent-0.2.106}/vision_agent/lmm/types.py +0 -0
  22. {vision_agent-0.2.104 → vision_agent-0.2.106}/vision_agent/tools/__init__.py +0 -0
  23. {vision_agent-0.2.104 → vision_agent-0.2.106}/vision_agent/tools/meta_tools.py +0 -0
  24. {vision_agent-0.2.104 → vision_agent-0.2.106}/vision_agent/tools/meta_tools_types.py +0 -0
  25. {vision_agent-0.2.104 → vision_agent-0.2.106}/vision_agent/tools/prompts.py +0 -0
  26. {vision_agent-0.2.104 → vision_agent-0.2.106}/vision_agent/tools/tool_utils.py +0 -0
  27. {vision_agent-0.2.104 → vision_agent-0.2.106}/vision_agent/utils/__init__.py +0 -0
  28. {vision_agent-0.2.104 → vision_agent-0.2.106}/vision_agent/utils/exceptions.py +0 -0
  29. {vision_agent-0.2.104 → vision_agent-0.2.106}/vision_agent/utils/execute.py +0 -0
  30. {vision_agent-0.2.104 → vision_agent-0.2.106}/vision_agent/utils/image_utils.py +0 -0
  31. {vision_agent-0.2.104 → vision_agent-0.2.106}/vision_agent/utils/sim.py +0 -0
  32. {vision_agent-0.2.104 → vision_agent-0.2.106}/vision_agent/utils/type_defs.py +0 -0
  33. {vision_agent-0.2.104 → vision_agent-0.2.106}/vision_agent/utils/video.py +0 -0
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.1
2
2
  Name: vision-agent
3
- Version: 0.2.104
3
+ Version: 0.2.106
4
4
  Summary: Toolset for Vision Agent
5
5
  Author: Landing AI
6
6
  Author-email: dev@landing.ai
@@ -4,7 +4,7 @@ build-backend = "poetry.core.masonry.api"
4
4
 
5
5
  [tool.poetry]
6
6
  name = "vision-agent"
7
- version = "0.2.104"
7
+ version = "0.2.106"
8
8
  description = "Toolset for Vision Agent"
9
9
  authors = ["Landing AI <dev@landing.ai>"]
10
10
  readme = "README.md"
@@ -148,7 +148,7 @@ def owl_v2(
148
148
 
149
149
  Example
150
150
  -------
151
- >>> owl_v2("car. dinosaur", image)
151
+ >>> owl_v2("car, dinosaur", image)
152
152
  [
153
153
  {'score': 0.99, 'label': 'dinosaur', 'bbox': [0.1, 0.11, 0.35, 0.4]},
154
154
  {'score': 0.98, 'label': 'car', 'bbox': [0.2, 0.21, 0.45, 0.5]},
@@ -157,7 +157,7 @@ def owl_v2(
157
157
  image_size = image.shape[:2]
158
158
  image_b64 = convert_to_b64(image)
159
159
  request_data = {
160
- "prompts": prompt.split("."),
160
+ "prompts": prompt.split(","),
161
161
  "image": image_b64,
162
162
  "confidence": box_threshold,
163
163
  "function_name": "owl_v2",
@@ -607,12 +607,13 @@ def florencev2_image_caption(image: np.ndarray, detail_caption: bool = True) ->
607
607
  return answer[task] # type: ignore
608
608
 
609
609
 
610
- def florencev2_object_detection(image: np.ndarray, prompt: str) -> List[Dict[str, Any]]:
610
+ def florencev2_object_detection(prompt: str, image: np.ndarray) -> List[Dict[str, Any]]:
611
611
  """'florencev2_object_detection' is a tool that can detect objects given a text
612
612
  prompt such as a phrase or class names separated by commas. It returns a list of
613
613
  detected objects as labels and their location as bounding boxes with score of 1.0.
614
614
 
615
615
  Parameters:
616
+ prompt (str): The prompt to ground to the image.
616
617
  image (np.ndarray): The image used to detect objects
617
618
 
618
619
  Returns:
@@ -624,7 +625,7 @@ def florencev2_object_detection(image: np.ndarray, prompt: str) -> List[Dict[str
624
625
 
625
626
  Example
626
627
  -------
627
- >>> florencev2_object_detection(image, 'person looking at a coyote')
628
+ >>> florencev2_object_detection('person looking at a coyote', image)
628
629
  [
629
630
  {'score': 1.0, 'label': 'person', 'bbox': [0.1, 0.11, 0.35, 0.4]},
630
631
  {'score': 1.0, 'label': 'coyote', 'bbox': [0.34, 0.21, 0.85, 0.5]},
File without changes
File without changes