vision-agent 0.2.145__tar.gz → 0.2.146__tar.gz

Sign up to get free protection for your applications and to get access to all the features.
Files changed (33) hide show
  1. {vision_agent-0.2.145 → vision_agent-0.2.146}/PKG-INFO +1 -1
  2. {vision_agent-0.2.145 → vision_agent-0.2.146}/pyproject.toml +1 -1
  3. {vision_agent-0.2.145 → vision_agent-0.2.146}/vision_agent/tools/tools.py +48 -31
  4. {vision_agent-0.2.145 → vision_agent-0.2.146}/LICENSE +0 -0
  5. {vision_agent-0.2.145 → vision_agent-0.2.146}/README.md +0 -0
  6. {vision_agent-0.2.145 → vision_agent-0.2.146}/vision_agent/__init__.py +0 -0
  7. {vision_agent-0.2.145 → vision_agent-0.2.146}/vision_agent/agent/__init__.py +0 -0
  8. {vision_agent-0.2.145 → vision_agent-0.2.146}/vision_agent/agent/agent.py +0 -0
  9. {vision_agent-0.2.145 → vision_agent-0.2.146}/vision_agent/agent/agent_utils.py +0 -0
  10. {vision_agent-0.2.145 → vision_agent-0.2.146}/vision_agent/agent/vision_agent.py +0 -0
  11. {vision_agent-0.2.145 → vision_agent-0.2.146}/vision_agent/agent/vision_agent_coder.py +0 -0
  12. {vision_agent-0.2.145 → vision_agent-0.2.146}/vision_agent/agent/vision_agent_coder_prompts.py +0 -0
  13. {vision_agent-0.2.145 → vision_agent-0.2.146}/vision_agent/agent/vision_agent_prompts.py +0 -0
  14. {vision_agent-0.2.145 → vision_agent-0.2.146}/vision_agent/clients/__init__.py +0 -0
  15. {vision_agent-0.2.145 → vision_agent-0.2.146}/vision_agent/clients/http.py +0 -0
  16. {vision_agent-0.2.145 → vision_agent-0.2.146}/vision_agent/clients/landing_public_api.py +0 -0
  17. {vision_agent-0.2.145 → vision_agent-0.2.146}/vision_agent/fonts/__init__.py +0 -0
  18. {vision_agent-0.2.145 → vision_agent-0.2.146}/vision_agent/fonts/default_font_ch_en.ttf +0 -0
  19. {vision_agent-0.2.145 → vision_agent-0.2.146}/vision_agent/lmm/__init__.py +0 -0
  20. {vision_agent-0.2.145 → vision_agent-0.2.146}/vision_agent/lmm/lmm.py +0 -0
  21. {vision_agent-0.2.145 → vision_agent-0.2.146}/vision_agent/lmm/types.py +0 -0
  22. {vision_agent-0.2.145 → vision_agent-0.2.146}/vision_agent/tools/__init__.py +0 -0
  23. {vision_agent-0.2.145 → vision_agent-0.2.146}/vision_agent/tools/meta_tools.py +0 -0
  24. {vision_agent-0.2.145 → vision_agent-0.2.146}/vision_agent/tools/prompts.py +0 -0
  25. {vision_agent-0.2.145 → vision_agent-0.2.146}/vision_agent/tools/tool_utils.py +0 -0
  26. {vision_agent-0.2.145 → vision_agent-0.2.146}/vision_agent/tools/tools_types.py +0 -0
  27. {vision_agent-0.2.145 → vision_agent-0.2.146}/vision_agent/utils/__init__.py +0 -0
  28. {vision_agent-0.2.145 → vision_agent-0.2.146}/vision_agent/utils/exceptions.py +0 -0
  29. {vision_agent-0.2.145 → vision_agent-0.2.146}/vision_agent/utils/execute.py +0 -0
  30. {vision_agent-0.2.145 → vision_agent-0.2.146}/vision_agent/utils/image_utils.py +0 -0
  31. {vision_agent-0.2.145 → vision_agent-0.2.146}/vision_agent/utils/sim.py +0 -0
  32. {vision_agent-0.2.145 → vision_agent-0.2.146}/vision_agent/utils/type_defs.py +0 -0
  33. {vision_agent-0.2.145 → vision_agent-0.2.146}/vision_agent/utils/video.py +0 -0
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.1
2
2
  Name: vision-agent
3
- Version: 0.2.145
3
+ Version: 0.2.146
4
4
  Summary: Toolset for Vision Agent
5
5
  Author: Landing AI
6
6
  Author-email: dev@landing.ai
@@ -4,7 +4,7 @@ build-backend = "poetry.core.masonry.api"
4
4
 
5
5
  [tool.poetry]
6
6
  name = "vision-agent"
7
- version = "0.2.145"
7
+ version = "0.2.146"
8
8
  description = "Toolset for Vision Agent"
9
9
  authors = ["Landing AI <dev@landing.ai>"]
10
10
  readme = "README.md"
@@ -1759,14 +1759,17 @@ def _save_video_to_result(video_uri: str) -> None:
1759
1759
 
1760
1760
 
1761
1761
  def overlay_bounding_boxes(
1762
- image: np.ndarray, bboxes: List[Dict[str, Any]]
1763
- ) -> np.ndarray:
1762
+ medias: Union[np.ndarray, List[np.ndarray]],
1763
+ bboxes: Union[List[Dict[str, Any]], List[List[Dict[str, Any]]]],
1764
+ ) -> Union[np.ndarray, List[np.ndarray]]:
1764
1765
  """'overlay_bounding_boxes' is a utility function that displays bounding boxes on
1765
1766
  an image.
1766
1767
 
1767
1768
  Parameters:
1768
- image (np.ndarray): The image to display the bounding boxes on.
1769
- bboxes (List[Dict[str, Any]]): A list of dictionaries containing the bounding
1769
+ medias (Union[np.ndarray, List[np.ndarra]]): The image or frames to display the
1770
+ bounding boxes on.
1771
+ bboxes (Union[List[Dict[str, Any]], List[List[Dict[str, Any]]]]): A list of
1772
+ dictionaries or a list of list of dictionaries containing the bounding
1770
1773
  boxes.
1771
1774
 
1772
1775
  Returns:
@@ -1778,41 +1781,54 @@ def overlay_bounding_boxes(
1778
1781
  image, [{'score': 0.99, 'label': 'dinosaur', 'bbox': [0.1, 0.11, 0.35, 0.4]}],
1779
1782
  )
1780
1783
  """
1781
- pil_image = Image.fromarray(image.astype(np.uint8)).convert("RGB")
1782
1784
 
1783
- if len(set([box["label"] for box in bboxes])) > len(COLORS):
1785
+ medias_int: List[np.ndarray] = (
1786
+ [medias] if isinstance(medias, np.ndarray) else medias
1787
+ )
1788
+ bbox_int = [bboxes] if isinstance(bboxes[0], dict) else bboxes
1789
+ bbox_int = cast(List[List[Dict[str, Any]]], bbox_int)
1790
+ labels = set([bb["label"] for b in bbox_int for bb in b])
1791
+
1792
+ if len(labels) > len(COLORS):
1784
1793
  _LOGGER.warning(
1785
1794
  "Number of unique labels exceeds the number of available colors. Some labels may have the same color."
1786
1795
  )
1787
1796
 
1788
- color = {
1789
- label: COLORS[i % len(COLORS)]
1790
- for i, label in enumerate(set([box["label"] for box in bboxes]))
1791
- }
1792
- bboxes = sorted(bboxes, key=lambda x: x["label"], reverse=True)
1797
+ color = {label: COLORS[i % len(COLORS)] for i, label in enumerate(labels)}
1793
1798
 
1794
- width, height = pil_image.size
1795
- fontsize = max(12, int(min(width, height) / 40))
1796
- draw = ImageDraw.Draw(pil_image)
1797
- font = ImageFont.truetype(
1798
- str(resources.files("vision_agent.fonts").joinpath("default_font_ch_en.ttf")),
1799
- fontsize,
1800
- )
1799
+ frame_out = []
1800
+ for i, frame in enumerate(medias_int):
1801
+ pil_image = Image.fromarray(frame.astype(np.uint8)).convert("RGB")
1801
1802
 
1802
- for elt in bboxes:
1803
- label = elt["label"]
1804
- box = elt["bbox"]
1805
- scores = elt["score"]
1803
+ bboxes = bbox_int[i]
1804
+ bboxes = sorted(bboxes, key=lambda x: x["label"], reverse=True)
1806
1805
 
1807
- # denormalize the box if it is normalized
1808
- box = denormalize_bbox(box, (height, width))
1806
+ width, height = pil_image.size
1807
+ fontsize = max(12, int(min(width, height) / 40))
1808
+ draw = ImageDraw.Draw(pil_image)
1809
+ font = ImageFont.truetype(
1810
+ str(
1811
+ resources.files("vision_agent.fonts").joinpath("default_font_ch_en.ttf")
1812
+ ),
1813
+ fontsize,
1814
+ )
1809
1815
 
1810
- draw.rectangle(box, outline=color[label], width=4)
1811
- text = f"{label}: {scores:.2f}"
1812
- text_box = draw.textbbox((box[0], box[1]), text=text, font=font)
1813
- draw.rectangle((box[0], box[1], text_box[2], text_box[3]), fill=color[label])
1814
- draw.text((box[0], box[1]), text, fill="black", font=font)
1815
- return np.array(pil_image)
1816
+ for elt in bboxes:
1817
+ label = elt["label"]
1818
+ box = elt["bbox"]
1819
+ scores = elt["score"]
1820
+
1821
+ # denormalize the box if it is normalized
1822
+ box = denormalize_bbox(box, (height, width))
1823
+ draw.rectangle(box, outline=color[label], width=4)
1824
+ text = f"{label}: {scores:.2f}"
1825
+ text_box = draw.textbbox((box[0], box[1]), text=text, font=font)
1826
+ draw.rectangle(
1827
+ (box[0], box[1], text_box[2], text_box[3]), fill=color[label]
1828
+ )
1829
+ draw.text((box[0], box[1]), text, fill="black", font=font)
1830
+ frame_out.append(np.array(pil_image))
1831
+ return frame_out[0] if len(frame_out) == 1 else frame_out
1816
1832
 
1817
1833
 
1818
1834
  def _get_text_coords_from_mask(
@@ -1852,7 +1868,8 @@ def overlay_segmentation_masks(
1852
1868
  medias (Union[np.ndarray, List[np.ndarray]]): The image or frames to display
1853
1869
  the masks on.
1854
1870
  masks (Union[List[Dict[str, Any]], List[List[Dict[str, Any]]]]): A list of
1855
- dictionaries containing the masks, labels and scores.
1871
+ dictionaries or a list of list of dictionaries containing the masks, labels
1872
+ and scores.
1856
1873
  draw_label (bool, optional): If True, the labels will be displayed on the image.
1857
1874
  secondary_label_key (str, optional): The key to use for the secondary
1858
1875
  tracking label which is needed in videos to display tracking information.
File without changes
File without changes