vision-agent 0.2.188__tar.gz → 0.2.190__tar.gz

Sign up to get free protection for your applications and to get access to all the features.
Files changed (35) hide show
  1. {vision_agent-0.2.188 → vision_agent-0.2.190}/PKG-INFO +1 -1
  2. {vision_agent-0.2.188 → vision_agent-0.2.190}/pyproject.toml +1 -1
  3. {vision_agent-0.2.188 → vision_agent-0.2.190}/vision_agent/tools/__init__.py +1 -0
  4. {vision_agent-0.2.188 → vision_agent-0.2.190}/vision_agent/tools/tools.py +43 -0
  5. {vision_agent-0.2.188 → vision_agent-0.2.190}/LICENSE +0 -0
  6. {vision_agent-0.2.188 → vision_agent-0.2.190}/README.md +0 -0
  7. {vision_agent-0.2.188 → vision_agent-0.2.190}/vision_agent/__init__.py +0 -0
  8. {vision_agent-0.2.188 → vision_agent-0.2.190}/vision_agent/agent/__init__.py +0 -0
  9. {vision_agent-0.2.188 → vision_agent-0.2.190}/vision_agent/agent/agent.py +0 -0
  10. {vision_agent-0.2.188 → vision_agent-0.2.190}/vision_agent/agent/agent_utils.py +0 -0
  11. {vision_agent-0.2.188 → vision_agent-0.2.190}/vision_agent/agent/vision_agent.py +0 -0
  12. {vision_agent-0.2.188 → vision_agent-0.2.190}/vision_agent/agent/vision_agent_coder.py +0 -0
  13. {vision_agent-0.2.188 → vision_agent-0.2.190}/vision_agent/agent/vision_agent_coder_prompts.py +0 -0
  14. {vision_agent-0.2.188 → vision_agent-0.2.190}/vision_agent/agent/vision_agent_planner.py +0 -0
  15. {vision_agent-0.2.188 → vision_agent-0.2.190}/vision_agent/agent/vision_agent_planner_prompts.py +0 -0
  16. {vision_agent-0.2.188 → vision_agent-0.2.190}/vision_agent/agent/vision_agent_prompts.py +0 -0
  17. {vision_agent-0.2.188 → vision_agent-0.2.190}/vision_agent/clients/__init__.py +0 -0
  18. {vision_agent-0.2.188 → vision_agent-0.2.190}/vision_agent/clients/http.py +0 -0
  19. {vision_agent-0.2.188 → vision_agent-0.2.190}/vision_agent/clients/landing_public_api.py +0 -0
  20. {vision_agent-0.2.188 → vision_agent-0.2.190}/vision_agent/fonts/__init__.py +0 -0
  21. {vision_agent-0.2.188 → vision_agent-0.2.190}/vision_agent/fonts/default_font_ch_en.ttf +0 -0
  22. {vision_agent-0.2.188 → vision_agent-0.2.190}/vision_agent/lmm/__init__.py +0 -0
  23. {vision_agent-0.2.188 → vision_agent-0.2.190}/vision_agent/lmm/lmm.py +0 -0
  24. {vision_agent-0.2.188 → vision_agent-0.2.190}/vision_agent/lmm/types.py +0 -0
  25. {vision_agent-0.2.188 → vision_agent-0.2.190}/vision_agent/tools/meta_tools.py +0 -0
  26. {vision_agent-0.2.188 → vision_agent-0.2.190}/vision_agent/tools/prompts.py +0 -0
  27. {vision_agent-0.2.188 → vision_agent-0.2.190}/vision_agent/tools/tool_utils.py +0 -0
  28. {vision_agent-0.2.188 → vision_agent-0.2.190}/vision_agent/tools/tools_types.py +0 -0
  29. {vision_agent-0.2.188 → vision_agent-0.2.190}/vision_agent/utils/__init__.py +0 -0
  30. {vision_agent-0.2.188 → vision_agent-0.2.190}/vision_agent/utils/exceptions.py +0 -0
  31. {vision_agent-0.2.188 → vision_agent-0.2.190}/vision_agent/utils/execute.py +0 -0
  32. {vision_agent-0.2.188 → vision_agent-0.2.190}/vision_agent/utils/image_utils.py +0 -0
  33. {vision_agent-0.2.188 → vision_agent-0.2.190}/vision_agent/utils/sim.py +0 -0
  34. {vision_agent-0.2.188 → vision_agent-0.2.190}/vision_agent/utils/type_defs.py +0 -0
  35. {vision_agent-0.2.188 → vision_agent-0.2.190}/vision_agent/utils/video.py +0 -0
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.1
2
2
  Name: vision-agent
3
- Version: 0.2.188
3
+ Version: 0.2.190
4
4
  Summary: Toolset for Vision Agent
5
5
  Author: Landing AI
6
6
  Author-email: dev@landing.ai
@@ -4,7 +4,7 @@ build-backend = "poetry.core.masonry.api"
4
4
 
5
5
  [tool.poetry]
6
6
  name = "vision-agent"
7
- version = "0.2.188"
7
+ version = "0.2.190"
8
8
  description = "Toolset for Vision Agent"
9
9
  authors = ["Landing AI <dev@landing.ai>"]
10
10
  readme = "README.md"
@@ -69,6 +69,7 @@ from .tools import (
69
69
  qwen2_vl_video_vqa,
70
70
  video_temporal_localization,
71
71
  flux_image_inpainting,
72
+ siglip_classification,
72
73
  )
73
74
 
74
75
  __new_tools__ = [
@@ -1845,6 +1845,48 @@ def flux_image_inpainting(
1845
1845
  return output_image
1846
1846
 
1847
1847
 
1848
+ def siglip_classification(image: np.ndarray, labels: List[str]) -> Dict[str, Any]:
1849
+ """'siglip_classification' is a tool that can classify an image or a cropped detection given a list
1850
+ of input labels or tags. It returns the same list of the input labels along with
1851
+ their probability scores based on image content.
1852
+
1853
+ Parameters:
1854
+ image (np.ndarray): The image to classify or tag
1855
+ labels (List[str]): The list of candidate labels or tags to score against the image
1856
+
1857
+ Returns:
1858
+ Dict[str, Any]: A dictionary containing the labels and scores. The "labels"
1859
+ key holds the list of given labels and the "scores" key holds the list of scores.
1860
+
1861
+ Example
1862
+ -------
1863
+ >>> siglip_classification(image, ['dog', 'cat', 'bird'])
1864
+ {"labels": ["dog", "cat", "bird"], "scores": [0.68, 0.30, 0.02]}
1865
+ """
1866
+
1867
+ if image.shape[0] < 1 or image.shape[1] < 1:
1868
+ return {"labels": [], "scores": []}
1869
+
1870
+ image_file = numpy_to_bytes(image)
1871
+
1872
+ files = [("image", image_file)]
1873
+
1874
+ payload = {
1875
+ "model": "siglip",
1876
+ "labels": labels,
1877
+ }
1878
+
1879
+ response: dict[str, Any] = send_inference_request(
1880
+ payload=payload,
1881
+ endpoint_name="classification",
1882
+ files=files,
1883
+ v2=True,
1884
+ metadata_payload={"function_name": "siglip_classification"},
1885
+ )
1886
+
1887
+ return response
1888
+
1889
+
1848
1890
  # Utility and visualization functions
1849
1891
 
1850
1892
 
@@ -2362,6 +2404,7 @@ FUNCTION_TOOLS = [
2362
2404
  qwen2_vl_images_vqa,
2363
2405
  qwen2_vl_video_vqa,
2364
2406
  video_temporal_localization,
2407
+ flux_image_inpainting,
2365
2408
  ]
2366
2409
 
2367
2410
  UTIL_TOOLS = [
File without changes
File without changes