vision-agent 0.2.34__tar.gz → 0.2.36__tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (36):
  1. {vision_agent-0.2.34 → vision_agent-0.2.36}/PKG-INFO +1 -1
  2. {vision_agent-0.2.34 → vision_agent-0.2.36}/pyproject.toml +1 -1
  3. {vision_agent-0.2.34 → vision_agent-0.2.36}/vision_agent/agent/vision_agent.py +5 -1
  4. {vision_agent-0.2.34 → vision_agent-0.2.36}/vision_agent/tools/tools.py +11 -9
  5. {vision_agent-0.2.34 → vision_agent-0.2.36}/LICENSE +0 -0
  6. {vision_agent-0.2.34 → vision_agent-0.2.36}/README.md +0 -0
  7. {vision_agent-0.2.34 → vision_agent-0.2.36}/vision_agent/__init__.py +0 -0
  8. {vision_agent-0.2.34 → vision_agent-0.2.36}/vision_agent/agent/__init__.py +0 -0
  9. {vision_agent-0.2.34 → vision_agent-0.2.36}/vision_agent/agent/agent.py +0 -0
  10. {vision_agent-0.2.34 → vision_agent-0.2.36}/vision_agent/agent/agent_coder.py +0 -0
  11. {vision_agent-0.2.34 → vision_agent-0.2.36}/vision_agent/agent/agent_coder_prompts.py +0 -0
  12. {vision_agent-0.2.34 → vision_agent-0.2.36}/vision_agent/agent/data_interpreter.py +0 -0
  13. {vision_agent-0.2.34 → vision_agent-0.2.36}/vision_agent/agent/data_interpreter_prompts.py +0 -0
  14. {vision_agent-0.2.34 → vision_agent-0.2.36}/vision_agent/agent/easytool.py +0 -0
  15. {vision_agent-0.2.34 → vision_agent-0.2.36}/vision_agent/agent/easytool_prompts.py +0 -0
  16. {vision_agent-0.2.34 → vision_agent-0.2.36}/vision_agent/agent/easytool_v2.py +0 -0
  17. {vision_agent-0.2.34 → vision_agent-0.2.36}/vision_agent/agent/easytool_v2_prompts.py +0 -0
  18. {vision_agent-0.2.34 → vision_agent-0.2.36}/vision_agent/agent/reflexion.py +0 -0
  19. {vision_agent-0.2.34 → vision_agent-0.2.36}/vision_agent/agent/reflexion_prompts.py +0 -0
  20. {vision_agent-0.2.34 → vision_agent-0.2.36}/vision_agent/agent/vision_agent_prompts.py +0 -0
  21. {vision_agent-0.2.34 → vision_agent-0.2.36}/vision_agent/fonts/__init__.py +0 -0
  22. {vision_agent-0.2.34 → vision_agent-0.2.36}/vision_agent/fonts/default_font_ch_en.ttf +0 -0
  23. {vision_agent-0.2.34 → vision_agent-0.2.36}/vision_agent/llm/__init__.py +0 -0
  24. {vision_agent-0.2.34 → vision_agent-0.2.36}/vision_agent/llm/llm.py +0 -0
  25. {vision_agent-0.2.34 → vision_agent-0.2.36}/vision_agent/lmm/__init__.py +0 -0
  26. {vision_agent-0.2.34 → vision_agent-0.2.36}/vision_agent/lmm/lmm.py +0 -0
  27. {vision_agent-0.2.34 → vision_agent-0.2.36}/vision_agent/tools/__init__.py +0 -0
  28. {vision_agent-0.2.34 → vision_agent-0.2.36}/vision_agent/tools/easytool_tools.py +0 -0
  29. {vision_agent-0.2.34 → vision_agent-0.2.36}/vision_agent/tools/prompts.py +0 -0
  30. {vision_agent-0.2.34 → vision_agent-0.2.36}/vision_agent/tools/tool_utils.py +0 -0
  31. {vision_agent-0.2.34 → vision_agent-0.2.36}/vision_agent/utils/__init__.py +0 -0
  32. {vision_agent-0.2.34 → vision_agent-0.2.36}/vision_agent/utils/execute.py +0 -0
  33. {vision_agent-0.2.34 → vision_agent-0.2.36}/vision_agent/utils/image_utils.py +0 -0
  34. {vision_agent-0.2.34 → vision_agent-0.2.36}/vision_agent/utils/sim.py +0 -0
  35. {vision_agent-0.2.34 → vision_agent-0.2.36}/vision_agent/utils/type_defs.py +0 -0
  36. {vision_agent-0.2.34 → vision_agent-0.2.36}/vision_agent/utils/video.py +0 -0
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.1
2
2
  Name: vision-agent
3
- Version: 0.2.34
3
+ Version: 0.2.36
4
4
  Summary: Toolset for Vision Agent
5
5
  Author: Landing AI
6
6
  Author-email: dev@landing.ai
@@ -4,7 +4,7 @@ build-backend = "poetry.core.masonry.api"
4
4
 
5
5
  [tool.poetry]
6
6
  name = "vision-agent"
7
- version = "0.2.34"
7
+ version = "0.2.36"
8
8
  description = "Toolset for Vision Agent"
9
9
  authors = ["Landing AI <dev@landing.ai>"]
10
10
  readme = "README.md"
@@ -264,15 +264,19 @@ def retrieve_tools(
264
264
  )
265
265
  tool_info = []
266
266
  tool_desc = []
267
+ tool_list: List[Dict[str, str]] = []
267
268
  for task in plan:
268
269
  tools = tool_recommender.top_k(task["instructions"], k=2, thresh=0.3)
269
270
  tool_info.extend([e["doc"] for e in tools])
270
271
  tool_desc.extend([e["desc"] for e in tools])
272
+ tool_list.extend(
273
+ {"description": e["desc"], "documentation": e["doc"]} for e in tools
274
+ )
271
275
  log_progress(
272
276
  {
273
277
  "type": "tools",
274
278
  "status": "completed",
275
- "payload": tools,
279
+ "payload": tool_list,
276
280
  }
277
281
  )
278
282
  if verbosity == 2:
@@ -58,9 +58,10 @@ def grounding_dino(
58
58
  box_threshold: float = 0.20,
59
59
  iou_threshold: float = 0.20,
60
60
  ) -> List[Dict[str, Any]]:
61
- """'grounding_dino' is a tool that can detect and count objects given a text prompt
62
- such as category names or referring expressions. It returns a list and count of
63
- bounding boxes, label names and associated probability scores.
61
+ """'grounding_dino' is a tool that can detect and count multiple objects given a text
62
+ prompt such as category names or referring expressions. The categories in text prompt
63
+ are separated by commas or periods. It returns a list and count of bounding boxes,
64
+ label names and associated probability scores.
64
65
 
65
66
  Parameters:
66
67
  prompt (str): The prompt to ground to the image.
@@ -111,9 +112,10 @@ def grounding_sam(
111
112
  box_threshold: float = 0.20,
112
113
  iou_threshold: float = 0.20,
113
114
  ) -> List[Dict[str, Any]]:
114
- """'grounding_sam' is a tool that can detect and segment objects given a text
115
- prompt such as category names or referring expressions. It returns a list of
116
- bounding boxes, label names and masks file names and associated probability scores.
115
+ """'grounding_sam' is a tool that can detect and segment multiple objects given a
116
+ text prompt such as category names or referring expressions. The categories in text
117
+ prompt are separated by commas or periods. It returns a list of bounding boxes,
118
+ label names, mask file names and associated probability scores.
117
119
 
118
120
  Parameters:
119
121
  prompt (str): The prompt to ground to the image.
@@ -343,9 +345,9 @@ def image_question_answering(image: np.ndarray, prompt: str) -> str:
343
345
 
344
346
 
345
347
  def clip(image: np.ndarray, classes: List[str]) -> Dict[str, Any]:
346
- """'clip' is a tool that can classify an image given a list of input classes or tags.
347
- It returns the same list of the input classes along with their probability scores
348
- based on image content.
348
+ """'clip' is a tool that can classify an image or a cropped detection given a list
349
+ of input classes or tags. It returns the same list of the input classes along with
350
+ their probability scores based on image content.
349
351
 
350
352
  Parameters:
351
353
  image (np.ndarray): The image to classify or tag
File without changes
File without changes