vision-agent 0.0.46__py3-none-any.whl → 0.0.48__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- vision_agent/agent/vision_agent_prompts.py +1 -1
- vision_agent/tools/tools.py +20 -0
- {vision_agent-0.0.46.dist-info → vision_agent-0.0.48.dist-info}/METADATA +2 -2
- {vision_agent-0.0.46.dist-info → vision_agent-0.0.48.dist-info}/RECORD +6 -6
- {vision_agent-0.0.46.dist-info → vision_agent-0.0.48.dist-info}/LICENSE +0 -0
- {vision_agent-0.0.46.dist-info → vision_agent-0.0.48.dist-info}/WHEEL +0 -0
@@ -1,4 +1,4 @@
|
|
1
|
-
VISION_AGENT_REFLECTION = """You are an advanced reasoning agent that can improve based on self refection. You will be given a previous reasoning trial in which you were given the user's question, the available tools that the agent has, the decomposed tasks and tools that the agent used to answer the question and the final answer the agent provided. You must determine if the agent's answer was correct or incorrect. If the agent's answer was correct, respond with Finish. If the agent's answer was incorrect, you must diagnose a possible reason for failure or phrasing discrepancy and devise a new, concise, high level plan that aims to mitigate the same failure with the tools
|
1
|
+
VISION_AGENT_REFLECTION = """You are an advanced reasoning agent that can improve based on self refection. You will be given a previous reasoning trial in which you were given the user's question, the available tools that the agent has, the decomposed tasks and tools that the agent used to answer the question and the final answer the agent provided. You must determine if the agent's answer was correct or incorrect. If the agent's answer was correct, respond with Finish. If the agent's answer was incorrect, you must diagnose a possible reason for failure or phrasing discrepancy and devise a new, concise, high level plan that aims to mitigate the same failure with the tools available. Use complete sentences.
|
2
2
|
|
3
3
|
User's question: {question}
|
4
4
|
|
vision_agent/tools/tools.py
CHANGED
@@ -51,6 +51,25 @@ class Tool(ABC):
|
|
51
51
|
usage: Dict
|
52
52
|
|
53
53
|
|
54
|
+
class NoOp(Tool):
|
55
|
+
name = "noop_"
|
56
|
+
description = (
|
57
|
+
"'noop_' is a no-op tool that does nothing if you do not need to use a tool."
|
58
|
+
)
|
59
|
+
usage = {
|
60
|
+
"required_parameters": [],
|
61
|
+
"examples": [
|
62
|
+
{
|
63
|
+
"scenario": "If you do not want to use a tool.",
|
64
|
+
"parameters": {},
|
65
|
+
}
|
66
|
+
],
|
67
|
+
}
|
68
|
+
|
69
|
+
def __call__(self) -> None:
|
70
|
+
return None
|
71
|
+
|
72
|
+
|
54
73
|
class CLIP(Tool):
|
55
74
|
r"""CLIP is a tool that can classify or tag any image given a set if input classes
|
56
75
|
or tags.
|
@@ -612,6 +631,7 @@ TOOLS = {
|
|
612
631
|
i: {"name": c.name, "description": c.description, "usage": c.usage, "class": c}
|
613
632
|
for i, c in enumerate(
|
614
633
|
[
|
634
|
+
NoOp,
|
615
635
|
CLIP,
|
616
636
|
GroundingDINO,
|
617
637
|
AgentGroundingSAM,
|
@@ -1,6 +1,6 @@
|
|
1
1
|
Metadata-Version: 2.1
|
2
2
|
Name: vision-agent
|
3
|
-
Version: 0.0.46
|
3
|
+
Version: 0.0.48
|
4
4
|
Summary: Toolset for Vision Agent
|
5
5
|
Author: Landing AI
|
6
6
|
Author-email: dev@landing.ai
|
@@ -69,7 +69,7 @@ export OPENAI_API_KEY="your-api-key"
|
|
69
69
|
You can interact with the agents as you would with any LLM or LMM model:
|
70
70
|
|
71
71
|
```python
|
72
|
-
>>>
|
72
|
+
>>> from vision_agent.agent import VisionAgent
|
73
73
|
>>> agent = VisionAgent()
|
74
74
|
>>> agent("What percentage of the area of this jar is filled with coffee beans?", image="jar.jpg")
|
75
75
|
"The percentage of area of the jar filled with coffee beans is 25%."
|
@@ -6,7 +6,7 @@ vision_agent/agent/easytool_prompts.py,sha256=uNp12LOFRLr3i2zLhNuLuyFms2-s8es2t6
|
|
6
6
|
vision_agent/agent/reflexion.py,sha256=wzpptfALNZIh9Q5jgkK3imGL5LWjTW_n_Ypsvxdh07Q,10101
|
7
7
|
vision_agent/agent/reflexion_prompts.py,sha256=UPGkt_qgHBMUY0VPVoF-BqhR0d_6WPjjrhbYLBYOtnQ,9342
|
8
8
|
vision_agent/agent/vision_agent.py,sha256=P2melU6XQCCiiL1C_4QsxGUaWbwahuJA90eIcQJTR4U,17449
|
9
|
-
vision_agent/agent/vision_agent_prompts.py,sha256=
|
9
|
+
vision_agent/agent/vision_agent_prompts.py,sha256=fSYO-6D-7rExS8tyZyZewrzAWsn2ZiqjBfoODL9m5Yk,6152
|
10
10
|
vision_agent/data/__init__.py,sha256=YU-5g3LbEQ6a4drz0RLGTagXMVU2Z4Xr3RlfWE-R0jU,46
|
11
11
|
vision_agent/data/data.py,sha256=pgtSGZdAnbQ8oGsuapLtFTMPajnCGDGekEXTnFuBwsY,5122
|
12
12
|
vision_agent/emb/__init__.py,sha256=YmCkGrJBtXb6X6Z3lnKiFoQYKXMgHMJp8JJyMLVvqcI,75
|
@@ -18,9 +18,9 @@ vision_agent/lmm/__init__.py,sha256=I8mbeNUajTfWVNqLsuFQVOaNBDlkIhYp9DFU8H4kB7g,
|
|
18
18
|
vision_agent/lmm/lmm.py,sha256=s_A3SKCoWm2biOt-gS9PXOsa9l-zrmR6mInLjAqam-A,8438
|
19
19
|
vision_agent/tools/__init__.py,sha256=AKN-T659HpwVearRnkCd6wWNoJ6K5kW9gAZwb8IQSLE,235
|
20
20
|
vision_agent/tools/prompts.py,sha256=9RBbyqlNlExsGKlJ89Jkph83DAEJ8PCVGaHoNbyN7TM,1416
|
21
|
-
vision_agent/tools/tools.py,sha256=
|
21
|
+
vision_agent/tools/tools.py,sha256=VD80cINHyesmGAfiCMrK506Q-G9QU_Srzey5wJ3aJGQ,23884
|
22
22
|
vision_agent/tools/video.py,sha256=40rscP8YvKN3lhZ4PDcOK4XbdFX2duCRpHY_krmBYKU,7476
|
23
|
-
vision_agent-0.0.46.dist-info/LICENSE,sha256=xx0jnfkXJvxRnG63LTGOxlggYnIysveWIZ6H3PNdCrQ,11357
|
24
|
-
vision_agent-0.0.
|
25
|
-
vision_agent-0.0.46.dist-info/WHEEL,sha256=7Z8_27uaHI_UZAc4Uox4PpBhQ9Y5_modZXWMxtUi4NU,88
|
26
|
-
vision_agent-0.0.46.dist-info/RECORD,,
|
23
|
+
vision_agent-0.0.48.dist-info/LICENSE,sha256=xx0jnfkXJvxRnG63LTGOxlggYnIysveWIZ6H3PNdCrQ,11357
|
24
|
+
vision_agent-0.0.48.dist-info/METADATA,sha256=y5wDj2u8p8zlIhxBh87SRWXAlc1hcMWd_aaLyuOKTbI,5581
|
25
|
+
vision_agent-0.0.48.dist-info/WHEEL,sha256=7Z8_27uaHI_UZAc4Uox4PpBhQ9Y5_modZXWMxtUi4NU,88
|
26
|
+
vision_agent-0.0.48.dist-info/RECORD,,
|
File without changes
|
File without changes
|