vision-agent 1.0.3__py3-none-any.whl → 1.0.5__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- vision_agent/.sim_tools/df.csv +46 -47
- vision_agent/.sim_tools/embs.npy +0 -0
- vision_agent/agent/vision_agent_planner_prompts_v2.py +57 -58
- vision_agent/agent/vision_agent_planner_v2.py +3 -2
- vision_agent/configs/anthropic_config.py +29 -16
- vision_agent/configs/config.py +14 -15
- vision_agent/configs/openai_config.py +10 -10
- vision_agent/lmm/lmm.py +2 -2
- vision_agent/sim/sim.py +4 -1
- vision_agent/tools/planner_tools.py +13 -14
- vision_agent/tools/tools.py +16 -27
- vision_agent/utils/tools.py +8 -2
- {vision_agent-1.0.3.dist-info → vision_agent-1.0.5.dist-info}/METADATA +31 -3
- {vision_agent-1.0.3.dist-info → vision_agent-1.0.5.dist-info}/RECORD +16 -17
- vision_agent/configs/anthropic_openai_config.py +0 -164
- {vision_agent-1.0.3.dist-info → vision_agent-1.0.5.dist-info}/LICENSE +0 -0
- {vision_agent-1.0.3.dist-info → vision_agent-1.0.5.dist-info}/WHEEL +0 -0
@@ -1,5 +1,5 @@
|
|
1
|
-
vision_agent/.sim_tools/df.csv,sha256=
|
2
|
-
vision_agent/.sim_tools/embs.npy,sha256=
|
1
|
+
vision_agent/.sim_tools/df.csv,sha256=jCyBDlLxI9_yAxzLZcoN2BPpveF1yh29AlfdSAGTZ4A,40842
|
2
|
+
vision_agent/.sim_tools/embs.npy,sha256=QN8Ojc0Mv4_OS6WA4elvBhXTDHcpx2g1pLxsGqk4IQU,245888
|
3
3
|
vision_agent/__init__.py,sha256=EAb4-f9iyuEYkBrX4ag1syM8Syx8118_t0R6_C34M9w,57
|
4
4
|
vision_agent/agent/README.md,sha256=3XSPG_VO7-6y6P8COvcgSSonWj5uvfgvfmOkBpfKK8Q,5527
|
5
5
|
vision_agent/agent/__init__.py,sha256=M8CffavdIh8Zh-skznLHIaQkYGCGK7vk4dq1FaVkbs4,617
|
@@ -11,43 +11,42 @@ vision_agent/agent/vision_agent_coder_prompts_v2.py,sha256=53b_DhQtffX5wxLuCbNQ8
|
|
11
11
|
vision_agent/agent/vision_agent_coder_v2.py,sha256=ELc_J8Q4NKPs7YETu3a9O0Vk1zN3k6QfHBgu0M0IWGk,17450
|
12
12
|
vision_agent/agent/vision_agent_planner.py,sha256=8LeUsxUlGuQMqCdJ6jHXOe6RpKpzLtMW1AaJlfuIfzw,18680
|
13
13
|
vision_agent/agent/vision_agent_planner_prompts.py,sha256=rYRdJthc-sQN57VgCBKrF09Sd73BSxcBdjNe6C4WNZ8,6837
|
14
|
-
vision_agent/agent/vision_agent_planner_prompts_v2.py,sha256=
|
15
|
-
vision_agent/agent/vision_agent_planner_v2.py,sha256=
|
14
|
+
vision_agent/agent/vision_agent_planner_prompts_v2.py,sha256=YARVphHKLMNUqCeOsrManvgecl77RP1g51vtt7JpdWk,35937
|
15
|
+
vision_agent/agent/vision_agent_planner_v2.py,sha256=Aww_BJhTFKZ5XjYe8FW57z2Gwp2se0vg1t1DKLGRAyQ,22050
|
16
16
|
vision_agent/agent/vision_agent_prompts.py,sha256=KaJwYPUP7_GvQsCPPs6Fdawmi3AQWmWajBUuzj7gTG4,13812
|
17
17
|
vision_agent/agent/vision_agent_prompts_v2.py,sha256=OnHmmteAj8__2spEXNcckApQvEpkK_JIZd_SWzEyg9c,4230
|
18
18
|
vision_agent/agent/vision_agent_v2.py,sha256=iPW6DowH7wCFIA5vb1SdSLfZFWbn_oSC7Xa8uO8KIJI,11675
|
19
19
|
vision_agent/clients/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
20
20
|
vision_agent/clients/http.py,sha256=k883i6M_4nl7zwwHSI-yP5sAgQZIDPM1nrKD6YFJ3Xs,2009
|
21
21
|
vision_agent/configs/__init__.py,sha256=Iu75-w9_nlPmnB_qKA7nYaaaHf7xtTrDmK8N4v2WV34,27
|
22
|
-
vision_agent/configs/anthropic_config.py,sha256=
|
23
|
-
vision_agent/configs/
|
24
|
-
vision_agent/configs/
|
25
|
-
vision_agent/configs/openai_config.py,sha256=v2_AIY89d7LKWn4uqA2G047U2IdmnqZrGH2Iww9gRIw,4498
|
22
|
+
vision_agent/configs/anthropic_config.py,sha256=FBW3PsrZn4gJXhr-v1GGayuJuBPafzDz2Q4vyI_rBzA,4692
|
23
|
+
vision_agent/configs/config.py,sha256=FjpYViBJHMizgoZ3dp7T4Lbhbh1MHHstaG7icVdVsrU,4694
|
24
|
+
vision_agent/configs/openai_config.py,sha256=Bw7ElBYmBcaZttyRBoNpcy3uTkqg5qADk8LP0wse2NQ,4498
|
26
25
|
vision_agent/fonts/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
27
26
|
vision_agent/fonts/default_font_ch_en.ttf,sha256=1YM0Z3XqLDjSNbF7ihQFSAIUdjF9m1rtHiNC_6QosTE,1594400
|
28
27
|
vision_agent/lmm/__init__.py,sha256=4qX2lmGnKWHeKftXueEi9xj_ieK2nQh_ipHf72nKGFk,84
|
29
|
-
vision_agent/lmm/lmm.py,sha256=
|
28
|
+
vision_agent/lmm/lmm.py,sha256=utGJMeGEKImqHrY0q9kGu0uK3owG8wKyDustwrDrLto,19421
|
30
29
|
vision_agent/models/__init__.py,sha256=eIP0pD5dYog8zUA7uuTmUxCF6SIutbLRLRE0cmuCJgQ,326
|
31
30
|
vision_agent/models/agent_types.py,sha256=vBZ9-ns5lHDdFMO7ulCGGeZ6OwRo3gK4O3vN0814IWc,3064
|
32
31
|
vision_agent/models/lmm_types.py,sha256=v04h-NjbczHOIN8UWa1vvO5-1BDuZ4JQhD2mge1cXmw,305
|
33
32
|
vision_agent/models/tools_types.py,sha256=8hYf2OZhI58gvf65KGaeGkt4EQ56nwLFqIQDPHioOBc,2339
|
34
33
|
vision_agent/sim/__init__.py,sha256=Aouz6HEPPTYcLxR5_0fTYCL1OvPKAH1RMWAF90QXAlA,135
|
35
|
-
vision_agent/sim/sim.py,sha256=
|
34
|
+
vision_agent/sim/sim.py,sha256=8y060Ck7qOFJDw9k9Vl2xQYbLkNaTd6lP1YzbcwkkXc,9944
|
36
35
|
vision_agent/tools/__init__.py,sha256=H7FWx0OXGVIjrSOTpNH-YwE4LBuOfThZTG-SHFpo_Z8,2576
|
37
36
|
vision_agent/tools/meta_tools.py,sha256=DNRXHX9nZ1GBeqeLiq87sBshoe0aiZeYasETbG-9neI,24053
|
38
|
-
vision_agent/tools/planner_tools.py,sha256=
|
37
|
+
vision_agent/tools/planner_tools.py,sha256=iQWtTgXdomn0IWrbmvXXM-y8Q_RSEOxyP04HIRLrgWI,19576
|
39
38
|
vision_agent/tools/prompts.py,sha256=V1z4YJLXZuUl_iZ5rY0M5hHc_2tmMEUKr0WocXKGt4E,1430
|
40
|
-
vision_agent/tools/tools.py,sha256
|
39
|
+
vision_agent/tools/tools.py,sha256=4gwL8EFMwm6l0MujftJ8G8BO2z8Dh_a4FPjy_xUmYqs,121889
|
41
40
|
vision_agent/utils/__init__.py,sha256=mANUs_84VL-3gpZbXryvV2mWU623eWnRlJCSUHtMjuw,122
|
42
41
|
vision_agent/utils/agent.py,sha256=2ifTP5QElItnr4YHOJR6L5P1PUzV0GhChTTqVxuVyQg,15153
|
43
42
|
vision_agent/utils/exceptions.py,sha256=zis8smCbdEylBVZBTVfEUfAh7Rb7cWV3MSPambu6FsQ,1837
|
44
43
|
vision_agent/utils/execute.py,sha256=QAql6KC2uEhX1o_44mMA77lCmMUs0itaaGMFSfJBki8,21520
|
45
44
|
vision_agent/utils/image_utils.py,sha256=bJM2mEvB6E__M9pxi74yQYzAiZ7mu3KE2ptyVrp5vzQ,12533
|
46
|
-
vision_agent/utils/tools.py,sha256=
|
45
|
+
vision_agent/utils/tools.py,sha256=_XGcF-Zd527BWNkGopBZeJ4j5ehreAkNsKQSBFrlvjw,8138
|
47
46
|
vision_agent/utils/tools_doc.py,sha256=yFue6KSXoa_Z1ngCdBEc4SdPZOWF1rVLeaHu02I8Wis,2523
|
48
47
|
vision_agent/utils/video.py,sha256=rjsQ1sKKisaQ6AVjJz0zd_G4g-ovRweS_rs4JEhenoI,5340
|
49
48
|
vision_agent/utils/video_tracking.py,sha256=DZLFpNCuzuPJQzbQoVNcp-m4dKxgiKdCNM5QTh_zURE,12245
|
50
|
-
vision_agent-1.0.
|
51
|
-
vision_agent-1.0.
|
52
|
-
vision_agent-1.0.
|
53
|
-
vision_agent-1.0.
|
49
|
+
vision_agent-1.0.5.dist-info/LICENSE,sha256=xx0jnfkXJvxRnG63LTGOxlggYnIysveWIZ6H3PNdCrQ,11357
|
50
|
+
vision_agent-1.0.5.dist-info/METADATA,sha256=BFxGREHCEQJ6Qb-arJp2K0TTI6e_ygrkd_h8ZnJ9ou0,6746
|
51
|
+
vision_agent-1.0.5.dist-info/WHEEL,sha256=7Z8_27uaHI_UZAc4Uox4PpBhQ9Y5_modZXWMxtUi4NU,88
|
52
|
+
vision_agent-1.0.5.dist-info/RECORD,,
|
@@ -1,164 +0,0 @@
|
|
1
|
-
from typing import Type
|
2
|
-
|
3
|
-
from pydantic import BaseModel, Field
|
4
|
-
|
5
|
-
from vision_agent.lmm import LMM, AnthropicLMM, OpenAILMM
|
6
|
-
|
7
|
-
|
8
|
-
class Config(BaseModel):
|
9
|
-
# for vision_agent_v2
|
10
|
-
agent: Type[LMM] = Field(default=AnthropicLMM)
|
11
|
-
agent_kwargs: dict = Field(
|
12
|
-
default_factory=lambda: {
|
13
|
-
"model_name": "claude-3-5-sonnet-20241022",
|
14
|
-
"temperature": 0.0,
|
15
|
-
"image_size": 768,
|
16
|
-
}
|
17
|
-
)
|
18
|
-
|
19
|
-
# for vision_agent_planner_v2
|
20
|
-
planner: Type[LMM] = Field(default=AnthropicLMM)
|
21
|
-
planner_kwargs: dict = Field(
|
22
|
-
default_factory=lambda: {
|
23
|
-
"model_name": "claude-3-5-sonnet-20241022",
|
24
|
-
"temperature": 0.0,
|
25
|
-
"image_size": 768,
|
26
|
-
}
|
27
|
-
)
|
28
|
-
|
29
|
-
# for vision_agent_planner_v2
|
30
|
-
summarizer: Type[LMM] = Field(default=OpenAILMM)
|
31
|
-
summarizer_kwargs: dict = Field(
|
32
|
-
default_factory=lambda: {
|
33
|
-
"model_name": "o1",
|
34
|
-
"temperature": 1.0, # o1 has fixed temperature
|
35
|
-
"image_size": 768,
|
36
|
-
}
|
37
|
-
)
|
38
|
-
|
39
|
-
# for vision_agent_planner_v2
|
40
|
-
critic: Type[LMM] = Field(default=AnthropicLMM)
|
41
|
-
critic_kwargs: dict = Field(
|
42
|
-
default_factory=lambda: {
|
43
|
-
"model_name": "claude-3-5-sonnet-20241022",
|
44
|
-
"temperature": 0.0,
|
45
|
-
"image_size": 768,
|
46
|
-
}
|
47
|
-
)
|
48
|
-
|
49
|
-
# for vision_agent_coder_v2
|
50
|
-
coder: Type[LMM] = Field(default=AnthropicLMM)
|
51
|
-
coder_kwargs: dict = Field(
|
52
|
-
default_factory=lambda: {
|
53
|
-
"model_name": "claude-3-5-sonnet-20241022",
|
54
|
-
"temperature": 0.0,
|
55
|
-
"image_size": 768,
|
56
|
-
}
|
57
|
-
)
|
58
|
-
|
59
|
-
# for vision_agent_coder_v2
|
60
|
-
tester: Type[LMM] = Field(default=AnthropicLMM)
|
61
|
-
tester_kwargs: dict = Field(
|
62
|
-
default_factory=lambda: {
|
63
|
-
"model_name": "claude-3-5-sonnet-20241022",
|
64
|
-
"temperature": 0.0,
|
65
|
-
"image_size": 768,
|
66
|
-
}
|
67
|
-
)
|
68
|
-
|
69
|
-
# for vision_agent_coder_v2
|
70
|
-
debugger: Type[LMM] = Field(default=AnthropicLMM)
|
71
|
-
debugger_kwargs: dict = Field(
|
72
|
-
default_factory=lambda: {
|
73
|
-
"model_name": "claude-3-5-sonnet-20241022",
|
74
|
-
"temperature": 0.0,
|
75
|
-
"image_size": 768,
|
76
|
-
}
|
77
|
-
)
|
78
|
-
|
79
|
-
# for get_tool_for_task
|
80
|
-
tool_tester: Type[LMM] = Field(default=AnthropicLMM)
|
81
|
-
tool_tester_kwargs: dict = Field(
|
82
|
-
default_factory=lambda: {
|
83
|
-
"model_name": "claude-3-5-sonnet-20241022",
|
84
|
-
"temperature": 0.0,
|
85
|
-
"image_size": 768,
|
86
|
-
}
|
87
|
-
)
|
88
|
-
|
89
|
-
# for get_tool_for_task
|
90
|
-
tool_chooser: Type[LMM] = Field(default=AnthropicLMM)
|
91
|
-
tool_chooser_kwargs: dict = Field(
|
92
|
-
default_factory=lambda: {
|
93
|
-
"model_name": "claude-3-5-sonnet-20241022",
|
94
|
-
"temperature": 1.0,
|
95
|
-
"image_size": 768,
|
96
|
-
}
|
97
|
-
)
|
98
|
-
|
99
|
-
# for get_tool_for_task
|
100
|
-
od_judge: Type[LMM] = Field(default=AnthropicLMM)
|
101
|
-
od_judge_kwargs: dict = Field(
|
102
|
-
default_factory=lambda: {
|
103
|
-
"model_name": "claude-3-5-sonnet-20241022",
|
104
|
-
"temperature": 0.0,
|
105
|
-
"image_size": 512,
|
106
|
-
}
|
107
|
-
)
|
108
|
-
|
109
|
-
# for suggestions module
|
110
|
-
suggester: Type[LMM] = Field(default=OpenAILMM)
|
111
|
-
suggester_kwargs: dict = Field(
|
112
|
-
default_factory=lambda: {
|
113
|
-
"model_name": "o1",
|
114
|
-
"temperature": 1.0,
|
115
|
-
"image_detail": "high",
|
116
|
-
"image_size": 1024,
|
117
|
-
}
|
118
|
-
)
|
119
|
-
|
120
|
-
# for vqa module
|
121
|
-
vqa: Type[LMM] = Field(default=AnthropicLMM)
|
122
|
-
vqa_kwargs: dict = Field(
|
123
|
-
default_factory=lambda: {
|
124
|
-
"model_name": "claude-3-5-sonnet-20241022",
|
125
|
-
"temperature": 0.0,
|
126
|
-
"image_size": 768,
|
127
|
-
}
|
128
|
-
)
|
129
|
-
|
130
|
-
def create_agent(self) -> LMM:
|
131
|
-
return self.agent(**self.agent_kwargs)
|
132
|
-
|
133
|
-
def create_planner(self) -> LMM:
|
134
|
-
return self.planner(**self.planner_kwargs)
|
135
|
-
|
136
|
-
def create_summarizer(self) -> LMM:
|
137
|
-
return self.summarizer(**self.summarizer_kwargs)
|
138
|
-
|
139
|
-
def create_critic(self) -> LMM:
|
140
|
-
return self.critic(**self.critic_kwargs)
|
141
|
-
|
142
|
-
def create_coder(self) -> LMM:
|
143
|
-
return self.coder(**self.coder_kwargs)
|
144
|
-
|
145
|
-
def create_tester(self) -> LMM:
|
146
|
-
return self.tester(**self.tester_kwargs)
|
147
|
-
|
148
|
-
def create_debugger(self) -> LMM:
|
149
|
-
return self.debugger(**self.debugger_kwargs)
|
150
|
-
|
151
|
-
def create_tool_tester(self) -> LMM:
|
152
|
-
return self.tool_tester(**self.tool_tester_kwargs)
|
153
|
-
|
154
|
-
def create_tool_chooser(self) -> LMM:
|
155
|
-
return self.tool_chooser(**self.tool_chooser_kwargs)
|
156
|
-
|
157
|
-
def create_od_judge(self) -> LMM:
|
158
|
-
return self.od_judge(**self.od_judge_kwargs)
|
159
|
-
|
160
|
-
def create_suggester(self) -> LMM:
|
161
|
-
return self.suggester(**self.suggester_kwargs)
|
162
|
-
|
163
|
-
def create_vqa(self) -> LMM:
|
164
|
-
return self.vqa(**self.vqa_kwargs)
|
File without changes
|
File without changes
|