vision-agent 1.0.3__py3-none-any.whl → 1.0.5__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
@@ -1,5 +1,5 @@
1
- vision_agent/.sim_tools/df.csv,sha256=mIr1iubLDqGsL3K3ab6bmh6PtLvmOpvnaIX28lxdV6c,40706
2
- vision_agent/.sim_tools/embs.npy,sha256=pZZMFMg0rkIAOpMOjN7gjD58hPK07c2ylfQ9YST8xFA,245888
1
+ vision_agent/.sim_tools/df.csv,sha256=jCyBDlLxI9_yAxzLZcoN2BPpveF1yh29AlfdSAGTZ4A,40842
2
+ vision_agent/.sim_tools/embs.npy,sha256=QN8Ojc0Mv4_OS6WA4elvBhXTDHcpx2g1pLxsGqk4IQU,245888
3
3
  vision_agent/__init__.py,sha256=EAb4-f9iyuEYkBrX4ag1syM8Syx8118_t0R6_C34M9w,57
4
4
  vision_agent/agent/README.md,sha256=3XSPG_VO7-6y6P8COvcgSSonWj5uvfgvfmOkBpfKK8Q,5527
5
5
  vision_agent/agent/__init__.py,sha256=M8CffavdIh8Zh-skznLHIaQkYGCGK7vk4dq1FaVkbs4,617
@@ -11,43 +11,42 @@ vision_agent/agent/vision_agent_coder_prompts_v2.py,sha256=53b_DhQtffX5wxLuCbNQ8
11
11
  vision_agent/agent/vision_agent_coder_v2.py,sha256=ELc_J8Q4NKPs7YETu3a9O0Vk1zN3k6QfHBgu0M0IWGk,17450
12
12
  vision_agent/agent/vision_agent_planner.py,sha256=8LeUsxUlGuQMqCdJ6jHXOe6RpKpzLtMW1AaJlfuIfzw,18680
13
13
  vision_agent/agent/vision_agent_planner_prompts.py,sha256=rYRdJthc-sQN57VgCBKrF09Sd73BSxcBdjNe6C4WNZ8,6837
14
- vision_agent/agent/vision_agent_planner_prompts_v2.py,sha256=TiiF5BGnFVraFlQnDaeRU67927LvszvpcMUOgVgo0ps,35843
15
- vision_agent/agent/vision_agent_planner_v2.py,sha256=FuvTDe1mfznh4lkDGUyXa6yip8zQV5TDSxUG5zrsWc0,22010
14
+ vision_agent/agent/vision_agent_planner_prompts_v2.py,sha256=YARVphHKLMNUqCeOsrManvgecl77RP1g51vtt7JpdWk,35937
15
+ vision_agent/agent/vision_agent_planner_v2.py,sha256=Aww_BJhTFKZ5XjYe8FW57z2Gwp2se0vg1t1DKLGRAyQ,22050
16
16
  vision_agent/agent/vision_agent_prompts.py,sha256=KaJwYPUP7_GvQsCPPs6Fdawmi3AQWmWajBUuzj7gTG4,13812
17
17
  vision_agent/agent/vision_agent_prompts_v2.py,sha256=OnHmmteAj8__2spEXNcckApQvEpkK_JIZd_SWzEyg9c,4230
18
18
  vision_agent/agent/vision_agent_v2.py,sha256=iPW6DowH7wCFIA5vb1SdSLfZFWbn_oSC7Xa8uO8KIJI,11675
19
19
  vision_agent/clients/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
20
20
  vision_agent/clients/http.py,sha256=k883i6M_4nl7zwwHSI-yP5sAgQZIDPM1nrKD6YFJ3Xs,2009
21
21
  vision_agent/configs/__init__.py,sha256=Iu75-w9_nlPmnB_qKA7nYaaaHf7xtTrDmK8N4v2WV34,27
22
- vision_agent/configs/anthropic_config.py,sha256=T1UuESgiY8913A6wA42P7-cg8FTk9-LkJpyywo7OnIQ,4298
23
- vision_agent/configs/anthropic_openai_config.py,sha256=rUz5zca4Pn5dTUwJXiJzRDYua5PWizApCKI3y0zOvhc,4699
24
- vision_agent/configs/config.py,sha256=rUz5zca4Pn5dTUwJXiJzRDYua5PWizApCKI3y0zOvhc,4699
25
- vision_agent/configs/openai_config.py,sha256=v2_AIY89d7LKWn4uqA2G047U2IdmnqZrGH2Iww9gRIw,4498
22
+ vision_agent/configs/anthropic_config.py,sha256=FBW3PsrZn4gJXhr-v1GGayuJuBPafzDz2Q4vyI_rBzA,4692
23
+ vision_agent/configs/config.py,sha256=FjpYViBJHMizgoZ3dp7T4Lbhbh1MHHstaG7icVdVsrU,4694
24
+ vision_agent/configs/openai_config.py,sha256=Bw7ElBYmBcaZttyRBoNpcy3uTkqg5qADk8LP0wse2NQ,4498
26
25
  vision_agent/fonts/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
27
26
  vision_agent/fonts/default_font_ch_en.ttf,sha256=1YM0Z3XqLDjSNbF7ihQFSAIUdjF9m1rtHiNC_6QosTE,1594400
28
27
  vision_agent/lmm/__init__.py,sha256=4qX2lmGnKWHeKftXueEi9xj_ieK2nQh_ipHf72nKGFk,84
29
- vision_agent/lmm/lmm.py,sha256=XYp1frrqQ-6q-0y2IWwM8-EIH5UrFZ21SAhkcM32J9w,19355
28
+ vision_agent/lmm/lmm.py,sha256=utGJMeGEKImqHrY0q9kGu0uK3owG8wKyDustwrDrLto,19421
30
29
  vision_agent/models/__init__.py,sha256=eIP0pD5dYog8zUA7uuTmUxCF6SIutbLRLRE0cmuCJgQ,326
31
30
  vision_agent/models/agent_types.py,sha256=vBZ9-ns5lHDdFMO7ulCGGeZ6OwRo3gK4O3vN0814IWc,3064
32
31
  vision_agent/models/lmm_types.py,sha256=v04h-NjbczHOIN8UWa1vvO5-1BDuZ4JQhD2mge1cXmw,305
33
32
  vision_agent/models/tools_types.py,sha256=8hYf2OZhI58gvf65KGaeGkt4EQ56nwLFqIQDPHioOBc,2339
34
33
  vision_agent/sim/__init__.py,sha256=Aouz6HEPPTYcLxR5_0fTYCL1OvPKAH1RMWAF90QXAlA,135
35
- vision_agent/sim/sim.py,sha256=xkioTFNTPl7wAnNgIFfNzswKK_9dRQ6G8OL8-K4CqsI,9893
34
+ vision_agent/sim/sim.py,sha256=8y060Ck7qOFJDw9k9Vl2xQYbLkNaTd6lP1YzbcwkkXc,9944
36
35
  vision_agent/tools/__init__.py,sha256=H7FWx0OXGVIjrSOTpNH-YwE4LBuOfThZTG-SHFpo_Z8,2576
37
36
  vision_agent/tools/meta_tools.py,sha256=DNRXHX9nZ1GBeqeLiq87sBshoe0aiZeYasETbG-9neI,24053
38
- vision_agent/tools/planner_tools.py,sha256=mlpUODpsN9sg-OKdsBm-6maK3eA97FUgAWm1etfgx4E,19553
37
+ vision_agent/tools/planner_tools.py,sha256=iQWtTgXdomn0IWrbmvXXM-y8Q_RSEOxyP04HIRLrgWI,19576
39
38
  vision_agent/tools/prompts.py,sha256=V1z4YJLXZuUl_iZ5rY0M5hHc_2tmMEUKr0WocXKGt4E,1430
40
- vision_agent/tools/tools.py,sha256=-jBrykNYPinRpDXnBsnzlSgJ_hbZClzCp3pkzWjTUxs,122098
39
+ vision_agent/tools/tools.py,sha256=4gwL8EFMwm6l0MujftJ8G8BO2z8Dh_a4FPjy_xUmYqs,121889
41
40
  vision_agent/utils/__init__.py,sha256=mANUs_84VL-3gpZbXryvV2mWU623eWnRlJCSUHtMjuw,122
42
41
  vision_agent/utils/agent.py,sha256=2ifTP5QElItnr4YHOJR6L5P1PUzV0GhChTTqVxuVyQg,15153
43
42
  vision_agent/utils/exceptions.py,sha256=zis8smCbdEylBVZBTVfEUfAh7Rb7cWV3MSPambu6FsQ,1837
44
43
  vision_agent/utils/execute.py,sha256=QAql6KC2uEhX1o_44mMA77lCmMUs0itaaGMFSfJBki8,21520
45
44
  vision_agent/utils/image_utils.py,sha256=bJM2mEvB6E__M9pxi74yQYzAiZ7mu3KE2ptyVrp5vzQ,12533
46
- vision_agent/utils/tools.py,sha256=lGELSZ3xmrUa1cHR4ey_f9gyDvWsIA8Q2R7G9LNGKiE,8036
45
+ vision_agent/utils/tools.py,sha256=_XGcF-Zd527BWNkGopBZeJ4j5ehreAkNsKQSBFrlvjw,8138
47
46
  vision_agent/utils/tools_doc.py,sha256=yFue6KSXoa_Z1ngCdBEc4SdPZOWF1rVLeaHu02I8Wis,2523
48
47
  vision_agent/utils/video.py,sha256=rjsQ1sKKisaQ6AVjJz0zd_G4g-ovRweS_rs4JEhenoI,5340
49
48
  vision_agent/utils/video_tracking.py,sha256=DZLFpNCuzuPJQzbQoVNcp-m4dKxgiKdCNM5QTh_zURE,12245
50
- vision_agent-1.0.3.dist-info/LICENSE,sha256=xx0jnfkXJvxRnG63LTGOxlggYnIysveWIZ6H3PNdCrQ,11357
51
- vision_agent-1.0.3.dist-info/METADATA,sha256=DQaYakxwHNuuKQvA7MpaPZ8oCZT5hdhfcCWzB_9zXI4,5940
52
- vision_agent-1.0.3.dist-info/WHEEL,sha256=7Z8_27uaHI_UZAc4Uox4PpBhQ9Y5_modZXWMxtUi4NU,88
53
- vision_agent-1.0.3.dist-info/RECORD,,
49
+ vision_agent-1.0.5.dist-info/LICENSE,sha256=xx0jnfkXJvxRnG63LTGOxlggYnIysveWIZ6H3PNdCrQ,11357
50
+ vision_agent-1.0.5.dist-info/METADATA,sha256=BFxGREHCEQJ6Qb-arJp2K0TTI6e_ygrkd_h8ZnJ9ou0,6746
51
+ vision_agent-1.0.5.dist-info/WHEEL,sha256=7Z8_27uaHI_UZAc4Uox4PpBhQ9Y5_modZXWMxtUi4NU,88
52
+ vision_agent-1.0.5.dist-info/RECORD,,
@@ -1,164 +0,0 @@
1
- from typing import Type
2
-
3
- from pydantic import BaseModel, Field
4
-
5
- from vision_agent.lmm import LMM, AnthropicLMM, OpenAILMM
6
-
7
-
8
- class Config(BaseModel):
9
- # for vision_agent_v2
10
- agent: Type[LMM] = Field(default=AnthropicLMM)
11
- agent_kwargs: dict = Field(
12
- default_factory=lambda: {
13
- "model_name": "claude-3-5-sonnet-20241022",
14
- "temperature": 0.0,
15
- "image_size": 768,
16
- }
17
- )
18
-
19
- # for vision_agent_planner_v2
20
- planner: Type[LMM] = Field(default=AnthropicLMM)
21
- planner_kwargs: dict = Field(
22
- default_factory=lambda: {
23
- "model_name": "claude-3-5-sonnet-20241022",
24
- "temperature": 0.0,
25
- "image_size": 768,
26
- }
27
- )
28
-
29
- # for vision_agent_planner_v2
30
- summarizer: Type[LMM] = Field(default=OpenAILMM)
31
- summarizer_kwargs: dict = Field(
32
- default_factory=lambda: {
33
- "model_name": "o1",
34
- "temperature": 1.0, # o1 has fixed temperature
35
- "image_size": 768,
36
- }
37
- )
38
-
39
- # for vision_agent_planner_v2
40
- critic: Type[LMM] = Field(default=AnthropicLMM)
41
- critic_kwargs: dict = Field(
42
- default_factory=lambda: {
43
- "model_name": "claude-3-5-sonnet-20241022",
44
- "temperature": 0.0,
45
- "image_size": 768,
46
- }
47
- )
48
-
49
- # for vision_agent_coder_v2
50
- coder: Type[LMM] = Field(default=AnthropicLMM)
51
- coder_kwargs: dict = Field(
52
- default_factory=lambda: {
53
- "model_name": "claude-3-5-sonnet-20241022",
54
- "temperature": 0.0,
55
- "image_size": 768,
56
- }
57
- )
58
-
59
- # for vision_agent_coder_v2
60
- tester: Type[LMM] = Field(default=AnthropicLMM)
61
- tester_kwargs: dict = Field(
62
- default_factory=lambda: {
63
- "model_name": "claude-3-5-sonnet-20241022",
64
- "temperature": 0.0,
65
- "image_size": 768,
66
- }
67
- )
68
-
69
- # for vision_agent_coder_v2
70
- debugger: Type[LMM] = Field(default=AnthropicLMM)
71
- debugger_kwargs: dict = Field(
72
- default_factory=lambda: {
73
- "model_name": "claude-3-5-sonnet-20241022",
74
- "temperature": 0.0,
75
- "image_size": 768,
76
- }
77
- )
78
-
79
- # for get_tool_for_task
80
- tool_tester: Type[LMM] = Field(default=AnthropicLMM)
81
- tool_tester_kwargs: dict = Field(
82
- default_factory=lambda: {
83
- "model_name": "claude-3-5-sonnet-20241022",
84
- "temperature": 0.0,
85
- "image_size": 768,
86
- }
87
- )
88
-
89
- # for get_tool_for_task
90
- tool_chooser: Type[LMM] = Field(default=AnthropicLMM)
91
- tool_chooser_kwargs: dict = Field(
92
- default_factory=lambda: {
93
- "model_name": "claude-3-5-sonnet-20241022",
94
- "temperature": 1.0,
95
- "image_size": 768,
96
- }
97
- )
98
-
99
- # for get_tool_for_task
100
- od_judge: Type[LMM] = Field(default=AnthropicLMM)
101
- od_judge_kwargs: dict = Field(
102
- default_factory=lambda: {
103
- "model_name": "claude-3-5-sonnet-20241022",
104
- "temperature": 0.0,
105
- "image_size": 512,
106
- }
107
- )
108
-
109
- # for suggestions module
110
- suggester: Type[LMM] = Field(default=OpenAILMM)
111
- suggester_kwargs: dict = Field(
112
- default_factory=lambda: {
113
- "model_name": "o1",
114
- "temperature": 1.0,
115
- "image_detail": "high",
116
- "image_size": 1024,
117
- }
118
- )
119
-
120
- # for vqa module
121
- vqa: Type[LMM] = Field(default=AnthropicLMM)
122
- vqa_kwargs: dict = Field(
123
- default_factory=lambda: {
124
- "model_name": "claude-3-5-sonnet-20241022",
125
- "temperature": 0.0,
126
- "image_size": 768,
127
- }
128
- )
129
-
130
- def create_agent(self) -> LMM:
131
- return self.agent(**self.agent_kwargs)
132
-
133
- def create_planner(self) -> LMM:
134
- return self.planner(**self.planner_kwargs)
135
-
136
- def create_summarizer(self) -> LMM:
137
- return self.summarizer(**self.summarizer_kwargs)
138
-
139
- def create_critic(self) -> LMM:
140
- return self.critic(**self.critic_kwargs)
141
-
142
- def create_coder(self) -> LMM:
143
- return self.coder(**self.coder_kwargs)
144
-
145
- def create_tester(self) -> LMM:
146
- return self.tester(**self.tester_kwargs)
147
-
148
- def create_debugger(self) -> LMM:
149
- return self.debugger(**self.debugger_kwargs)
150
-
151
- def create_tool_tester(self) -> LMM:
152
- return self.tool_tester(**self.tool_tester_kwargs)
153
-
154
- def create_tool_chooser(self) -> LMM:
155
- return self.tool_chooser(**self.tool_chooser_kwargs)
156
-
157
- def create_od_judge(self) -> LMM:
158
- return self.od_judge(**self.od_judge_kwargs)
159
-
160
- def create_suggester(self) -> LMM:
161
- return self.suggester(**self.suggester_kwargs)
162
-
163
- def create_vqa(self) -> LMM:
164
- return self.vqa(**self.vqa_kwargs)