vision_agent-0.2.73-py3-none-any.whl → vision_agent-0.2.75-py3-none-any.whl

This diff compares the contents of two publicly available versions of a package, each of which has been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between the package versions as they appear in their respective public registries.
vision_agent/agent/vision_agent.py CHANGED
@@ -437,7 +437,7 @@ def retrieve_tools(
437
437
  {
438
438
  "type": "tools",
439
439
  "status": "completed",
440
- "payload": {v["description"]: v for v in tool_list}.values(),
440
+ "payload": list({v["description"]: v for v in tool_list}.values()),
441
441
  }
442
442
  )
443
443
 
vision_agent/lmm/lmm.py CHANGED
@@ -164,6 +164,7 @@ class OpenAILMM(LMM):
164
164
  {"role": "system", "content": SYSTEM_PROMPT},
165
165
  {"role": "user", "content": prompt},
166
166
  ],
167
+ response_format={"type": "json_object"},
167
168
  )
168
169
 
169
170
  try:
@@ -179,7 +180,7 @@ class OpenAILMM(LMM):
179
180
  return lambda x: T.clip(x, params["prompt"])
180
181
 
181
182
  def generate_detector(self, question: str) -> Callable:
182
- api_doc = T.get_tool_documentation([T.grounding_dino])
183
+ api_doc = T.get_tool_documentation([T.owl_v2])
183
184
  prompt = CHOOSE_PARAMS.format(api_doc=api_doc, question=question)
184
185
  response = self.client.chat.completions.create(
185
186
  model=self.model_name,
@@ -187,6 +188,7 @@ class OpenAILMM(LMM):
187
188
  {"role": "system", "content": SYSTEM_PROMPT},
188
189
  {"role": "user", "content": prompt},
189
190
  ],
191
+ response_format={"type": "json_object"},
190
192
  )
191
193
 
192
194
  try:
@@ -199,7 +201,7 @@ class OpenAILMM(LMM):
199
201
  )
200
202
  raise ValueError("Failed to decode response")
201
203
 
202
- return lambda x: T.grounding_dino(params["prompt"], x)
204
+ return lambda x: T.owl_v2(params["prompt"], x)
203
205
 
204
206
  def generate_segmentor(self, question: str) -> Callable:
205
207
  api_doc = T.get_tool_documentation([T.grounding_sam])
@@ -210,6 +212,7 @@ class OpenAILMM(LMM):
210
212
  {"role": "system", "content": SYSTEM_PROMPT},
211
213
  {"role": "user", "content": prompt},
212
214
  ],
215
+ response_format={"type": "json_object"},
213
216
  )
214
217
 
215
218
  try:
vision_agent-0.2.75.dist-info/METADATA CHANGED
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.1
2
2
  Name: vision-agent
3
- Version: 0.2.73
3
+ Version: 0.2.75
4
4
  Summary: Toolset for Vision Agent
5
5
  Author: Landing AI
6
6
  Author-email: dev@landing.ai
@@ -182,8 +182,8 @@ you. For example:
182
182
 
183
183
  ```python
184
184
  >>> import vision_agent as va
185
- >>> llm = va.llm.OpenAILMM()
186
- >>> detector = llm.generate_detector("Can you build a jar detector for me?")
185
+ >>> lmm = va.lmm.OpenAILMM()
186
+ >>> detector = lmm.generate_detector("Can you build a jar detector for me?")
187
187
  >>> detector(va.tools.load_image("jar.jpg"))
188
188
  [{"labels": ["jar",],
189
189
  "scores": [0.99],
vision_agent-0.2.75.dist-info/RECORD CHANGED
@@ -1,12 +1,12 @@
1
1
  vision_agent/__init__.py,sha256=EAb4-f9iyuEYkBrX4ag1syM8Syx8118_t0R6_C34M9w,57
2
2
  vision_agent/agent/__init__.py,sha256=IUwfbPMcT8X_rnXMLmI8gJ4ltsHy_XSs9eLiKURJxeY,81
3
3
  vision_agent/agent/agent.py,sha256=ZK-5lOtd9-eD9aWcXssJpnOyvZuO7_5hAmnb-6sWVe8,569
4
- vision_agent/agent/vision_agent.py,sha256=iYSGSz-6P0fjAqRafpJMrVYBa0kX_3cw2CA-okEJ_WE,25710
4
+ vision_agent/agent/vision_agent.py,sha256=gdWdjTOZ0KK3dnol8b_yf8MSErBPlbqgsd0lhYdZrLw,25716
5
5
  vision_agent/agent/vision_agent_prompts.py,sha256=jpGJjrxDrxZej5SSgsTEK1sSYttgkTiZqxZAU1jWfvk,8656
6
6
  vision_agent/fonts/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
7
7
  vision_agent/fonts/default_font_ch_en.ttf,sha256=1YM0Z3XqLDjSNbF7ihQFSAIUdjF9m1rtHiNC_6QosTE,1594400
8
8
  vision_agent/lmm/__init__.py,sha256=bw24xyQJHGzmph5e-bKCiTh9AX6tRFI2OUd0mofxjZI,68
9
- vision_agent/lmm/lmm.py,sha256=V7jfU94HwA-SiQLY14USHrSGtagVKCNGjZhW5MyKipo,11547
9
+ vision_agent/lmm/lmm.py,sha256=TzzACjTP1MNSrHolUWY7fEJzdVfZELQyImRpT8IU_1E,11690
10
10
  vision_agent/tools/__init__.py,sha256=aE1O8cMeLDPO50Sc-CuAQ_Akh0viz7vBxDcVeZNqsA0,1604
11
11
  vision_agent/tools/prompts.py,sha256=V1z4YJLXZuUl_iZ5rY0M5hHc_2tmMEUKr0WocXKGt4E,1430
12
12
  vision_agent/tools/tool_utils.py,sha256=ZOY45bCX3nlo6iGwaZ8RVpRJB-vWxkXDed9oegT7-p0,1838
@@ -17,7 +17,7 @@ vision_agent/utils/image_utils.py,sha256=_cdiS5YrLzqkq_ZgFUO897m5M4_SCIThwUy4lOk
17
17
  vision_agent/utils/sim.py,sha256=ci6Eta73dDgLP1Ajtknbgmf1g8aAvBHqlVQvBuLMKXQ,4427
18
18
  vision_agent/utils/type_defs.py,sha256=BlI8ywWHAplC7kYWLvt4AOdnKpEW3qWEFm-GEOSkrFQ,1792
19
19
  vision_agent/utils/video.py,sha256=rNmU9KEIkZB5-EztZNlUiKYN0mm_55A_2VGUM0QpqLA,8779
20
- vision_agent-0.2.73.dist-info/LICENSE,sha256=xx0jnfkXJvxRnG63LTGOxlggYnIysveWIZ6H3PNdCrQ,11357
21
- vision_agent-0.2.73.dist-info/METADATA,sha256=7w2efZn2Qyw6wAXN2NLRJwEMvBb1_1lUovoSNz30y68,9405
22
- vision_agent-0.2.73.dist-info/WHEEL,sha256=7Z8_27uaHI_UZAc4Uox4PpBhQ9Y5_modZXWMxtUi4NU,88
23
- vision_agent-0.2.73.dist-info/RECORD,,
20
+ vision_agent-0.2.75.dist-info/LICENSE,sha256=xx0jnfkXJvxRnG63LTGOxlggYnIysveWIZ6H3PNdCrQ,11357
21
+ vision_agent-0.2.75.dist-info/METADATA,sha256=Y0bkCNXRi71LZ09EFHasQ8HJ0dvX54mIeW1IkPfQhvo,9405
22
+ vision_agent-0.2.75.dist-info/WHEEL,sha256=7Z8_27uaHI_UZAc4Uox4PpBhQ9Y5_modZXWMxtUi4NU,88
23
+ vision_agent-0.2.75.dist-info/RECORD,,