vision-agent 0.2.73__py3-none-any.whl → 0.2.75__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- vision_agent/agent/vision_agent.py +1 -1
- vision_agent/lmm/lmm.py +5 -2
- {vision_agent-0.2.73.dist-info → vision_agent-0.2.75.dist-info}/METADATA +3 -3
- {vision_agent-0.2.73.dist-info → vision_agent-0.2.75.dist-info}/RECORD +6 -6
- {vision_agent-0.2.73.dist-info → vision_agent-0.2.75.dist-info}/LICENSE +0 -0
- {vision_agent-0.2.73.dist-info → vision_agent-0.2.75.dist-info}/WHEEL +0 -0
vision_agent/lmm/lmm.py
CHANGED
@@ -164,6 +164,7 @@ class OpenAILMM(LMM):
|
|
164
164
|
{"role": "system", "content": SYSTEM_PROMPT},
|
165
165
|
{"role": "user", "content": prompt},
|
166
166
|
],
|
167
|
+
response_format={"type": "json_object"},
|
167
168
|
)
|
168
169
|
|
169
170
|
try:
|
@@ -179,7 +180,7 @@ class OpenAILMM(LMM):
|
|
179
180
|
return lambda x: T.clip(x, params["prompt"])
|
180
181
|
|
181
182
|
def generate_detector(self, question: str) -> Callable:
|
182
|
-
api_doc = T.get_tool_documentation([T.
|
183
|
+
api_doc = T.get_tool_documentation([T.owl_v2])
|
183
184
|
prompt = CHOOSE_PARAMS.format(api_doc=api_doc, question=question)
|
184
185
|
response = self.client.chat.completions.create(
|
185
186
|
model=self.model_name,
|
@@ -187,6 +188,7 @@ class OpenAILMM(LMM):
|
|
187
188
|
{"role": "system", "content": SYSTEM_PROMPT},
|
188
189
|
{"role": "user", "content": prompt},
|
189
190
|
],
|
191
|
+
response_format={"type": "json_object"},
|
190
192
|
)
|
191
193
|
|
192
194
|
try:
|
@@ -199,7 +201,7 @@ class OpenAILMM(LMM):
|
|
199
201
|
)
|
200
202
|
raise ValueError("Failed to decode response")
|
201
203
|
|
202
|
-
return lambda x: T.
|
204
|
+
return lambda x: T.owl_v2(params["prompt"], x)
|
203
205
|
|
204
206
|
def generate_segmentor(self, question: str) -> Callable:
|
205
207
|
api_doc = T.get_tool_documentation([T.grounding_sam])
|
@@ -210,6 +212,7 @@ class OpenAILMM(LMM):
|
|
210
212
|
{"role": "system", "content": SYSTEM_PROMPT},
|
211
213
|
{"role": "user", "content": prompt},
|
212
214
|
],
|
215
|
+
response_format={"type": "json_object"},
|
213
216
|
)
|
214
217
|
|
215
218
|
try:
|
@@ -1,6 +1,6 @@
|
|
1
1
|
Metadata-Version: 2.1
|
2
2
|
Name: vision-agent
|
3
|
-
Version: 0.2.73
|
3
|
+
Version: 0.2.75
|
4
4
|
Summary: Toolset for Vision Agent
|
5
5
|
Author: Landing AI
|
6
6
|
Author-email: dev@landing.ai
|
@@ -182,8 +182,8 @@ you. For example:
|
|
182
182
|
|
183
183
|
```python
|
184
184
|
>>> import vision_agent as va
|
185
|
-
>>>
|
186
|
-
>>> detector =
|
185
|
+
>>> lmm = va.lmm.OpenAILMM()
|
186
|
+
>>> detector = lmm.generate_detector("Can you build a jar detector for me?")
|
187
187
|
>>> detector(va.tools.load_image("jar.jpg"))
|
188
188
|
[{"labels": ["jar",],
|
189
189
|
"scores": [0.99],
|
@@ -1,12 +1,12 @@
|
|
1
1
|
vision_agent/__init__.py,sha256=EAb4-f9iyuEYkBrX4ag1syM8Syx8118_t0R6_C34M9w,57
|
2
2
|
vision_agent/agent/__init__.py,sha256=IUwfbPMcT8X_rnXMLmI8gJ4ltsHy_XSs9eLiKURJxeY,81
|
3
3
|
vision_agent/agent/agent.py,sha256=ZK-5lOtd9-eD9aWcXssJpnOyvZuO7_5hAmnb-6sWVe8,569
|
4
|
-
vision_agent/agent/vision_agent.py,sha256=
|
4
|
+
vision_agent/agent/vision_agent.py,sha256=gdWdjTOZ0KK3dnol8b_yf8MSErBPlbqgsd0lhYdZrLw,25716
|
5
5
|
vision_agent/agent/vision_agent_prompts.py,sha256=jpGJjrxDrxZej5SSgsTEK1sSYttgkTiZqxZAU1jWfvk,8656
|
6
6
|
vision_agent/fonts/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
7
7
|
vision_agent/fonts/default_font_ch_en.ttf,sha256=1YM0Z3XqLDjSNbF7ihQFSAIUdjF9m1rtHiNC_6QosTE,1594400
|
8
8
|
vision_agent/lmm/__init__.py,sha256=bw24xyQJHGzmph5e-bKCiTh9AX6tRFI2OUd0mofxjZI,68
|
9
|
-
vision_agent/lmm/lmm.py,sha256=
|
9
|
+
vision_agent/lmm/lmm.py,sha256=TzzACjTP1MNSrHolUWY7fEJzdVfZELQyImRpT8IU_1E,11690
|
10
10
|
vision_agent/tools/__init__.py,sha256=aE1O8cMeLDPO50Sc-CuAQ_Akh0viz7vBxDcVeZNqsA0,1604
|
11
11
|
vision_agent/tools/prompts.py,sha256=V1z4YJLXZuUl_iZ5rY0M5hHc_2tmMEUKr0WocXKGt4E,1430
|
12
12
|
vision_agent/tools/tool_utils.py,sha256=ZOY45bCX3nlo6iGwaZ8RVpRJB-vWxkXDed9oegT7-p0,1838
|
@@ -17,7 +17,7 @@ vision_agent/utils/image_utils.py,sha256=_cdiS5YrLzqkq_ZgFUO897m5M4_SCIThwUy4lOk
|
|
17
17
|
vision_agent/utils/sim.py,sha256=ci6Eta73dDgLP1Ajtknbgmf1g8aAvBHqlVQvBuLMKXQ,4427
|
18
18
|
vision_agent/utils/type_defs.py,sha256=BlI8ywWHAplC7kYWLvt4AOdnKpEW3qWEFm-GEOSkrFQ,1792
|
19
19
|
vision_agent/utils/video.py,sha256=rNmU9KEIkZB5-EztZNlUiKYN0mm_55A_2VGUM0QpqLA,8779
|
20
|
-
vision_agent-0.2.73.dist-info/LICENSE,sha256=xx0jnfkXJvxRnG63LTGOxlggYnIysveWIZ6H3PNdCrQ,11357
|
21
|
-
vision_agent-0.2.
|
22
|
-
vision_agent-0.2.73.dist-info/WHEEL,sha256=7Z8_27uaHI_UZAc4Uox4PpBhQ9Y5_modZXWMxtUi4NU,88
|
23
|
-
vision_agent-0.2.73.dist-info/RECORD,,
|
20
|
+
vision_agent-0.2.75.dist-info/LICENSE,sha256=xx0jnfkXJvxRnG63LTGOxlggYnIysveWIZ6H3PNdCrQ,11357
|
21
|
+
vision_agent-0.2.75.dist-info/METADATA,sha256=Y0bkCNXRi71LZ09EFHasQ8HJ0dvX54mIeW1IkPfQhvo,9405
|
22
|
+
vision_agent-0.2.75.dist-info/WHEEL,sha256=7Z8_27uaHI_UZAc4Uox4PpBhQ9Y5_modZXWMxtUi4NU,88
|
23
|
+
vision_agent-0.2.75.dist-info/RECORD,,
|
File without changes
|
File without changes
|