vision-agent 0.2.244__tar.gz → 0.2.246__tar.gz
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- {vision_agent-0.2.244 → vision_agent-0.2.246}/PKG-INFO +1 -1
- {vision_agent-0.2.244 → vision_agent-0.2.246}/pyproject.toml +1 -1
- {vision_agent-0.2.244 → vision_agent-0.2.246}/vision_agent/agent/vision_agent_planner.py +1 -1
- {vision_agent-0.2.244 → vision_agent-0.2.246}/vision_agent/agent/vision_agent_planner_v2.py +2 -1
- {vision_agent-0.2.244 → vision_agent-0.2.246}/vision_agent/agent/vision_agent_prompts_v2.py +11 -1
- {vision_agent-0.2.244 → vision_agent-0.2.246}/LICENSE +0 -0
- {vision_agent-0.2.244 → vision_agent-0.2.246}/README.md +0 -0
- {vision_agent-0.2.244 → vision_agent-0.2.246}/vision_agent/.sim_tools/df.csv +0 -0
- {vision_agent-0.2.244 → vision_agent-0.2.246}/vision_agent/.sim_tools/embs.npy +0 -0
- {vision_agent-0.2.244 → vision_agent-0.2.246}/vision_agent/__init__.py +0 -0
- {vision_agent-0.2.244 → vision_agent-0.2.246}/vision_agent/agent/README.md +0 -0
- {vision_agent-0.2.244 → vision_agent-0.2.246}/vision_agent/agent/__init__.py +0 -0
- {vision_agent-0.2.244 → vision_agent-0.2.246}/vision_agent/agent/agent.py +0 -0
- {vision_agent-0.2.244 → vision_agent-0.2.246}/vision_agent/agent/vision_agent.py +0 -0
- {vision_agent-0.2.244 → vision_agent-0.2.246}/vision_agent/agent/vision_agent_coder.py +0 -0
- {vision_agent-0.2.244 → vision_agent-0.2.246}/vision_agent/agent/vision_agent_coder_prompts.py +0 -0
- {vision_agent-0.2.244 → vision_agent-0.2.246}/vision_agent/agent/vision_agent_coder_prompts_v2.py +0 -0
- {vision_agent-0.2.244 → vision_agent-0.2.246}/vision_agent/agent/vision_agent_coder_v2.py +0 -0
- {vision_agent-0.2.244 → vision_agent-0.2.246}/vision_agent/agent/vision_agent_planner_prompts.py +0 -0
- {vision_agent-0.2.244 → vision_agent-0.2.246}/vision_agent/agent/vision_agent_planner_prompts_v2.py +0 -0
- {vision_agent-0.2.244 → vision_agent-0.2.246}/vision_agent/agent/vision_agent_prompts.py +0 -0
- {vision_agent-0.2.244 → vision_agent-0.2.246}/vision_agent/agent/vision_agent_v2.py +0 -0
- {vision_agent-0.2.244 → vision_agent-0.2.246}/vision_agent/clients/__init__.py +0 -0
- {vision_agent-0.2.244 → vision_agent-0.2.246}/vision_agent/clients/http.py +0 -0
- {vision_agent-0.2.244 → vision_agent-0.2.246}/vision_agent/configs/__init__.py +0 -0
- {vision_agent-0.2.244 → vision_agent-0.2.246}/vision_agent/configs/anthropic_config.py +0 -0
- {vision_agent-0.2.244 → vision_agent-0.2.246}/vision_agent/configs/anthropic_openai_config.py +0 -0
- {vision_agent-0.2.244 → vision_agent-0.2.246}/vision_agent/configs/config.py +0 -0
- {vision_agent-0.2.244 → vision_agent-0.2.246}/vision_agent/configs/openai_config.py +0 -0
- {vision_agent-0.2.244 → vision_agent-0.2.246}/vision_agent/fonts/__init__.py +0 -0
- {vision_agent-0.2.244 → vision_agent-0.2.246}/vision_agent/fonts/default_font_ch_en.ttf +0 -0
- {vision_agent-0.2.244 → vision_agent-0.2.246}/vision_agent/lmm/__init__.py +0 -0
- {vision_agent-0.2.244 → vision_agent-0.2.246}/vision_agent/lmm/lmm.py +0 -0
- {vision_agent-0.2.244 → vision_agent-0.2.246}/vision_agent/models/__init__.py +0 -0
- {vision_agent-0.2.244 → vision_agent-0.2.246}/vision_agent/models/agent_types.py +0 -0
- {vision_agent-0.2.244 → vision_agent-0.2.246}/vision_agent/models/lmm_types.py +0 -0
- {vision_agent-0.2.244 → vision_agent-0.2.246}/vision_agent/models/tools_types.py +0 -0
- {vision_agent-0.2.244 → vision_agent-0.2.246}/vision_agent/sim/__init__.py +0 -0
- {vision_agent-0.2.244 → vision_agent-0.2.246}/vision_agent/sim/sim.py +0 -0
- {vision_agent-0.2.244 → vision_agent-0.2.246}/vision_agent/tools/__init__.py +0 -0
- {vision_agent-0.2.244 → vision_agent-0.2.246}/vision_agent/tools/meta_tools.py +0 -0
- {vision_agent-0.2.244 → vision_agent-0.2.246}/vision_agent/tools/planner_tools.py +0 -0
- {vision_agent-0.2.244 → vision_agent-0.2.246}/vision_agent/tools/prompts.py +0 -0
- {vision_agent-0.2.244 → vision_agent-0.2.246}/vision_agent/tools/tools.py +0 -0
- {vision_agent-0.2.244 → vision_agent-0.2.246}/vision_agent/utils/__init__.py +0 -0
- {vision_agent-0.2.244 → vision_agent-0.2.246}/vision_agent/utils/agent.py +0 -0
- {vision_agent-0.2.244 → vision_agent-0.2.246}/vision_agent/utils/exceptions.py +0 -0
- {vision_agent-0.2.244 → vision_agent-0.2.246}/vision_agent/utils/execute.py +0 -0
- {vision_agent-0.2.244 → vision_agent-0.2.246}/vision_agent/utils/image_utils.py +0 -0
- {vision_agent-0.2.244 → vision_agent-0.2.246}/vision_agent/utils/tools.py +0 -0
- {vision_agent-0.2.244 → vision_agent-0.2.246}/vision_agent/utils/tools_doc.py +0 -0
- {vision_agent-0.2.244 → vision_agent-0.2.246}/vision_agent/utils/type_defs.py +0 -0
- {vision_agent-0.2.244 → vision_agent-0.2.246}/vision_agent/utils/video.py +0 -0
- {vision_agent-0.2.244 → vision_agent-0.2.246}/vision_agent/utils/video_tracking.py +0 -0
@@ -410,7 +410,7 @@ class VisionAgentPlanner(Agent):
|
|
410
410
|
plans = write_plans(
|
411
411
|
chat,
|
412
412
|
get_tool_descriptions_by_names(
|
413
|
-
custom_tool_names, T.FUNCTION_TOOLS, T.UTIL_TOOLS # type: ignore
|
413
|
+
custom_tool_names, T.tools.FUNCTION_TOOLS, T.tools.UTIL_TOOLS # type: ignore
|
414
414
|
),
|
415
415
|
format_feedback(working_memory),
|
416
416
|
self.planner,
|
@@ -317,7 +317,8 @@ def maybe_run_code(
|
|
317
317
|
media_data = capture_media_from_exec(execution)
|
318
318
|
int_chat_elt = AgentMessage(role="observation", content=obs, media=None)
|
319
319
|
if media_list:
|
320
|
-
|
320
|
+
# Don't send more than 3 media files to the planner or it can get overloaded
|
321
|
+
int_chat_elt.media = cast(List[Union[str, Path]], media_data[:3])
|
321
322
|
return_chat.append(int_chat_elt)
|
322
323
|
else:
|
323
324
|
return_chat.append(AgentMessage(role="planner", content=response, media=None))
|
@@ -54,12 +54,22 @@ AGENT: <response>I am VisionAgent, an agent built by LandingAI, to help users wr
|
|
54
54
|
- Understanding documents
|
55
55
|
- Pose estimation
|
56
56
|
- Visual question answering for both images and videos
|
57
|
-
-
|
57
|
+
- Activity recognition in videos
|
58
58
|
- Image inpainting
|
59
59
|
|
60
60
|
How can I help you?</response>
|
61
61
|
--- END EXAMPLE2 ---
|
62
62
|
|
63
|
+
**Helpful Context**:
|
64
|
+
- You are helping the user write vision code that utilizes the `vision-agent` library to solve different vision tasks.
|
65
|
+
- The goal is to write code the user can use to solve a visual task and then deploy the code so they can run it repeatedly on that task.
|
66
|
+
- If the user wants to run the code, they can `pip install vision-agent` to install the library, copy the code, and run it locally themselves.
|
67
|
+
- They can find the vision-agent source code at https://github.com/landing-ai/vision-agent. They can find the documentation for vision-agent at https://landing-ai.github.io/vision-agent/.
|
68
|
+
- The code utilizes LandingAI's API to run the different tools, the API is free to use and does not require an API key.
|
69
|
+
- The user can run VisionAgent (you) from two places, either on our website at https://va.landing.ai or locally.
|
70
|
+
- If the user is running VisionAgent on the website, they can only upload images or videos, nothing else at the moment. They can view files created by VisionAgent by clicking the "Files" button in the upper right part of the screen.
|
71
|
+
- If the user is running VisionAgent locally they can ask it to do more things like run over files in a folder. They can view files created by VisionAgent by checking their local file system.
|
72
|
+
|
63
73
|
**Conversation**:
|
64
74
|
Here is the current conversation so far:
|
65
75
|
--- START CONVERSATION ---
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
{vision_agent-0.2.244 → vision_agent-0.2.246}/vision_agent/agent/vision_agent_coder_prompts.py
RENAMED
File without changes
|
{vision_agent-0.2.244 → vision_agent-0.2.246}/vision_agent/agent/vision_agent_coder_prompts_v2.py
RENAMED
File without changes
|
File without changes
|
{vision_agent-0.2.244 → vision_agent-0.2.246}/vision_agent/agent/vision_agent_planner_prompts.py
RENAMED
File without changes
|
{vision_agent-0.2.244 → vision_agent-0.2.246}/vision_agent/agent/vision_agent_planner_prompts_v2.py
RENAMED
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
{vision_agent-0.2.244 → vision_agent-0.2.246}/vision_agent/configs/anthropic_openai_config.py
RENAMED
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|