vision-agent 0.2.233__tar.gz → 0.2.234__tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (52)
  1. {vision_agent-0.2.233 → vision_agent-0.2.234}/PKG-INFO +1 -1
  2. {vision_agent-0.2.233 → vision_agent-0.2.234}/pyproject.toml +1 -1
  3. {vision_agent-0.2.233 → vision_agent-0.2.234}/vision_agent/agent/vision_agent_planner_prompts_v2.py +1 -1
  4. {vision_agent-0.2.233 → vision_agent-0.2.234}/vision_agent/agent/vision_agent_planner_v2.py +2 -3
  5. {vision_agent-0.2.233 → vision_agent-0.2.234}/vision_agent/agent/vision_agent_v2.py +1 -2
  6. {vision_agent-0.2.233 → vision_agent-0.2.234}/LICENSE +0 -0
  7. {vision_agent-0.2.233 → vision_agent-0.2.234}/README.md +0 -0
  8. {vision_agent-0.2.233 → vision_agent-0.2.234}/vision_agent/.sim_tools/df.csv +0 -0
  9. {vision_agent-0.2.233 → vision_agent-0.2.234}/vision_agent/.sim_tools/embs.npy +0 -0
  10. {vision_agent-0.2.233 → vision_agent-0.2.234}/vision_agent/__init__.py +0 -0
  11. {vision_agent-0.2.233 → vision_agent-0.2.234}/vision_agent/agent/README.md +0 -0
  12. {vision_agent-0.2.233 → vision_agent-0.2.234}/vision_agent/agent/__init__.py +0 -0
  13. {vision_agent-0.2.233 → vision_agent-0.2.234}/vision_agent/agent/agent.py +0 -0
  14. {vision_agent-0.2.233 → vision_agent-0.2.234}/vision_agent/agent/agent_utils.py +0 -0
  15. {vision_agent-0.2.233 → vision_agent-0.2.234}/vision_agent/agent/types.py +0 -0
  16. {vision_agent-0.2.233 → vision_agent-0.2.234}/vision_agent/agent/vision_agent.py +0 -0
  17. {vision_agent-0.2.233 → vision_agent-0.2.234}/vision_agent/agent/vision_agent_coder.py +0 -0
  18. {vision_agent-0.2.233 → vision_agent-0.2.234}/vision_agent/agent/vision_agent_coder_prompts.py +0 -0
  19. {vision_agent-0.2.233 → vision_agent-0.2.234}/vision_agent/agent/vision_agent_coder_prompts_v2.py +0 -0
  20. {vision_agent-0.2.233 → vision_agent-0.2.234}/vision_agent/agent/vision_agent_coder_v2.py +0 -0
  21. {vision_agent-0.2.233 → vision_agent-0.2.234}/vision_agent/agent/vision_agent_planner.py +0 -0
  22. {vision_agent-0.2.233 → vision_agent-0.2.234}/vision_agent/agent/vision_agent_planner_prompts.py +0 -0
  23. {vision_agent-0.2.233 → vision_agent-0.2.234}/vision_agent/agent/vision_agent_prompts.py +0 -0
  24. {vision_agent-0.2.233 → vision_agent-0.2.234}/vision_agent/agent/vision_agent_prompts_v2.py +0 -0
  25. {vision_agent-0.2.233 → vision_agent-0.2.234}/vision_agent/clients/__init__.py +0 -0
  26. {vision_agent-0.2.233 → vision_agent-0.2.234}/vision_agent/clients/http.py +0 -0
  27. {vision_agent-0.2.233 → vision_agent-0.2.234}/vision_agent/clients/landing_public_api.py +0 -0
  28. {vision_agent-0.2.233 → vision_agent-0.2.234}/vision_agent/configs/__init__.py +0 -0
  29. {vision_agent-0.2.233 → vision_agent-0.2.234}/vision_agent/configs/anthropic_config.py +0 -0
  30. {vision_agent-0.2.233 → vision_agent-0.2.234}/vision_agent/configs/anthropic_openai_config.py +0 -0
  31. {vision_agent-0.2.233 → vision_agent-0.2.234}/vision_agent/configs/config.py +0 -0
  32. {vision_agent-0.2.233 → vision_agent-0.2.234}/vision_agent/configs/openai_config.py +0 -0
  33. {vision_agent-0.2.233 → vision_agent-0.2.234}/vision_agent/fonts/__init__.py +0 -0
  34. {vision_agent-0.2.233 → vision_agent-0.2.234}/vision_agent/fonts/default_font_ch_en.ttf +0 -0
  35. {vision_agent-0.2.233 → vision_agent-0.2.234}/vision_agent/lmm/__init__.py +0 -0
  36. {vision_agent-0.2.233 → vision_agent-0.2.234}/vision_agent/lmm/lmm.py +0 -0
  37. {vision_agent-0.2.233 → vision_agent-0.2.234}/vision_agent/lmm/types.py +0 -0
  38. {vision_agent-0.2.233 → vision_agent-0.2.234}/vision_agent/tools/__init__.py +0 -0
  39. {vision_agent-0.2.233 → vision_agent-0.2.234}/vision_agent/tools/meta_tools.py +0 -0
  40. {vision_agent-0.2.233 → vision_agent-0.2.234}/vision_agent/tools/planner_tools.py +0 -0
  41. {vision_agent-0.2.233 → vision_agent-0.2.234}/vision_agent/tools/prompts.py +0 -0
  42. {vision_agent-0.2.233 → vision_agent-0.2.234}/vision_agent/tools/tool_utils.py +0 -0
  43. {vision_agent-0.2.233 → vision_agent-0.2.234}/vision_agent/tools/tools.py +0 -0
  44. {vision_agent-0.2.233 → vision_agent-0.2.234}/vision_agent/tools/tools_types.py +0 -0
  45. {vision_agent-0.2.233 → vision_agent-0.2.234}/vision_agent/utils/__init__.py +0 -0
  46. {vision_agent-0.2.233 → vision_agent-0.2.234}/vision_agent/utils/exceptions.py +0 -0
  47. {vision_agent-0.2.233 → vision_agent-0.2.234}/vision_agent/utils/execute.py +0 -0
  48. {vision_agent-0.2.233 → vision_agent-0.2.234}/vision_agent/utils/image_utils.py +0 -0
  49. {vision_agent-0.2.233 → vision_agent-0.2.234}/vision_agent/utils/sim.py +0 -0
  50. {vision_agent-0.2.233 → vision_agent-0.2.234}/vision_agent/utils/type_defs.py +0 -0
  51. {vision_agent-0.2.233 → vision_agent-0.2.234}/vision_agent/utils/video.py +0 -0
  52. {vision_agent-0.2.233 → vision_agent-0.2.234}/vision_agent/utils/video_tracking.py +0 -0
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.1
2
2
  Name: vision-agent
3
- Version: 0.2.233
3
+ Version: 0.2.234
4
4
  Summary: Toolset for Vision Agent
5
5
  Author: Landing AI
6
6
  Author-email: dev@landing.ai
@@ -4,7 +4,7 @@ build-backend = "poetry.core.masonry.api"
4
4
 
5
5
  [tool.poetry]
6
6
  name = "vision-agent"
7
- version = "0.2.233"
7
+ version = "0.2.234"
8
8
  description = "Toolset for Vision Agent"
9
9
  authors = ["Landing AI <dev@landing.ai>"]
10
10
  readme = "README.md"
@@ -20,7 +20,7 @@ PLAN = """
20
20
  3. Only output <finalize_plan> when you are done planning and want to end the planning process. DO NOT output <finalize_plan> with <execute_python> tags, only after OBSERVATION's.
21
21
  4. Only load/save files from {media_list} unless you specifically saved the file previously.
22
22
  5. Ensure you always call `suggestion` initially and `get_tool_for_task` to get the right tool for the subtask.
23
- 6. Calling `plt.imshow` or `save_image` will display the image to you, use this to visually check your results.
23
+ 6. Calling `plt.imshow` or `save_image` will display the image to you so you can check your results. If you see an image after <execute_python> it's generated from your code.
24
24
  7. DO NOT hard code the answer into your code, it should be dynamic and work for any similar request.
25
25
  8. DO NOT over index on claude35_vqa, if tool output is close to claude35_vqa's output you do not need to improve the tool.
26
26
  9. You can only respond in the following format with a single <thinking>, <execute_python> or <finalize_plan> tag:
@@ -97,8 +97,7 @@ def run_planning(
97
97
  media_list: List[Union[str, Path]],
98
98
  model: LMM,
99
99
  ) -> str:
100
- # only keep last 10 messages for planning
101
- planning = get_planning(chat[-10:])
100
+ planning = get_planning(chat)
102
101
  prompt = PLAN.format(
103
102
  tool_desc=PLANNING_TOOLS_DOCSTRING,
104
103
  examples=f"{EXAMPLE_PLAN1}\n{EXAMPLE_PLAN2}",
@@ -372,7 +371,7 @@ def replace_interaction_with_obs(chat: List[AgentMessage]) -> List[AgentMessage]
372
371
  function_name = response["function_name"]
373
372
  tool_doc = get_tool_documentation(function_name)
374
373
  if "box_threshold" in response:
375
- tool_doc = f"Use the following function with box_threshold={response['box_threshold']}\n\n{tool_doc}"
374
+ tool_doc = f"Use the following function with box_threshold={response['box_threshold']}. This tool and its parameters were chosen by the user so do not change them in your planning.\n\n{tool_doc}."
376
375
  new_chat.append(AgentMessage(role="observation", content=tool_doc))
377
376
  except (json.JSONDecodeError, KeyError):
378
377
  raise ValueError(f"Invalid JSON in interaction response: {chat_i}")
@@ -91,8 +91,6 @@ def maybe_run_action(
91
91
  code_interpreter: Optional[CodeInterpreter] = None,
92
92
  ) -> Optional[List[AgentMessage]]:
93
93
  extracted_chat, final_code = extract_conversation(chat)
94
- # only keep last 5 messages to keep context recent and not overwhelm LLM
95
- extracted_chat = extracted_chat[-5:]
96
94
  if action == "generate_or_edit_vision_code":
97
95
  # there's an issue here because coder.generate_code will send it's code_context
98
96
  # to the outside user via it's update_callback, but we don't necessarily have
@@ -125,6 +123,7 @@ def maybe_run_action(
125
123
  ],
126
124
  code="",
127
125
  )
126
+
128
127
  context = coder.generate_code_from_plan(
129
128
  extracted_chat, plan_context, code_interpreter=code_interpreter
130
129
  )
File without changes
File without changes