vision-agent 0.2.138__py3-none-any.whl → 0.2.140__py3-none-any.whl
This diff shows the changes between two publicly available versions of a package, each of which has been released to one of the supported registries. It is provided for informational purposes only and reflects the package contents as they appear in the respective public registry.
- vision_agent/agent/vision_agent.py +27 -0
- vision_agent/tools/meta_tools.py +1 -0
- vision_agent/tools/tool_utils.py +12 -6
- {vision_agent-0.2.138.dist-info → vision_agent-0.2.140.dist-info}/METADATA +1 -1
- {vision_agent-0.2.138.dist-info → vision_agent-0.2.140.dist-info}/RECORD +7 -7
- {vision_agent-0.2.138.dist-info → vision_agent-0.2.140.dist-info}/LICENSE +0 -0
- {vision_agent-0.2.138.dist-info → vision_agent-0.2.140.dist-info}/WHEEL +0 -0
| @@ -218,6 +218,7 @@ class VisionAgent(Agent): | |
| 218 218 | 
             
                    ) as code_interpreter:
         | 
| 219 219 | 
             
                        orig_chat = copy.deepcopy(chat)
         | 
| 220 220 | 
             
                        int_chat = copy.deepcopy(chat)
         | 
| 221 | 
            +
                        last_user_message_content = chat[-1].get("content")
         | 
| 221 222 | 
             
                        media_list = []
         | 
| 222 223 | 
             
                        for chat_i in int_chat:
         | 
| 223 224 | 
             
                            if "media" in chat_i:
         | 
| @@ -266,6 +267,32 @@ class VisionAgent(Agent): | |
| 266 267 | 
             
                        orig_chat.append({"role": "observation", "content": artifacts_loaded})
         | 
| 267 268 | 
             
                        self.streaming_message({"role": "observation", "content": artifacts_loaded})
         | 
| 268 269 |  | 
| 270 | 
            +
                        if isinstance(last_user_message_content, str):
         | 
| 271 | 
            +
                            user_code_action = parse_execution(last_user_message_content, False)
         | 
| 272 | 
            +
                            if user_code_action is not None:
         | 
| 273 | 
            +
                                user_result, user_obs = run_code_action(
         | 
| 274 | 
            +
                                    user_code_action, code_interpreter, str(remote_artifacts_path)
         | 
| 275 | 
            +
                                )
         | 
| 276 | 
            +
                                if self.verbosity >= 1:
         | 
| 277 | 
            +
                                    _LOGGER.info(user_obs)
         | 
| 278 | 
            +
                                int_chat.append({"role": "observation", "content": user_obs})
         | 
| 279 | 
            +
                                orig_chat.append(
         | 
| 280 | 
            +
                                    {
         | 
| 281 | 
            +
                                        "role": "observation",
         | 
| 282 | 
            +
                                        "content": user_obs,
         | 
| 283 | 
            +
                                        "execution": user_result,
         | 
| 284 | 
            +
                                    }
         | 
| 285 | 
            +
                                )
         | 
| 286 | 
            +
                                self.streaming_message(
         | 
| 287 | 
            +
                                    {
         | 
| 288 | 
            +
                                        "role": "observation",
         | 
| 289 | 
            +
                                        "content": user_obs,
         | 
| 290 | 
            +
                                        "execution": user_result,
         | 
| 291 | 
            +
                                        "finished": True,
         | 
| 292 | 
            +
                                    }
         | 
| 293 | 
            +
                                )
         | 
| 294 | 
            +
                                finished = True
         | 
| 295 | 
            +
             | 
| 269 296 | 
             
                        while not finished and iterations < self.max_iterations:
         | 
| 270 297 | 
             
                            response = run_conversation(self.agent, int_chat)
         | 
| 271 298 | 
             
                            if self.verbosity >= 1:
         | 
    
        vision_agent/tools/meta_tools.py
    CHANGED
    
    
    
        vision_agent/tools/tool_utils.py
    CHANGED
    
    | @@ -208,19 +208,25 @@ def _call_post( | |
| 208 208 | 
             
                if files:
         | 
| 209 209 | 
             
                    files_in_b64 = [(file[0], b64encode(file[1]).decode("utf-8")) for file in files]
         | 
| 210 210 | 
             
                try:
         | 
| 211 | 
            +
                    if files is not None:
         | 
| 212 | 
            +
                        response = session.post(url, data=payload, files=files)
         | 
| 213 | 
            +
                    else:
         | 
| 214 | 
            +
                        response = session.post(url, json=payload)
         | 
| 215 | 
            +
             | 
| 216 | 
            +
                    # make sure function_name is in the payload so we can display it
         | 
| 217 | 
            +
                    tool_call_trace_payload = (
         | 
| 218 | 
            +
                        payload
         | 
| 219 | 
            +
                        if "function_name" in payload
         | 
| 220 | 
            +
                        else {**payload, **{"function_name": function_name}}
         | 
| 221 | 
            +
                    )
         | 
| 211 222 | 
             
                    tool_call_trace = ToolCallTrace(
         | 
| 212 223 | 
             
                        endpoint_url=url,
         | 
| 213 | 
            -
                        request=payload,
         | 
| 224 | 
            +
                        request=tool_call_trace_payload,
         | 
| 214 225 | 
             
                        response={},
         | 
| 215 226 | 
             
                        error=None,
         | 
| 216 227 | 
             
                        files=files_in_b64,
         | 
| 217 228 | 
             
                    )
         | 
| 218 229 |  | 
| 219 | 
            -
                    if files is not None:
         | 
| 220 | 
            -
                        response = session.post(url, data=payload, files=files)
         | 
| 221 | 
            -
                    else:
         | 
| 222 | 
            -
                        response = session.post(url, json=payload)
         | 
| 223 | 
            -
             | 
| 224 230 | 
             
                    if response.status_code != 200:
         | 
| 225 231 | 
             
                        tool_call_trace.error = Error(
         | 
| 226 232 | 
             
                            name="RemoteToolCallFailed",
         | 
| @@ -2,7 +2,7 @@ vision_agent/__init__.py,sha256=EAb4-f9iyuEYkBrX4ag1syM8Syx8118_t0R6_C34M9w,57 | |
| 2 2 | 
             
            vision_agent/agent/__init__.py,sha256=TddDT4e3JVc68Dt0zSk0B4OBORx_R2WhAGK71uqEe2w,204
         | 
| 3 3 | 
             
            vision_agent/agent/agent.py,sha256=2cjIOxEuSJrqbfPXYoV0qER5ihXsPFCoEFJa4jpqan0,597
         | 
| 4 4 | 
             
            vision_agent/agent/agent_utils.py,sha256=qOYQn-wJsa4j4YjFOBQ41xyklCg8Y94CIIGw9ZXmgIU,2053
         | 
| 5 | 
            -
            vision_agent/agent/vision_agent.py,sha256= | 
| 5 | 
            +
            vision_agent/agent/vision_agent.py,sha256=Ed10_rWzHu-hejb5jF9lAF7xbmQ_qAGpCxDvByZw6M8,14100
         | 
| 6 6 | 
             
            vision_agent/agent/vision_agent_coder.py,sha256=OI95goKTqVaEEPYwkn6bVsHsHZeifoBC8rjG9nD0Znc,36909
         | 
| 7 7 | 
             
            vision_agent/agent/vision_agent_coder_prompts.py,sha256=a7P19QscKNiaweke0zHPCfi5GQImpG-ZGKv_kXz0seg,13452
         | 
| 8 8 | 
             
            vision_agent/agent/vision_agent_prompts.py,sha256=-fXiIIb48duXVljWYcJ0Y4ZzfNnRFi3C5cKdF4SdDo8,10075
         | 
| @@ -15,9 +15,9 @@ vision_agent/lmm/__init__.py,sha256=YuUZRsMHdn8cMOv6iBU8yUqlIOLrbZQqZl9KPnofsHQ, | |
| 15 15 | 
             
            vision_agent/lmm/lmm.py,sha256=soWmEjtleQUSH2G3tYZWxOmteIqkgMVcmuZfx4mxszU,16838
         | 
| 16 16 | 
             
            vision_agent/lmm/types.py,sha256=ZEXR_ptBL0ZwDMTDYkgxUCmSZFmBYPQd2jreNzr_8UY,221
         | 
| 17 17 | 
             
            vision_agent/tools/__init__.py,sha256=nufZNzbcLTuXwxFmvZNj99qE8EO2qtEPT8wFsuI9vyE,2397
         | 
| 18 | 
            -
            vision_agent/tools/meta_tools.py,sha256= | 
| 18 | 
            +
            vision_agent/tools/meta_tools.py,sha256=orYbEPWOENXwmKSmbg52_2eMAoYT9ZbV5GjudUd-f0o,22563
         | 
| 19 19 | 
             
            vision_agent/tools/prompts.py,sha256=V1z4YJLXZuUl_iZ5rY0M5hHc_2tmMEUKr0WocXKGt4E,1430
         | 
| 20 | 
            -
            vision_agent/tools/tool_utils.py,sha256= | 
| 20 | 
            +
            vision_agent/tools/tool_utils.py,sha256=5ukuDMxbEH4iKetYR9I7twzsA8ECyP4tVwYXQq54mxI,8020
         | 
| 21 21 | 
             
            vision_agent/tools/tools.py,sha256=WKeB99ED0o_ISS_vZc-ch_1Dc8_Fl2fhnGlfVNwNouc,70024
         | 
| 22 22 | 
             
            vision_agent/tools/tools_types.py,sha256=rLpCUODPY0yI65SLOTJOxfHFfqWM3WjOq-AYX25Chjk,2356
         | 
| 23 23 | 
             
            vision_agent/utils/__init__.py,sha256=7fMgbZiEwbNS0fBOS_hJI5PuEYBblw36zLi_UjUzvj4,244
         | 
| @@ -27,7 +27,7 @@ vision_agent/utils/image_utils.py,sha256=zTTOJFOieMzwIquTFnW7T6ssx9o6XfoZ0Unqyk7 | |
| 27 27 | 
             
            vision_agent/utils/sim.py,sha256=ebE9Cs00pVEDI1HMjAzUBk88tQQmc2U-yAzIDinnekU,5572
         | 
| 28 28 | 
             
            vision_agent/utils/type_defs.py,sha256=BE12s3JNQy36QvauXHjwyeffVh5enfcvd4vTzSwvEZI,1384
         | 
| 29 29 | 
             
            vision_agent/utils/video.py,sha256=hOjfEOZNcddYdoa0CoviXA4Vo9kwURKuojIJgLLJdp0,4745
         | 
| 30 | 
            -
            vision_agent-0.2. | 
| 31 | 
            -
            vision_agent-0.2. | 
| 32 | 
            -
            vision_agent-0.2. | 
| 33 | 
            -
            vision_agent-0.2. | 
| 30 | 
            +
            vision_agent-0.2.140.dist-info/LICENSE,sha256=xx0jnfkXJvxRnG63LTGOxlggYnIysveWIZ6H3PNdCrQ,11357
         | 
| 31 | 
            +
            vision_agent-0.2.140.dist-info/METADATA,sha256=B33v0XI-5ZlEBBu-I8DT7JrbU04PophTYEmRQMVEkBQ,12291
         | 
| 32 | 
            +
            vision_agent-0.2.140.dist-info/WHEEL,sha256=7Z8_27uaHI_UZAc4Uox4PpBhQ9Y5_modZXWMxtUi4NU,88
         | 
| 33 | 
            +
            vision_agent-0.2.140.dist-info/RECORD,,
         | 
| 
            File without changes
         | 
| 
            File without changes
         |