PyPI - agentscope-runtime - Versions diffs - 0.1.1__py3-none-any.whl → 0.1.2__py3-none-any.whl - Mend

agentscope-runtime 0.1.1py3-none-any.whl → 0.1.2py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (21) hide show

agentscope_runtime/sandbox/box/training_box/environments/bfcl/bfcl_env.py ADDED Viewed

@@ -0,0 +1,380 @@
+# -*- coding: utf-8 -*-
+"""
+This file is part of https://github.com/ShishirPatil/gorilla
+Licensed under the Apache License, Version 2.0 (the "License");
+you may not use this file except in compliance with the License.
+You may obtain a copy of the License at
+    http://www.apache.org/licenses/LICENSE-2.0
+Unless required by applicable law or agreed to in writing, software
+distributed under the License is distributed on an "AS IS" BASIS,
+WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+See the License for the specific language governing permissions and
+limitations under the License.
+"""
+# environments/bfcl_env.py
+from __future__ import annotations
+import json
+import os
+from pathlib import Path
+from typing import Any, Dict
+import re
+from training_box.base import BaseEnv
+from training_box.registry import Registry
+from training_box.src.trajectory import StateMessage
+from training_box.environments.bfcl.env_handler import EnvHandler
+os.environ.setdefault(
+    "BFCL_DATA_PATH",
+    "./bfcl/multiturn_dataset/multiturn_data.jsonl",
+)
+os.environ.setdefault("BFCL_ANSWER_PATH", "./bfcl/data/possible_answer")
+__all__ = ["BfclEnv"]
+def parse_assistant_content_to_tool_calls(
+    msg: Dict[str, Any],
+) -> Dict[str, Any]:
+    content = msg.get("content", "") or ""
+    if not isinstance(content, str):
+        content = str(content)
+    tool_calls = []
+    call_id_counter = 1
+    pattern = r"<tool_call>\s*\n?({.*?})\s*\n?\</tool_call>"
+    matches = list(re.finditer(pattern, content, re.DOTALL))
+    if not matches:
+        return {
+            "role": "assistant",
+            "content": content.strip(),
+            "tool_calls": [],
+        }
+    for match in matches:
+        json_str = match.group(1).strip()
+        try:
+            data = json.loads(json_str)
+            if not isinstance(data, dict):
+                continue
+            if "name" not in data or "arguments" not in data:
+                continue
+            func_name = data["name"]
+            tool_call = {
+                "id": f"{func_name}_{call_id_counter}",
+                "type": "function",
+                "function": {
+                    "name": data["name"],
+                    "arguments": data["arguments"],
+                },
+            }
+            tool_calls.append(tool_call)
+            call_id_counter += 1
+        except json.JSONDecodeError as e:
+            print(f"JSON 解析失败: {json_str[:50]}... -> {e}")
+            continue
+    cleaned_content = re.sub(pattern, "", content, flags=re.DOTALL).strip()
+    cleaned_content = re.sub(r"\n\s*\n", "\n\n", cleaned_content).strip()
+    result = {
+        "role": "assistant",
+        "content": cleaned_content,
+        "tool_calls": tool_calls,
+    }
+    return result
+def tools_schema_to_qwen_prompt(tools_schema):
+    if not tools_schema:
+        return ""
+    lines = []
+    lines.append("\n\n# Tools\n")
+    lines.append(
+        "You may call one or more functions to assist with the user query.\n",
+    )
+    lines.append(
+        "You are provided with function signatures within <tools></tools> \
+            XML tags:",
+    )
+    lines.append("<tools>")
+    for tool in tools_schema:
+        tool_json = json.dumps(
+            tool,
+            ensure_ascii=False,
+            separators=(",", ":"),
+        )
+        lines.append(tool_json)
+    lines.append("</tools>\n")
+    lines.append(
+        "Important: Always use only the latest tool list provided, \
+        ignoring any functions mentioned in previous messages.",
+    )
+    lines.append(
+        "For each function call, return a json object with function name \
+            and arguments within <tool_call> and <tool_call> XML tags:",
+    )
+    lines.append("<tool_call>")
+    lines.append('{"name": <function-name>, "arguments": <args-json-object>}')
+    lines.append("</tool_call>")
+    return "\n".join(lines)
+def tool_message_to_qwen_text(tool_messages):
+    if isinstance(tool_messages, dict):
+        tool_messages = [tool_messages]
+    if not tool_messages:
+        return ""
+    tool_entries = []
+    for msg in tool_messages:
+        if msg.get("role") != "tool":
+            raise ValueError("All messages must have role 'tool'")
+        content = msg.get("content", "")
+        tool_call_id = msg.get("tool_call_id", "")
+        name = msg.get("name", tool_call_id)
+        if not name:
+            raise ValueError("Missing 'name' in tool message.")
+        try:
+            if isinstance(content, str):
+                parsed_content = (
+                    json.loads(content)
+                    if content.strip().startswith(("{", "["))
+                    else content
+                )
+            else:
+                parsed_content = content
+        except Exception:
+            parsed_content = content
+        entry = {
+            "name": name,
+            "content": parsed_content,
+        }
+        tool_entries.append(
+            f"<tool_call>\n{json.dumps(entry, ensure_ascii=False)}"
+            f"\n</tool_call>",
+        )
+    inner_text = "\n".join(tool_entries) + "\n"
+    return inner_text
+@Registry.register("bfcl")
+class BfclEnv(BaseEnv):
+    def __init__(
+        self,
+        task_id: str | None = None,
+        instance_id: str | None = None,
+        params: Dict[str, Any] | None = None,
+    ):
+        self.task_id, self.instance_id = task_id, instance_id
+        self.params: Dict[str, Any] = params or {}
+        self.data_path = self.params.get(
+            "data_path",
+            os.getenv("BFCL_DATA_PATH"),
+        )
+        self.answer_path = self.params.get(
+            "answer_path",
+            os.getenv("BFCL_ANSWER_PATH"),
+        )
+        self.model_name = self.params.get("model_name", "env_handler")
+        self.test_entry: Dict[str, Any] | None = None
+        self.original_test_entry: Dict[str, Any] | None = None
+        self.env_handler: EnvHandler | None = None
+        self.conversation_history: list[Dict[str, Any]] = []
+        self.current_turn = 0
+        self.total_input_tokens = 0
+        self.total_output_tokens = 0
+        self.tools_info = ""
+    def get_init_state(
+        self,
+        _params: Dict[str, Any] | None = None,
+    ) -> Dict[str, Any]:
+        self.test_entry = self._load_test_case(self.data_path, self.task_id)
+        self.original_test_entry = self.test_entry
+        self.env_handler = EnvHandler(
+            model_name=self.model_name,
+            answer_path=Path(self.answer_path),
+        )
+        self.conversation_history = self.test_entry.get("question", [[]])[
+            0
+        ].copy()
+        self.current_turn = 0
+        tools = self.test_entry.get("function", [])
+        self.tools_info = "Available tools:\n" + "\n".join(
+            f"- {t.get('function', {}).get('name', 'unknown')}" for t in tools
+        )
+        first_query = (
+            self.conversation_history[0]["content"]
+            if self.conversation_history
+            else ""
+        )
+        tool_prompt = tools_schema_to_qwen_prompt(tools)
+        return {
+            "state": [
+                {"role": "system", "content": tool_prompt},
+                {"role": "user", "content": first_query},
+            ],
+            "info": {
+                "instance_id": self.instance_id,
+                "task_id": self.task_id,
+                "test_id": self.test_entry.get("id", "unknown"),
+                "tools_count": len(tools),
+                "questions_count": len(
+                    self.original_test_entry.get("question", []),
+                ),
+            },
+        }
+    def step(
+        self,
+        action: Dict[str, Any],
+        params: Dict[str, Any] | None = None,
+    ) -> Dict[str, Any]:
+        state_msg = self.transition(
+            action,
+            params or {},
+        )
+        terminated = self._is_terminated(
+            state_msg.simple_dict["content"],
+        )
+        reward = self.evaluate(params={"sparse": True}) if terminated else 0.0
+        return {
+            "state": [state_msg.simple_dict],
+            "reward": reward,
+            "is_terminated": terminated,
+            "info": {},
+        }
+    def transition(
+        self,
+        assistant_entry: Dict[str, Any],
+        _params: Dict[str, Any],
+    ) -> StateMessage:
+        assistant_entry = parse_assistant_content_to_tool_calls(
+            assistant_entry,
+        )
+        self.conversation_history.append(
+            assistant_entry,
+        )
+        if self.env_handler is None or self.original_test_entry is None:
+            raise RuntimeError(
+                "EnvHandler not initialised – call get_init_state() first.",
+            )
+        env_resp = self.env_handler.interact(
+            self.conversation_history,
+            self.original_test_entry,
+        )
+        next_msg_content = ""
+        for _idx, msg in enumerate(env_resp.get("messages", [])):
+            self.conversation_history.append(msg)
+            if msg["role"] == "tool":
+                next_msg_content += tool_message_to_qwen_text(msg)
+            elif msg["role"] == "user":
+                next_msg_content = msg.get("content", "")
+                self.current_turn += 1
+            elif msg["role"] == "env":
+                next_msg_content = msg.get("content", "")
+        return StateMessage(role="user", content=next_msg_content)
+    def evaluate(
+        self,
+        _messages: Dict[str, Any] | None = None,
+        params: Dict[str, Any] | None = None,
+    ):
+        if self.env_handler is None:
+            raise RuntimeError("EnvHandler not initialised – cannot evaluate.")
+        conv_result = {
+            "test_id": self.test_entry.get("id", "unknown"),
+            "messages": self.conversation_history,
+            "turn_count": self.current_turn,
+            "total_input_tokens": self.total_input_tokens,
+            "total_output_tokens": self.total_output_tokens,
+            "completed": self._is_terminated(
+                self.conversation_history[-1]["content"],
+            ),
+            "original_test_entry": self.original_test_entry,
+        }
+        sparse = (params or {}).get("sparse", False)
+        result = self.env_handler.evaluate(conv_result)
+        return result.get("accuracy", 0.0) if sparse else result
+    def get_info(
+        self,
+        _messages: Dict[str, Any] | None = None,
+        _params: Dict[str, Any] | None = None,
+    ) -> str:
+        return self.tools_info
+    def close(self):
+        self.conversation_history.clear()
+    def _is_terminated(self, env_content) -> bool:
+        return env_content == "[CONVERSATION_COMPLETED]"
+    @staticmethod
+    def _load_test_case(data_path: str, test_id: str | None) -> Dict[str, Any]:
+        if not Path(data_path).exists():
+            raise FileNotFoundError(f"BFCL data file '{data_path}' not found")
+        if test_id is None:
+            raise ValueError("task_id is required")
+        with open(data_path, "r", encoding="utf-8") as f:
+            if str(test_id).isdigit():
+                idx = int(test_id)
+                for line_no, line in enumerate(f):
+                    if line_no == idx:
+                        return json.loads(line)
+                raise ValueError(
+                    f"Test case index {idx} not found in {data_path}",
+                )
+            for line in f:
+                data = json.loads(line)
+                if data.get("id") == test_id:
+                    return data
+            raise ValueError(
+                f"Test case id '{test_id}' not found in {data_path}",
+            )
+    @staticmethod
+    def get_query_list(
+        split: str = "train",
+    ):
+        path = os.getenv("BFCL_SPLID_ID_PATH")
+        if path is None:
+            raise ValueError("path must be provided")
+        with open(path, "r", encoding="utf-8") as f:
+            return json.load(f)[split]

agentscope-runtime 0.1.1__py3-none-any.whl → 0.1.2__py3-none-any.whl

agentscope-runtime 0.1.1py3-none-any.whl → 0.1.2py3-none-any.whl