abstractagent 0.2.0__py3-none-any.whl → 0.3.1__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- abstractagent/adapters/__init__.py +2 -1
- abstractagent/adapters/codeact_runtime.py +907 -60
- abstractagent/adapters/generation_params.py +82 -0
- abstractagent/adapters/media.py +45 -0
- abstractagent/adapters/memact_runtime.py +959 -0
- abstractagent/adapters/react_runtime.py +1357 -135
- abstractagent/agents/__init__.py +4 -0
- abstractagent/agents/base.py +89 -1
- abstractagent/agents/codeact.py +125 -18
- abstractagent/agents/memact.py +280 -0
- abstractagent/agents/react.py +129 -18
- abstractagent/logic/__init__.py +2 -0
- abstractagent/logic/builtins.py +270 -5
- abstractagent/logic/codeact.py +91 -81
- abstractagent/logic/memact.py +128 -0
- abstractagent/logic/react.py +91 -50
- abstractagent/repl.py +24 -447
- abstractagent/scripts/__init__.py +5 -0
- abstractagent/scripts/lmstudio_tool_eval.py +426 -0
- abstractagent/tools/__init__.py +9 -0
- abstractagent-0.3.1.dist-info/METADATA +112 -0
- abstractagent-0.3.1.dist-info/RECORD +33 -0
- {abstractagent-0.2.0.dist-info → abstractagent-0.3.1.dist-info}/WHEEL +1 -1
- abstractagent/ui/__init__.py +0 -5
- abstractagent/ui/question.py +0 -197
- abstractagent-0.2.0.dist-info/METADATA +0 -134
- abstractagent-0.2.0.dist-info/RECORD +0 -28
- {abstractagent-0.2.0.dist-info → abstractagent-0.3.1.dist-info}/entry_points.txt +0 -0
- {abstractagent-0.2.0.dist-info → abstractagent-0.3.1.dist-info}/licenses/LICENSE +0 -0
- {abstractagent-0.2.0.dist-info → abstractagent-0.3.1.dist-info}/top_level.txt +0 -0
abstractagent/adapters/react_runtime.py

```diff
@@ -1,15 +1,31 @@
-"""AbstractRuntime adapter for ReAct
+"""AbstractRuntime adapter for canonical ReAct agents.
+
+This adapter implements a deterministic ReAct loop:
+
+    init → reason → parse → (act → observe → reason)* → done
+
+Policy (for now):
+- Do NOT truncate ReAct loop context (history/scratchpad).
+- Do NOT cap tool-steps to tiny token budgets.
+- Do NOT require "FINAL:" markers or other termination hacks.
+
+The loop continues whenever the model emits tool calls.
+It ends only when the model emits **no tool calls** and provides an answer.
+"""
 
 from __future__ import annotations
 
 import hashlib
 import json
+import re
 from typing import Any, Callable, Dict, List, Optional
 
 from abstractcore.tools import ToolCall
 from abstractruntime import Effect, EffectType, RunState, StepPlan, WorkflowSpec
 from abstractruntime.core.vars import ensure_limits, ensure_namespaces
 
+from .generation_params import runtime_llm_params
+from .media import extract_media_from_context
 from ..logic.react import ReActLogic
 
 
```
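The new docstring pins down the termination contract: keep looping while the model emits tool calls; stop at the first tool-free reply. Below is a minimal stand-alone sketch of that contract in plain Python — `call_model` and `run_tools` are hypothetical stand-ins for the runtime's LLM_CALL and TOOL_CALLS effects, not part of this package:

```python
from typing import Any, Callable

def react_loop(
    call_model: Callable[[list], dict],   # hypothetical: messages -> model reply
    run_tools: Callable[[list], list],    # hypothetical: tool calls -> observations
    task: str,
    max_iterations: int = 25,
) -> str:
    """init -> reason -> parse -> (act -> observe -> reason)* -> done."""
    messages: list[dict[str, Any]] = [{"role": "user", "content": task}]  # init
    for _ in range(max_iterations):
        reply = call_model(messages)                 # reason
        tool_calls = reply.get("tool_calls") or []   # parse
        if not tool_calls:
            return str(reply.get("content") or "")   # done: no tool calls + answer
        messages.append({"role": "assistant", "content": "", "tool_calls": tool_calls})
        for obs in run_tools(tool_calls):            # act -> observe
            messages.append({"role": "tool", "content": str(obs)})
    return "max_iterations reached"
```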
```diff
@@ -29,20 +45,60 @@ def _new_message(
 
     timestamp = datetime.now(timezone.utc).isoformat()
 
+    import uuid
+
+    meta = dict(metadata or {})
+    meta.setdefault("message_id", f"msg_{uuid.uuid4().hex}")
+
     return {
         "role": role,
         "content": content,
         "timestamp": timestamp,
-        "metadata":
+        "metadata": meta,
     }
 
 
-def
-
+def _new_assistant_message_with_tool_calls(
+    ctx: Any,
+    *,
+    content: str,
+    tool_calls: List[ToolCall],
+    metadata: Optional[Dict[str, Any]] = None,
+) -> Dict[str, Any]:
+    """Create an assistant message that preserves tool call metadata for OpenAI transcripts."""
+
+    msg = _new_message(ctx, role="assistant", content=content, metadata=metadata)
+
+    tc_payload: list[dict[str, Any]] = []
+    for i, tc in enumerate(tool_calls):
+        if not isinstance(tc, ToolCall):
+            continue
+        name = str(tc.name or "").strip()
+        if not name:
+            continue
+        call_id = tc.call_id
+        call_id_str = str(call_id).strip() if call_id is not None else ""
+        if not call_id_str:
+            call_id_str = f"call_{i+1}"
+        args = tc.arguments if isinstance(tc.arguments, dict) else {}
+        tc_payload.append(
+            {
+                "type": "function",
+                "id": call_id_str,
+                "function": {"name": name, "arguments": json.dumps(args, ensure_ascii=False)},
+            }
+        )
+
+    if tc_payload:
+        msg["tool_calls"] = tc_payload
+    return msg
+
+
+def ensure_react_vars(
+    run: RunState,
+) -> tuple[Dict[str, Any], Dict[str, Any], Dict[str, Any], Dict[str, Any], Dict[str, Any]]:
+    """Ensure namespaced vars exist and migrate legacy flat keys in-place."""
 
-    Returns:
-        Tuple of (context, scratchpad, runtime_ns, temp, limits) dicts.
-    """
     ensure_namespaces(run.vars)
     limits = ensure_limits(run.vars)
     context = run.vars["context"]
```
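`_new_assistant_message_with_tool_calls` keeps the transcript valid for OpenAI-style tool calling: the assistant turn that requested tools carries a `tool_calls` array whose `arguments` are JSON-encoded strings, and missing ids fall back to `call_{i+1}`. A stand-alone sketch of the message shape it produces — built here by hand rather than through the adapter, with all concrete values illustrative:

```python
import json
import uuid
from datetime import datetime, timezone

# Hand-built equivalent of _new_message() + _new_assistant_message_with_tool_calls().
msg = {
    "role": "assistant",
    "content": "",  # the "thought" lives in the scratchpad, not the transcript
    "timestamp": datetime.now(timezone.utc).isoformat(),
    "metadata": {"message_id": f"msg_{uuid.uuid4().hex}", "kind": "tool_calls"},
    "tool_calls": [
        {
            "type": "function",
            "id": "call_1",  # fallback id when the model omits one
            "function": {
                "name": "web_search",
                "arguments": json.dumps({"query": "ReAct"}, ensure_ascii=False),
            },
        }
    ],
}
print(json.dumps(msg, indent=2))
```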
```diff
@@ -70,6 +126,9 @@ def ensure_react_vars(run: RunState) -> tuple[Dict[str, Any], Dict[str, Any], Di
     if not isinstance(runtime_ns.get("inbox"), list):
         runtime_ns["inbox"] = []
 
+    if not isinstance(scratchpad.get("cycles"), list):
+        scratchpad["cycles"] = []
+
     iteration = scratchpad.get("iteration")
     if not isinstance(iteration, int):
         try:
```
```diff
@@ -85,10 +144,13 @@ def ensure_react_vars(run: RunState) -> tuple[Dict[str, Any], Dict[str, Any], Di
             scratchpad["max_iterations"] = int(max_iterations)
         except (TypeError, ValueError):
             scratchpad["max_iterations"] = 25
-
     if scratchpad["max_iterations"] < 1:
         scratchpad["max_iterations"] = 1
 
+    used_tools = scratchpad.get("used_tools")
+    if not isinstance(used_tools, bool):
+        scratchpad["used_tools"] = bool(used_tools) if used_tools is not None else False
+
     return context, scratchpad, runtime_ns, temp, limits
 
 
```
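`ensure_react_vars` now also normalizes `cycles` and `used_tools` on the scratchpad. A sketch of the namespaced `run.vars` layout behind the returned five-tuple; the `context`, `_runtime`, `_temp`, and `_limits` names appear in this diff, while the `scratchpad` key name and all concrete values are assumptions:

```python
# Illustrative layout only; the real namespaces are created by
# ensure_namespaces()/ensure_limits() from abstractruntime.core.vars.
run_vars = {
    "context": {"task": "Summarize README.md", "messages": []},
    "scratchpad": {"iteration": 0, "max_iterations": 25, "used_tools": False, "cycles": []},  # key name assumed
    "_runtime": {"inbox": [], "tool_specs": [], "allowed_tools": [], "toolset_id": ""},
    "_temp": {},
    "_limits": {"max_iterations": 25, "current_iteration": 0, "max_output_tokens": None},
}
scratchpad = run_vars["scratchpad"]
assert isinstance(scratchpad["cycles"], list)
assert scratchpad["max_iterations"] >= 1 and isinstance(scratchpad["used_tools"], bool)
```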
```diff
@@ -99,10 +161,470 @@ def _compute_toolset_id(tool_specs: List[Dict[str, Any]]) -> str:
     return f"ts_{digest}"
 
 
+def _tool_call_signature(name: str, args: Any) -> str:
+    def _abbrev(v: Any, *, max_chars: int = 140) -> str:
+        if v is None:
+            return ""
+        s = str(v)
+        if len(s) <= max_chars:
+            return s
+        return f"{s[: max(0, max_chars - 1)]}…"
+
+    def _hash_str(s: str) -> str:
+        try:
+            return hashlib.sha256(s.encode("utf-8")).hexdigest()[:12]
+        except Exception:
+            return "sha256_err"
+
+    n = str(name or "").strip() or "tool"
+    if not isinstance(args, dict) or not args:
+        return f"{n}()"
+
+    # Special-case common large-argument tools so the system prompt doesn't explode.
+    if n == "write_file":
+        fp = args.get("file_path") if isinstance(args.get("file_path"), str) else args.get("path")
+        mode = args.get("mode") if isinstance(args.get("mode"), str) else "w"
+        content = args.get("content")
+        if isinstance(content, str):
+            tag = f"<str len={len(content)} sha256={_hash_str(content)}>"
+        else:
+            tag = "<str len=0>"
+        return f"write_file(file_path={_abbrev(fp)!r}, mode={_abbrev(mode)!r}, content={tag})"
+
+    if n == "edit_file":
+        fp = args.get("file_path") if isinstance(args.get("file_path"), str) else args.get("path")
+        edits = args.get("edits")
+        n_edits = len(edits) if isinstance(edits, list) else 0
+        return f"edit_file(file_path={_abbrev(fp)!r}, edits={n_edits})"
+
+    if n == "fetch_url":
+        url = args.get("url")
+        include_full = args.get("include_full_content")
+        return f"fetch_url(url={_abbrev(url)!r}, include_full_content={include_full})"
+
+    if n == "web_search":
+        q = args.get("query")
+        num = args.get("num_results")
+        return f"web_search(query={_abbrev(q)!r}, num_results={num})"
+
+    if n == "execute_command":
+        cmd = args.get("command")
+        return f"execute_command(command={_abbrev(cmd, max_chars=220)!r})"
+
+    # Generic, but bounded: hash long strings to avoid leaking large blobs into the prompt.
+    summarized: Dict[str, Any] = {}
+    for k, v in args.items():
+        if isinstance(v, str) and len(v) > 160:
+            summarized[str(k)] = f"<str len={len(v)} sha256={_hash_str(v)}>"
+        else:
+            summarized[str(k)] = v
+    try:
+        arg_str = json.dumps(summarized, ensure_ascii=False, sort_keys=True)
+    except Exception:
+        arg_str = str(summarized)
+    arg_str = _abbrev(arg_str, max_chars=260)
+    return f"{n}({arg_str})"
+
+
+def _tool_call_fingerprint(name: str, args: Any) -> str:
+    """Return a stable, bounded fingerprint for tool-call repeat detection.
+
+    Important: do not embed large string blobs (file contents / web pages) in the fingerprint.
+    """
+
+    def _hash_str(s: str) -> str:
+        try:
+            return hashlib.sha256(s.encode("utf-8")).hexdigest()
+        except Exception:
+            return "sha256_err"
+
+    def _canon(v: Any) -> Any:
+        if v is None or isinstance(v, (bool, int, float)):
+            return v
+        if isinstance(v, str):
+            if len(v) <= 200:
+                return v
+            return {"_type": "str", "len": len(v), "sha256": _hash_str(v)[:16]}
+        if isinstance(v, list):
+            return [_canon(x) for x in v[:25]]
+        if isinstance(v, dict):
+            out: Dict[str, Any] = {}
+            for k in sorted(v.keys(), key=lambda x: str(x)):
+                out[str(k)] = _canon(v.get(k))
+            return out
+        return {"_type": type(v).__name__}
+
+    payload = {"name": str(name or "").strip(), "args": _canon(args if isinstance(args, dict) else {})}
+    try:
+        raw = json.dumps(payload, ensure_ascii=False, sort_keys=True, separators=(",", ":"))
+    except Exception:
+        raw = str(payload)
+    try:
+        return hashlib.sha256(raw.encode("utf-8")).hexdigest()[:16]
+    except Exception:
+        return "fingerprint_err"
+
+
+_FINALISH_RE = re.compile(
+    r"(?i)\b(final answer|here is|here['’]s|here are|below is|below are|done|completed|in summary|summary|result)\b"
+)
+
+_WAITING_RE = re.compile(
+    r"(?i)\b("
+    r"let me know|your next step|what would you like|tell me|"
+    r"i can help|i'm ready|i am ready|"
+    r"i'll wait|i will wait|waiting for|"
+    r"no tool calls?"
+    r")\b"
+)
+
+_DEFERRED_ACTION_INTENT_RE = re.compile(
+    # Only treat as "missing tool calls" when the model *commits to acting*
+    # (first-person intent) rather than providing a final answer.
+    r"(?i)\b(i will|i['’]?ll|let me|i am going to|i['’]?m going to|i need to)\b"
+)
+
+_DEFERRED_ACTION_VERB_RE = re.compile(
+    # Verbs that typically imply external actions (tools/files/web/edits).
+    r"(?i)\b(read|open|search|list|skim|inspect|explore|scan|run|execute|edit|fetch|download|creat(?:e|ing))\b"
+)
+
+_TOOL_CALL_MARKERS = ("<function_call>", "<tool_call>", "<|tool_call|>", "```tool_code")
+
+
+def _contains_tool_call_markup(text: str) -> bool:
+    s = str(text or "")
+    if not s.strip():
+        return False
+    low = s.lower()
+    return any(m in low for m in _TOOL_CALL_MARKERS)
+
+
+_TOOL_CALL_STRIP_RE = re.compile(
+    r"(?is)"
+    r"<function_call>\s*.*?\s*</function_call>|"
+    r"<tool_call>\s*.*?\s*</tool_call>|"
+    r"<\|tool_call\|>.*?<\|/tool_call\|>|"
+    r"```tool_code\s*.*?```"
+)
+
+
+def _strip_tool_call_markup(text: str) -> str:
+    raw = str(text or "")
+    if not raw.strip():
+        return ""
+    try:
+        return _TOOL_CALL_STRIP_RE.sub("", raw)
+    except Exception:
+        return raw
+
+
+def _looks_like_deferred_action(text: str) -> bool:
+    """Return True when the model claims it will take actions but emits no tool calls.
+
+    This is intentionally conservative: false positives waste iterations and can "force"
+    unnecessary tool calls. It should only trigger when the assistant message strongly
+    suggests it is about to act (not answer).
+    """
+    s = str(text or "").strip()
+    if not s:
+        return False
+    # If the model is explicitly waiting for user direction, that's a valid final response.
+    if _WAITING_RE.search(s):
+        return False
+    # Common “final answer” framing (incl. typographic apostrophes).
+    if _FINALISH_RE.search(s):
+        return False
+    # If the model already produced a structured answer (headings/sections), don't retry.
+    if re.search(r"(?m)^(#{1,6}\s+\S|\*\*\S)", s):
+        return False
+    # Must contain first-person intent *and* an action-ish verb.
+    if not _DEFERRED_ACTION_INTENT_RE.search(s):
+        return False
+    if not _DEFERRED_ACTION_VERB_RE.search(s):
+        return False
+    return True
+
+
+def _push_inbox(runtime_ns: Dict[str, Any], content: str) -> None:
+    if not isinstance(runtime_ns, dict):
+        return
+    inbox = runtime_ns.get("inbox")
+    if not isinstance(inbox, list):
+        inbox = []
+        runtime_ns["inbox"] = inbox
+    inbox.append({"role": "system", "content": str(content or "")})
+
+
+def _drain_inbox(runtime_ns: Dict[str, Any]) -> str:
+    inbox = runtime_ns.get("inbox")
+    if not isinstance(inbox, list) or not inbox:
+        return ""
+    parts: list[str] = []
+    for m in inbox:
+        if not isinstance(m, dict):
+            continue
+        c = m.get("content")
+        if isinstance(c, str) and c.strip():
+            parts.append(c.strip())
+    runtime_ns["inbox"] = []
+    return "\n".join(parts).strip()
+
+
+def _boolish(value: Any) -> bool:
+    """Best-effort coercion for runtime flags (bool/int/str)."""
+    if isinstance(value, bool):
+        return value
+    if isinstance(value, (int, float)) and not isinstance(value, bool):
+        return value != 0
+    if isinstance(value, str):
+        return value.strip().lower() in {"1", "true", "yes", "y", "on", "enabled"}
+    return False
+
+def _system_prompt_override(runtime_ns: Dict[str, Any]) -> Optional[str]:
+    raw = runtime_ns.get("system_prompt") if isinstance(runtime_ns, dict) else None
+    if isinstance(raw, str) and raw.strip():
+        return raw.strip()
+    return None
+
+
+def _system_prompt_extra(runtime_ns: Dict[str, Any]) -> Optional[str]:
+    raw = runtime_ns.get("system_prompt_extra") if isinstance(runtime_ns, dict) else None
+    if isinstance(raw, str) and raw.strip():
+        return raw.strip()
+    return None
+
+
+def _compose_system_prompt(runtime_ns: Dict[str, Any], *, base: str) -> str:
+    override = _system_prompt_override(runtime_ns)
+    extra = _system_prompt_extra(runtime_ns)
+    sys = override if override is not None else base
+    if extra:
+        sys = f"{sys.rstrip()}\n\nAdditional system instructions:\n{extra}"
+    return sys.strip()
+
+
+def _max_output_tokens(runtime_ns: Dict[str, Any], limits: Dict[str, Any]) -> Optional[int]:
+    # Canonical limit: _limits.max_output_tokens (None = unset).
+    raw = None
+    if isinstance(limits, dict) and "max_output_tokens" in limits:
+        raw = limits.get("max_output_tokens")
+    if raw is None and isinstance(runtime_ns, dict):
+        raw = runtime_ns.get("max_output_tokens")
+    if raw is None:
+        return None
+    try:
+        val = int(raw)
+    except Exception:
+        return None
+    return val if val > 0 else None
+
+
+def _render_cycles_for_system_prompt(scratchpad: Dict[str, Any]) -> str:
+    cycles = scratchpad.get("cycles")
+    if not isinstance(cycles, list) or not cycles:
+        return ""
+
+    # Keep the system prompt bounded: tool outputs can be very large (fetch_url/web_search).
+    max_cycles = 6
+    max_thought_chars = 600
+    max_obs_chars = 220
+
+    view = [c for c in cycles if isinstance(c, dict)]
+    if len(view) > max_cycles:
+        view = view[-max_cycles:]
+
+    lines: list[str] = []
+    for c in view:
+        i = c.get("i")
+        thought = str(c.get("thought") or "").strip()
+        if len(thought) > max_thought_chars:
+            thought = f"{thought[: max(0, max_thought_chars - 1)]}…"
+        tcs = c.get("tool_calls")
+        obs = c.get("observations")
+        if i is None:
+            continue
+        lines.append(f"[cycle {i}]")
+        if thought:
+            lines.append(f"thought: {thought}")
+        if isinstance(tcs, list) and tcs:
+            sigs: list[str] = []
+            for tc in tcs:
+                if isinstance(tc, dict):
+                    sigs.append(_tool_call_signature(tc.get("name", ""), tc.get("arguments")))
+            if sigs:
+                lines.append("actions:")
+                for s in sigs:
+                    lines.append(f"- {s}")
+        if isinstance(obs, list) and obs:
+            lines.append("observations:")
+            for o in obs:
+                if not isinstance(o, dict):
+                    continue
+                name = str(o.get("name") or "tool")
+                ok = bool(o.get("success"))
+                out = o.get("output")
+                err = o.get("error")
+                if not ok:
+                    text = str(err or out or "").strip()
+                else:
+                    if isinstance(out, dict):
+                        # Prefer metadata-ish fields; do not dump full `rendered` bodies into the prompt.
+                        url = out.get("url") if isinstance(out.get("url"), str) else None
+                        status = out.get("status_code") if out.get("status_code") is not None else None
+                        content_type = out.get("content_type") if isinstance(out.get("content_type"), str) else None
+                        rendered = out.get("rendered") if isinstance(out.get("rendered"), str) else None
+                        rendered_len = len(rendered) if isinstance(rendered, str) else None
+                        parts: list[str] = []
+                        if url:
+                            parts.append(f"url={url}")
+                        if status is not None:
+                            parts.append(f"status={status}")
+                        if content_type:
+                            parts.append(f"type={content_type}")
+                        if rendered_len is not None:
+                            parts.append(f"rendered_len={rendered_len}")
+                        text = ", ".join(parts) if parts else f"keys={list(out.keys())[:8]}"
+                    else:
+                        text = str(out or "").strip()
+                if len(text) > max_obs_chars:
+                    text = f"{text[: max(0, max_obs_chars - 1)]}…"
+                lines.append(f"- [{name}] {'OK' if ok else 'ERR'}: {text}")
+        lines.append("")
+    return "\n".join(lines).strip()
+
+
+def _render_cycles_for_conclusion_prompt(scratchpad: Dict[str, Any]) -> str:
+    cycles = scratchpad.get("cycles")
+    if not isinstance(cycles, list) or not cycles:
+        return ""
+
+    # The conclusion prompt should have access to the full loop trace, but still needs
+    # to be bounded (tool outputs may be huge).
+    max_cycles = 25
+    max_thought_chars = 900
+    max_obs_chars = 360
+
+    view = [c for c in cycles if isinstance(c, dict)]
+    total = len(view)
+    if total > max_cycles:
+        view = view[-max_cycles:]
+
+    lines: list[str] = []
+    if total > len(view):
+        lines.append(f"(showing last {len(view)} of {total} cycles)")
+        lines.append("")
+
+    for c in view:
+        i = c.get("i")
+        if i is None:
+            continue
+        lines.append(f"[cycle {i}]")
+
+        thought = str(c.get("thought") or "").strip()
+        if len(thought) > max_thought_chars:
+            thought = f"{thought[: max(0, max_thought_chars - 1)]}…"
+        if thought:
+            lines.append(f"thought: {thought}")
+
+        tcs = c.get("tool_calls")
+        if isinstance(tcs, list) and tcs:
+            sigs: list[str] = []
+            for tc in tcs:
+                if isinstance(tc, dict):
+                    sigs.append(_tool_call_signature(tc.get("name", ""), tc.get("arguments")))
+            if sigs:
+                lines.append("actions:")
+                for s in sigs:
+                    lines.append(f"- {s}")
+
+        obs = c.get("observations")
+        if isinstance(obs, list) and obs:
+            lines.append("observations:")
+            for o in obs:
+                if not isinstance(o, dict):
+                    continue
+                name = str(o.get("name") or "tool")
+                ok = bool(o.get("success"))
+                out = o.get("output")
+                err = o.get("error")
+                if not ok:
+                    text = str(err or out or "").strip()
+                else:
+                    if isinstance(out, dict):
+                        url = out.get("url") if isinstance(out.get("url"), str) else None
+                        status = out.get("status_code") if out.get("status_code") is not None else None
+                        content_type = out.get("content_type") if isinstance(out.get("content_type"), str) else None
+                        rendered = out.get("rendered") if isinstance(out.get("rendered"), str) else None
+                        rendered_len = len(rendered) if isinstance(rendered, str) else None
+                        parts: list[str] = []
+                        if url:
+                            parts.append(f"url={url}")
+                        if status is not None:
+                            parts.append(f"status={status}")
+                        if content_type:
+                            parts.append(f"type={content_type}")
+                        if rendered_len is not None:
+                            parts.append(f"rendered_len={rendered_len}")
+                        text = ", ".join(parts) if parts else f"keys={list(out.keys())[:8]}"
+                    else:
+                        text = str(out or "").strip()
+                if len(text) > max_obs_chars:
+                    text = f"{text[: max(0, max_obs_chars - 1)]}…"
+                lines.append(f"- [{name}] {'OK' if ok else 'ERR'}: {text}")
+
+        lines.append("")
+
+    return "\n".join(lines).strip()
+
+
+def _render_final_report(task: str, scratchpad: Dict[str, Any]) -> str:
+    cycles = scratchpad.get("cycles")
+    if not isinstance(cycles, list):
+        cycles = []
+    lines: list[str] = []
+    lines.append(f"task: {task}")
+    lines.append(f"cycles: {len([c for c in cycles if isinstance(c, dict)])}")
+    lines.append("")
+    for c in cycles:
+        if not isinstance(c, dict):
+            continue
+        i = c.get("i")
+        lines.append(f"cycle {i}")
+        thought = str(c.get("thought") or "").strip()
+        if thought:
+            lines.append(f"- thought: {thought}")
+        tcs = c.get("tool_calls")
+        if isinstance(tcs, list) and tcs:
+            lines.append("- actions:")
+            for tc in tcs:
+                if not isinstance(tc, dict):
+                    continue
+                lines.append(f" - {_tool_call_signature(tc.get('name',''), tc.get('arguments'))}")
+        obs = c.get("observations")
+        if isinstance(obs, list) and obs:
+            lines.append("- observations:")
+            for o in obs:
+                if not isinstance(o, dict):
+                    continue
+                name = str(o.get("name") or "tool")
+                ok = bool(o.get("success"))
+                out = o.get("output")
+                err = o.get("error")
+                text = str(out if ok else (err or out) or "").strip()
+                lines.append(f" - [{name}] {'OK' if ok else 'ERR'}: {text}")
+        lines.append("")
+    return "\n".join(lines).strip()
+
+
 def create_react_workflow(
     *,
     logic: ReActLogic,
     on_step: Optional[Callable[[str, Dict[str, Any]], None]] = None,
+    workflow_id: str = "react_agent",
+    provider: Optional[str] = None,
+    model: Optional[str] = None,
+    allowed_tools: Optional[List[str]] = None,
 ) -> WorkflowSpec:
     """Adapt ReActLogic to an AbstractRuntime workflow."""
 
```
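The two new helpers solve the same problem at different fidelities: `_tool_call_signature` renders a human-readable, size-bounded call for the prompt, while `_tool_call_fingerprint` canonicalizes arguments (replacing any string over 200 characters with a length-plus-hash marker) so repeated calls compare equal without embedding blobs. A self-contained sketch of the fingerprint idea, simplified from the diff:

```python
import hashlib
import json

def fingerprint(name: str, args: dict) -> str:
    # Canonicalize: long strings become {len, sha256} markers, dict keys are
    # sorted, lists are truncated; then hash the compact JSON encoding.
    def canon(v):
        if isinstance(v, str) and len(v) > 200:
            return {"_type": "str", "len": len(v),
                    "sha256": hashlib.sha256(v.encode("utf-8")).hexdigest()[:16]}
        if isinstance(v, dict):
            return {str(k): canon(v[k]) for k in sorted(v, key=str)}
        if isinstance(v, list):
            return [canon(x) for x in v[:25]]
        return v

    raw = json.dumps({"name": name.strip(), "args": canon(args)},
                     sort_keys=True, separators=(",", ":"), ensure_ascii=False)
    return hashlib.sha256(raw.encode("utf-8")).hexdigest()[:16]

# Identical huge payloads still compare equal, without storing the payload.
big = "x" * 10_000
assert fingerprint("write_file", {"path": "a.txt", "content": big}) == \
       fingerprint("write_file", {"path": "a.txt", "content": big})
```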
@@ -110,177 +632,708 @@ def create_react_workflow(
|
|
|
110
632
|
if on_step:
|
|
111
633
|
on_step(step, data)
|
|
112
634
|
|
|
113
|
-
|
|
114
|
-
|
|
115
|
-
|
|
635
|
+
def _current_tool_defs() -> list[Any]:
|
|
636
|
+
defs = getattr(logic, "tools", None)
|
|
637
|
+
if not isinstance(defs, list):
|
|
638
|
+
try:
|
|
639
|
+
defs = list(defs) # type: ignore[arg-type]
|
|
640
|
+
except Exception:
|
|
641
|
+
defs = []
|
|
642
|
+
return [t for t in defs if getattr(t, "name", None)]
|
|
643
|
+
|
|
644
|
+
def _tool_by_name() -> dict[str, Any]:
|
|
645
|
+
out: dict[str, Any] = {}
|
|
646
|
+
for t in _current_tool_defs():
|
|
647
|
+
name = getattr(t, "name", None)
|
|
648
|
+
if isinstance(name, str) and name.strip():
|
|
649
|
+
out[name] = t
|
|
650
|
+
return out
|
|
651
|
+
|
|
652
|
+
def _default_allowlist() -> list[str]:
|
|
653
|
+
if isinstance(allowed_tools, list):
|
|
654
|
+
allow = [str(t).strip() for t in allowed_tools if isinstance(t, str) and t.strip()]
|
|
655
|
+
return allow if allow else []
|
|
656
|
+
out: list[str] = []
|
|
657
|
+
seen: set[str] = set()
|
|
658
|
+
for t in _current_tool_defs():
|
|
659
|
+
name = getattr(t, "name", None)
|
|
660
|
+
if not isinstance(name, str) or not name.strip() or name in seen:
|
|
661
|
+
continue
|
|
662
|
+
seen.add(name)
|
|
663
|
+
out.append(name)
|
|
664
|
+
return out
|
|
665
|
+
|
|
666
|
+
def _normalize_allowlist(raw: Any) -> list[str]:
|
|
667
|
+
if isinstance(raw, list):
|
|
668
|
+
items = raw
|
|
669
|
+
elif isinstance(raw, tuple):
|
|
670
|
+
items = list(raw)
|
|
671
|
+
elif isinstance(raw, str):
|
|
672
|
+
items = [raw]
|
|
673
|
+
else:
|
|
674
|
+
items = []
|
|
675
|
+
|
|
676
|
+
current = _tool_by_name()
|
|
677
|
+
out: list[str] = []
|
|
678
|
+
seen: set[str] = set()
|
|
679
|
+
for t in items:
|
|
680
|
+
if not isinstance(t, str):
|
|
681
|
+
continue
|
|
682
|
+
name = t.strip()
|
|
683
|
+
if not name or name in seen or name not in current:
|
|
684
|
+
continue
|
|
685
|
+
seen.add(name)
|
|
686
|
+
out.append(name)
|
|
687
|
+
return out
|
|
688
|
+
|
|
689
|
+
def _effective_allowlist(runtime_ns: Dict[str, Any]) -> list[str]:
|
|
690
|
+
if isinstance(runtime_ns, dict) and "allowed_tools" in runtime_ns:
|
|
691
|
+
normalized = _normalize_allowlist(runtime_ns.get("allowed_tools"))
|
|
692
|
+
runtime_ns["allowed_tools"] = normalized
|
|
693
|
+
return normalized
|
|
694
|
+
return _normalize_allowlist(list(_default_allowlist()))
|
|
695
|
+
|
|
696
|
+
def _allowed_tool_defs(allow: list[str]) -> list[Any]:
|
|
697
|
+
out: list[Any] = []
|
|
698
|
+
current = _tool_by_name()
|
|
699
|
+
for name in allow:
|
|
700
|
+
tool = current.get(name)
|
|
701
|
+
if tool is not None:
|
|
702
|
+
out.append(tool)
|
|
703
|
+
return out
|
|
704
|
+
|
|
705
|
+
def _tool_prompt_examples_enabled(runtime_ns: Dict[str, Any]) -> bool:
|
|
706
|
+
raw = runtime_ns.get("tool_prompt_examples") if isinstance(runtime_ns, dict) else None
|
|
707
|
+
if raw is None:
|
|
708
|
+
return True
|
|
709
|
+
if isinstance(raw, bool):
|
|
710
|
+
return raw
|
|
711
|
+
if isinstance(raw, (int, float)):
|
|
712
|
+
return bool(raw)
|
|
713
|
+
if isinstance(raw, str):
|
|
714
|
+
lowered = raw.strip().lower()
|
|
715
|
+
if lowered in {"0", "false", "no", "off", "disabled"}:
|
|
716
|
+
return False
|
|
717
|
+
if lowered in {"1", "true", "yes", "on", "enabled"}:
|
|
718
|
+
return True
|
|
719
|
+
return True
|
|
720
|
+
|
|
721
|
+
def _materialize_tool_specs(defs: list[Any], *, include_examples: bool) -> list[dict[str, Any]]:
|
|
722
|
+
out: list[dict[str, Any]] = []
|
|
723
|
+
for t in defs:
|
|
724
|
+
try:
|
|
725
|
+
d = t.to_dict()
|
|
726
|
+
except Exception:
|
|
727
|
+
continue
|
|
728
|
+
if isinstance(d, dict):
|
|
729
|
+
if not include_examples:
|
|
730
|
+
d = dict(d)
|
|
731
|
+
d.pop("examples", None)
|
|
732
|
+
out.append(d)
|
|
733
|
+
return out
|
|
734
|
+
|
|
735
|
+
def _sanitize_llm_messages(messages: Any) -> List[Dict[str, Any]]:
|
|
736
|
+
if not isinstance(messages, list) or not messages:
|
|
737
|
+
return []
|
|
738
|
+
out: List[Dict[str, Any]] = []
|
|
739
|
+
|
|
740
|
+
def _sanitize_tool_calls(raw: Any) -> Optional[list[dict[str, Any]]]:
|
|
741
|
+
if not isinstance(raw, list) or not raw:
|
|
742
|
+
return None
|
|
743
|
+
cleaned: list[dict[str, Any]] = []
|
|
744
|
+
for i, tc in enumerate(raw):
|
|
745
|
+
if not isinstance(tc, dict):
|
|
746
|
+
continue
|
|
747
|
+
tc_type = str(tc.get("type") or "function")
|
|
748
|
+
if tc_type != "function":
|
|
749
|
+
continue
|
|
750
|
+
call_id = tc.get("id")
|
|
751
|
+
call_id_str = str(call_id).strip() if call_id is not None else ""
|
|
752
|
+
if not call_id_str:
|
|
753
|
+
call_id_str = f"call_{i+1}"
|
|
754
|
+
fn = tc.get("function") if isinstance(tc.get("function"), dict) else {}
|
|
755
|
+
name = str(fn.get("name") or "").strip()
|
|
756
|
+
if not name:
|
|
757
|
+
continue
|
|
758
|
+
args = fn.get("arguments")
|
|
759
|
+
if isinstance(args, dict):
|
|
760
|
+
args_str = json.dumps(args, ensure_ascii=False)
|
|
761
|
+
else:
|
|
762
|
+
args_str = "" if args is None else str(args)
|
|
763
|
+
cleaned.append({"type": "function", "id": call_id_str, "function": {"name": name, "arguments": args_str}})
|
|
764
|
+
return cleaned or None
|
|
765
|
+
|
|
766
|
+
for m in messages:
|
|
767
|
+
if not isinstance(m, dict):
|
|
768
|
+
continue
|
|
769
|
+
role = str(m.get("role") or "").strip()
|
|
770
|
+
if not role:
|
|
771
|
+
continue
|
|
772
|
+
content = m.get("content")
|
|
773
|
+
content_str = "" if content is None else str(content)
|
|
774
|
+
tool_calls_raw = m.get("tool_calls")
|
|
775
|
+
tool_calls = _sanitize_tool_calls(tool_calls_raw)
|
|
776
|
+
|
|
777
|
+
# Assistant tool-calls messages may legitimately have empty content, but must still be included.
|
|
778
|
+
if not content_str.strip() and not (role == "assistant" and tool_calls):
|
|
779
|
+
continue
|
|
780
|
+
|
|
781
|
+
entry: Dict[str, Any] = {"role": role, "content": content_str}
|
|
782
|
+
if role == "tool":
|
|
783
|
+
meta = m.get("metadata") if isinstance(m.get("metadata"), dict) else {}
|
|
784
|
+
call_id = meta.get("call_id") if isinstance(meta, dict) else None
|
|
785
|
+
if call_id is not None and str(call_id).strip():
|
|
786
|
+
entry["tool_call_id"] = str(call_id).strip()
|
|
787
|
+
elif role == "assistant" and tool_calls:
|
|
788
|
+
entry["tool_calls"] = tool_calls
|
|
789
|
+
out.append(entry)
|
|
790
|
+
return out
|
|
791
|
+
|
|
792
|
+
builtin_effect_tools = {
|
|
793
|
+
"ask_user",
|
|
794
|
+
"recall_memory",
|
|
795
|
+
"inspect_vars",
|
|
796
|
+
"remember",
|
|
797
|
+
"remember_note",
|
|
798
|
+
"compact_memory",
|
|
799
|
+
"delegate_agent",
|
|
800
|
+
}
|
|
116
801
|
|
|
117
802
|
def init_node(run: RunState, ctx) -> StepPlan:
|
|
118
803
|
context, scratchpad, runtime_ns, _, limits = ensure_react_vars(run)
|
|
804
|
+
|
|
119
805
|
scratchpad["iteration"] = 0
|
|
120
806
|
limits["current_iteration"] = 0
|
|
121
807
|
|
|
808
|
+
# Disable runtime-level input trimming for ReAct loops.
|
|
809
|
+
if isinstance(runtime_ns, dict):
|
|
810
|
+
runtime_ns.setdefault("disable_input_trimming", True)
|
|
811
|
+
# Disable all truncation/capping knobs for ReAct runs (policy: full context for now).
|
|
812
|
+
# These can be re-enabled later once correctness is proven.
|
|
813
|
+
if isinstance(limits, dict):
|
|
814
|
+
limits["max_output_tokens"] = None
|
|
815
|
+
limits["max_input_tokens"] = None
|
|
816
|
+
limits["max_history_messages"] = -1
|
|
817
|
+
limits["max_message_chars"] = -1
|
|
818
|
+
limits["max_tool_message_chars"] = -1
|
|
819
|
+
|
|
122
820
|
task = str(context.get("task", "") or "")
|
|
123
821
|
context["task"] = task
|
|
124
|
-
|
|
125
|
-
|
|
126
|
-
|
|
127
|
-
messages
|
|
128
|
-
|
|
129
|
-
|
|
130
|
-
|
|
131
|
-
|
|
132
|
-
runtime_ns
|
|
133
|
-
|
|
134
|
-
|
|
822
|
+
msgs = context.get("messages")
|
|
823
|
+
if not isinstance(msgs, list):
|
|
824
|
+
msgs = []
|
|
825
|
+
context["messages"] = msgs
|
|
826
|
+
|
|
827
|
+
if task and (not msgs or msgs[-1].get("role") != "user" or msgs[-1].get("content") != task):
|
|
828
|
+
msgs.append(_new_message(ctx, role="user", content=task))
|
|
829
|
+
|
|
830
|
+
allow = _effective_allowlist(runtime_ns)
|
|
831
|
+
allowed_defs = _allowed_tool_defs(allow)
|
|
832
|
+
include_examples = _tool_prompt_examples_enabled(runtime_ns)
|
|
833
|
+
tool_specs = _materialize_tool_specs(allowed_defs, include_examples=include_examples)
|
|
834
|
+
runtime_ns["tool_specs"] = tool_specs
|
|
835
|
+
runtime_ns["toolset_id"] = _compute_toolset_id(tool_specs)
|
|
836
|
+
runtime_ns.setdefault("allowed_tools", allow)
|
|
837
|
+
|
|
838
|
+
scratchpad.setdefault("cycles", [])
|
|
135
839
|
return StepPlan(node_id="init", next_node="reason")
|
|
136
840
|
|
|
137
841
|
def reason_node(run: RunState, ctx) -> StepPlan:
|
|
138
|
-
context, scratchpad, runtime_ns,
|
|
842
|
+
context, scratchpad, runtime_ns, temp, limits = ensure_react_vars(run)
|
|
139
843
|
|
|
140
|
-
#
|
|
141
|
-
|
|
142
|
-
|
|
143
|
-
|
|
144
|
-
|
|
145
|
-
|
|
146
|
-
|
|
147
|
-
|
|
844
|
+
# Durable resume safety:
|
|
845
|
+
# - tool definitions can change across restarts (env/toolset swaps, staged deploy swaps)
|
|
846
|
+
# - allowlists can be edited at runtime by hosts
|
|
847
|
+
# `tool_specs` must match the effective allowlist + current tool defs, otherwise the LLM may
|
|
848
|
+
# see tools it cannot execute ("tool not allowed") or see stale schemas (signature mismatch).
|
|
849
|
+
try:
|
|
850
|
+
if isinstance(runtime_ns, dict):
|
|
851
|
+
allow = _effective_allowlist(runtime_ns)
|
|
852
|
+
allowed_defs = _allowed_tool_defs(allow)
|
|
853
|
+
include_examples = _tool_prompt_examples_enabled(runtime_ns)
|
|
854
|
+
refreshed_specs = _materialize_tool_specs(allowed_defs, include_examples=include_examples)
|
|
855
|
+
refreshed_id = _compute_toolset_id(refreshed_specs)
|
|
856
|
+
prev_id = str(runtime_ns.get("toolset_id") or "")
|
|
857
|
+
prev_specs = runtime_ns.get("tool_specs")
|
|
858
|
+
if refreshed_id != prev_id or not isinstance(prev_specs, list):
|
|
859
|
+
runtime_ns["tool_specs"] = refreshed_specs
|
|
860
|
+
runtime_ns["toolset_id"] = refreshed_id
|
|
861
|
+
runtime_ns.setdefault("allowed_tools", allow)
|
|
862
|
+
except Exception:
|
|
863
|
+
pass
|
|
148
864
|
|
|
865
|
+
max_iterations = int(limits.get("max_iterations", 0) or scratchpad.get("max_iterations", 25) or 25)
|
|
149
866
|
if max_iterations < 1:
|
|
150
867
|
max_iterations = 1
|
|
151
868
|
|
|
152
|
-
|
|
869
|
+
iteration = int(scratchpad.get("iteration", 0) or 0) + 1
|
|
870
|
+
if iteration > max_iterations:
|
|
153
871
|
return StepPlan(node_id="reason", next_node="max_iterations")
|
|
154
872
|
|
|
155
|
-
|
|
156
|
-
|
|
157
|
-
limits["current_iteration"] = iteration + 1
|
|
873
|
+
scratchpad["iteration"] = iteration
|
|
874
|
+
limits["current_iteration"] = iteration
|
|
158
875
|
|
|
159
876
|
task = str(context.get("task", "") or "")
|
|
160
|
-
|
|
161
|
-
|
|
162
|
-
inbox = runtime_ns.get("inbox", [])
|
|
163
|
-
guidance = ""
|
|
164
|
-
if isinstance(inbox, list) and inbox:
|
|
165
|
-
inbox_messages = [str(m.get("content", "") or "") for m in inbox if isinstance(m, dict)]
|
|
166
|
-
guidance = " | ".join([m for m in inbox_messages if m])
|
|
167
|
-
runtime_ns["inbox"] = []
|
|
877
|
+
messages_view = list(context.get("messages") or [])
|
|
168
878
|
|
|
879
|
+
guidance = _drain_inbox(runtime_ns)
|
|
169
880
|
req = logic.build_request(
|
|
170
881
|
task=task,
|
|
171
|
-
messages=
|
|
882
|
+
messages=messages_view,
|
|
172
883
|
guidance=guidance,
|
|
173
|
-
iteration=iteration
|
|
884
|
+
iteration=iteration,
|
|
174
885
|
max_iterations=max_iterations,
|
|
175
|
-
vars=run.vars,
|
|
886
|
+
vars=run.vars,
|
|
176
887
|
)
|
|
177
888
|
|
|
178
|
-
emit("reason", {"iteration": iteration
|
|
889
|
+
emit("reason", {"iteration": iteration, "max_iterations": max_iterations, "has_guidance": bool(guidance)})
|
|
179
890
|
|
|
180
|
-
payload = {"prompt":
|
|
181
|
-
|
|
182
|
-
|
|
891
|
+
payload: Dict[str, Any] = {"prompt": ""}
|
|
892
|
+
sanitized_messages = _sanitize_llm_messages(messages_view)
|
|
893
|
+
if sanitized_messages:
|
|
894
|
+
payload["messages"] = sanitized_messages
|
|
895
|
+
else:
|
|
896
|
+
# Ensure LLM_CALL contract is satisfied even for one-shot runs where callers
|
|
897
|
+
# provide only `context.task` and no `context.messages`.
|
|
898
|
+
task_text = str(task or "").strip()
|
|
899
|
+
if task_text:
|
|
900
|
+
payload["prompt"] = task_text
|
|
901
|
+
media = extract_media_from_context(context)
|
|
902
|
+
if media:
|
|
903
|
+
payload["media"] = media
|
|
904
|
+
|
|
905
|
+
tool_specs = runtime_ns.get("tool_specs") if isinstance(runtime_ns, dict) else None
|
|
906
|
+
if isinstance(tool_specs, list) and tool_specs:
|
|
907
|
+
payload["tools"] = list(tool_specs)
|
|
908
|
+
|
|
909
|
+
sys_base = str(req.system_prompt or "").strip()
|
|
910
|
+
sys = _compose_system_prompt(runtime_ns, base=sys_base)
|
|
911
|
+
# Append scratchpad only when not using a full override prompt.
|
|
912
|
+
if _system_prompt_override(runtime_ns) is None:
|
|
913
|
+
scratch_txt = _render_cycles_for_system_prompt(scratchpad)
|
|
914
|
+
if scratch_txt:
|
|
915
|
+
sys = f"{sys.rstrip()}\n\n## Scratchpad (ReAct cycles so far)\n{scratch_txt}".strip()
|
|
916
|
+
if sys:
|
|
917
|
+
payload["system_prompt"] = sys
|
|
918
|
+
|
|
919
|
+
eff_provider = provider if isinstance(provider, str) and provider.strip() else runtime_ns.get("provider")
|
|
920
|
+
eff_model = model if isinstance(model, str) and model.strip() else runtime_ns.get("model")
|
|
921
|
+
if isinstance(eff_provider, str) and eff_provider.strip():
|
|
922
|
+
payload["provider"] = eff_provider.strip()
|
|
923
|
+
if isinstance(eff_model, str) and eff_model.strip():
|
|
924
|
+
payload["model"] = eff_model.strip()
|
|
925
|
+
|
|
926
|
+
params: Dict[str, Any] = {}
|
|
927
|
+
max_out = _max_output_tokens(runtime_ns, limits)
|
|
928
|
+
if isinstance(max_out, int) and max_out > 0:
|
|
929
|
+
params["max_tokens"] = max_out
|
|
930
|
+
# Tool calling is formatting-sensitive; bias toward a lower temperature when tools are present,
|
|
931
|
+
# unless the caller explicitly sets `_runtime.temperature`.
|
|
932
|
+
default_temp = 0.2 if isinstance(tool_specs, list) and tool_specs else 0.7
|
|
933
|
+
payload["params"] = runtime_llm_params(runtime_ns, extra=params, default_temperature=default_temp)
|
|
183
934
|
|
|
184
935
|
return StepPlan(
|
|
185
936
|
node_id="reason",
|
|
186
|
-
effect=Effect(
|
|
187
|
-
type=EffectType.LLM_CALL,
|
|
188
|
-
payload=payload,
|
|
189
|
-
result_key="_temp.llm_response",
|
|
190
|
-
),
|
|
937
|
+
effect=Effect(type=EffectType.LLM_CALL, payload=payload, result_key="_temp.llm_response"),
|
|
191
938
|
next_node="parse",
|
|
192
939
|
)
|
|
193
940
|
|
|
194
941
|
def parse_node(run: RunState, ctx) -> StepPlan:
|
|
195
|
-
context,
|
|
942
|
+
context, scratchpad, runtime_ns, temp, limits = ensure_react_vars(run)
|
|
196
943
|
response = temp.get("llm_response", {})
|
|
197
|
-
content, tool_calls = logic.parse_response(response)
|
|
198
944
|
|
|
199
|
-
|
|
945
|
+
content, tool_calls = logic.parse_response(response)
|
|
946
|
+
finish_reason = ""
|
|
947
|
+
if isinstance(response, dict):
|
|
948
|
+
fr = response.get("finish_reason")
|
|
949
|
+
finish_reason = str(fr or "").strip().lower() if fr is not None else ""
|
|
200
950
|
|
|
951
|
+
cycle_i = int(scratchpad.get("iteration", 0) or 0)
|
|
952
|
+
max_iterations = int(limits.get("max_iterations", 0) or scratchpad.get("max_iterations", 25) or 25)
|
|
953
|
+
if max_iterations < 1:
|
|
954
|
+
max_iterations = 1
|
|
955
|
+
reasoning_text = ""
|
|
956
|
+
try:
|
|
957
|
+
if isinstance(response, dict):
|
|
958
|
+
rc = response.get("reasoning")
|
|
959
|
+
if rc is None:
|
|
960
|
+
rc = response.get("reasoning_content")
|
|
961
|
+
reasoning_text = str(rc or "")
|
|
962
|
+
except Exception:
|
|
963
|
+
reasoning_text = ""
|
|
201
964
|
emit(
|
|
202
965
|
"parse",
|
|
203
966
|
{
|
|
967
|
+
"iteration": cycle_i,
|
|
968
|
+
"max_iterations": max_iterations,
|
|
204
969
|
"has_tool_calls": bool(tool_calls),
|
|
205
|
-
"
|
|
970
|
+
"content": str(content or ""),
|
|
971
|
+
"reasoning": reasoning_text,
|
|
206
972
|
},
|
|
207
973
|
)
|
|
208
|
-
|
|
974
|
+
cycle: Dict[str, Any] = {"i": cycle_i, "thought": content, "tool_calls": [], "observations": []}
|
|
975
|
+
cycles = scratchpad.get("cycles")
|
|
976
|
+
if isinstance(cycles, list):
|
|
977
|
+
cycles.append(cycle)
|
|
978
|
+
else:
|
|
979
|
+
scratchpad["cycles"] = [cycle]
|
|
209
980
|
|
|
210
981
|
if tool_calls:
|
|
982
|
+
cycle["tool_calls"] = [tc.__dict__ for tc in tool_calls]
|
|
983
|
+
|
|
984
|
+
# Loop guard: some models may repeat the exact same tool calls (including side effects)
|
|
985
|
+
# even after receiving successful observations. Skip executing duplicates to avoid
|
|
986
|
+
# repeatedly overwriting files or re-running commands.
|
|
987
|
+
try:
|
|
988
|
+
side_effect_tools = {
|
|
989
|
+
"write_file",
|
|
990
|
+
"edit_file",
|
|
991
|
+
"execute_command",
|
|
992
|
+
# Comms tools (side-effectful; avoid duplicate sends).
|
|
993
|
+
"send_email",
|
|
994
|
+
"send_whatsapp_message",
|
|
995
|
+
"send_telegram_message",
|
|
996
|
+
"send_telegram_artifact",
|
|
997
|
+
}
|
|
998
|
+
has_side_effect = any(
|
|
999
|
+
isinstance(getattr(tc, "name", None), str) and str(getattr(tc, "name") or "").strip() in side_effect_tools
|
|
1000
|
+
for tc in tool_calls
|
|
1001
|
+
)
|
|
1002
|
+
|
|
1003
|
+
if has_side_effect:
|
|
1004
|
+
cycles_list = scratchpad.get("cycles")
|
|
1005
|
+
prev_cycle: Optional[Dict[str, Any]] = None
|
|
1006
|
+
if isinstance(cycles_list, list) and len(cycles_list) >= 2:
|
|
1007
|
+
for c in reversed(cycles_list[:-1]):
|
|
1008
|
+
if not isinstance(c, dict):
|
|
1009
|
+
continue
|
|
1010
|
+
prev_tcs = c.get("tool_calls")
|
|
1011
|
+
if isinstance(prev_tcs, list) and prev_tcs:
|
|
1012
|
+
prev_cycle = c
|
|
1013
|
+
break
|
|
1014
|
+
|
|
1015
|
+
def _cycle_fps(c: Dict[str, Any]) -> list[str]:
|
|
1016
|
+
tcs2 = c.get("tool_calls")
|
|
1017
|
+
if not isinstance(tcs2, list) or not tcs2:
|
|
1018
|
+
return []
|
|
1019
|
+
fps: list[str] = []
|
|
1020
|
+
for tc in tcs2:
|
|
1021
|
+
if not isinstance(tc, dict):
|
|
1022
|
+
continue
|
|
1023
|
+
fps.append(_tool_call_fingerprint(tc.get("name", ""), tc.get("arguments")))
|
|
1024
|
+
return fps
|
|
1025
|
+
|
|
1026
|
+
def _cycle_obs_all_ok(c: Dict[str, Any]) -> bool:
|
|
1027
|
+
obs2 = c.get("observations")
|
|
1028
|
+
if not isinstance(obs2, list) or not obs2:
|
|
1029
|
+
return False
|
|
1030
|
+
for o in obs2:
|
|
1031
|
+
if not isinstance(o, dict):
|
|
1032
|
+
return False
|
|
1033
|
+
if o.get("success") is not True:
|
|
1034
|
+
return False
|
|
1035
|
+
return True
|
|
1036
|
+
|
|
1037
|
+
if prev_cycle is not None and _cycle_obs_all_ok(prev_cycle):
|
|
1038
|
+
prev_fps = _cycle_fps(prev_cycle)
|
|
1039
|
+
cur_fps = [_tool_call_fingerprint(tc.name, tc.arguments) for tc in tool_calls]
|
|
1040
|
+
if prev_fps and prev_fps == cur_fps:
|
|
1041
|
+
_push_inbox(
|
|
1042
|
+
runtime_ns,
|
|
1043
|
+
"You are repeating the exact same tool calls as the previous cycle, and they already succeeded.\n"
|
|
1044
|
+
"Do NOT execute them again (to avoid duplicate side effects).\n"
|
|
1045
|
+
"Instead, use the existing tool outputs and provide the final answer with NO tool calls.",
|
|
1046
|
+
)
|
|
1047
|
+
emit("parse_repeat_tool_calls", {"cycle": cycle_i, "count": len(tool_calls)})
|
|
1048
|
+
temp["pending_tool_calls"] = []
|
|
1049
|
+
return StepPlan(node_id="parse", next_node="reason")
|
|
1050
|
+
except Exception:
|
|
1051
|
+
pass
|
|
1052
|
+
|
|
1053
|
+
# Keep tool transcript in context for OpenAI-compatible tool calling.
|
|
1054
|
+
context["messages"].append(
|
|
1055
|
+
_new_assistant_message_with_tool_calls(
|
|
1056
|
+
ctx,
|
|
1057
|
+
content="", # thought is stored in scratchpad (not user-visible history)
|
|
1058
|
+
tool_calls=tool_calls,
|
|
1059
|
+
metadata={"kind": "tool_calls", "cycle": cycle_i},
|
|
1060
|
+
)
|
|
1061
|
+
)
|
|
211
1062
|
temp["pending_tool_calls"] = [tc.__dict__ for tc in tool_calls]
|
|
1063
|
+
emit("parse_tool_calls", {"count": len(tool_calls)})
|
|
212
1064
|
return StepPlan(node_id="parse", next_node="act")
|
|
213
1065
|
|
|
214
|
-
|
|
1066
|
+
# If the model hit an output limit, treat the step as incomplete and continue.
|
|
1067
|
+
if finish_reason in {"length", "max_tokens"}:
|
|
1068
|
+
_push_inbox(
|
|
1069
|
+
runtime_ns,
|
|
1070
|
+
"Your previous response hit an output token limit before producing a complete tool call.\n"
|
|
1071
|
+
"Retry now: emit ONLY the next tool call(s) needed to make progress.\n"
|
|
1072
|
+
"Keep tool call arguments small (avoid large file contents / giant JSON blobs) to prevent tool-call truncation.\n"
|
|
1073
|
+
"For large files, create a small skeleton first, then refine via multiple smaller edits/tool calls.\n"
|
|
1074
|
+
"Do not write a long plan before tool calls.",
|
|
1075
|
+
)
|
|
1076
|
+
emit("parse_retry_truncated", {"cycle": cycle_i})
|
|
1077
|
+
return StepPlan(node_id="parse", next_node="reason")
|
|
1078
|
+
|
|
1079
|
+
if not isinstance(content, str) or not content.strip():
|
|
1080
|
+
_push_inbox(runtime_ns, "Your previous response was empty. Continue the task.")
|
|
1081
|
+
emit("parse_retry_empty", {"cycle": cycle_i})
|
|
1082
|
+
return StepPlan(node_id="parse", next_node="reason")
|
|
1083
|
+
|
|
1084
|
+
# Followthrough heuristic: retry when the model claims it will take actions but emits no tool calls.
|
|
1085
|
+
# Default ON (disable with `_runtime.check_plan=false`).
|
|
1086
|
+
raw_check_plan = runtime_ns.get("check_plan") if isinstance(runtime_ns, dict) else None
|
|
1087
|
+
check_plan = True if raw_check_plan is None else _boolish(raw_check_plan)
|
|
1088
|
+
if check_plan and cycle_i < max_iterations and _looks_like_deferred_action(content):
|
|
1089
|
+
_push_inbox(
|
|
1090
|
+
runtime_ns,
|
|
1091
|
+
"You said you would take an action, but you did not call any tools.\n"
|
|
1092
|
+
"If you need to act, call the next tool now (emit ONLY the next tool call(s)).\n"
|
|
1093
|
+
"If you are already done, provide the final answer with NO tool calls.",
|
|
1094
|
+
)
|
|
1095
|
+
emit("parse_retry_plan_only", {"cycle": cycle_i})
|
|
1096
|
+
return StepPlan(node_id="parse", next_node="reason")
|
|
1097
|
+
|
|
1098
|
+
# Final answer: stop the loop.
|
|
1099
|
+
answer = str(content).strip()
|
|
1100
|
+
temp["final_answer"] = answer
|
|
1101
|
+
emit("parse_final", {"cycle": cycle_i})
|
|
215
1102
|
return StepPlan(node_id="parse", next_node="done")
|
|
216
1103
|
|
|
217
1104
|
def act_node(run: RunState, ctx) -> StepPlan:
|
|
218
|
-
|
|
219
|
-
tool_calls = temp.get("pending_tool_calls", [])
|
|
220
|
-
if not isinstance(tool_calls, list):
|
|
221
|
-
tool_calls = []
|
|
1105
|
+
context, scratchpad, runtime_ns, temp, limits = ensure_react_vars(run)
|
|
222
1106
|
|
|
223
|
-
|
|
224
|
-
|
|
1107
|
+
pending = temp.get("pending_tool_calls", [])
|
|
1108
|
+
if not isinstance(pending, list):
|
|
1109
|
+
pending = []
|
|
225
1110
|
|
|
226
|
-
|
|
227
|
-
|
|
228
|
-
|
|
229
|
-
|
|
230
|
-
|
|
1111
|
+
cycle_i = int(scratchpad.get("iteration", 0) or 0)
|
|
1112
|
+
max_iterations = int(limits.get("max_iterations", 0) or scratchpad.get("max_iterations", 25) or 25)
|
|
1113
|
+
if max_iterations < 1:
|
|
1114
|
+
max_iterations = 1
|
|
1115
|
+
|
|
1116
|
+
tool_queue: list[Dict[str, Any]] = []
|
|
1117
|
+
for idx, tc in enumerate(pending):
|
|
1118
|
+
if isinstance(tc, ToolCall):
|
|
1119
|
+
d = tc.__dict__
|
|
1120
|
+
elif isinstance(tc, dict):
|
|
1121
|
+
d = dict(tc)
|
|
1122
|
+
else:
|
|
231
1123
|
continue
|
|
1124
|
+
if "call_id" not in d or not d.get("call_id"):
|
|
1125
|
+
d["call_id"] = str(idx)
|
|
1126
|
+
tool_queue.append(d)
|
|
1127
|
+
|
|
1128
|
+
if not tool_queue:
|
|
1129
|
+
temp["pending_tool_calls"] = []
|
|
1130
|
+
return StepPlan(node_id="act", next_node="reason")
|
|
1131
|
+
|
|
1132
|
+
allow = _effective_allowlist(runtime_ns)
|
|
1133
|
+
|
|
1134
|
+
def _is_builtin(tc: Dict[str, Any]) -> bool:
|
|
1135
|
+
name = tc.get("name")
|
|
1136
|
+
return isinstance(name, str) and name in builtin_effect_tools
|
|
1137
|
+
|
|
1138
|
+
if _is_builtin(tool_queue[0]):
|
|
1139
|
+
tc = tool_queue[0]
|
|
1140
|
+
name = str(tc.get("name") or "").strip()
|
|
232
1141
|
args = tc.get("arguments") or {}
|
|
233
|
-
|
|
234
|
-
|
|
235
|
-
|
|
1142
|
+
if not isinstance(args, dict):
|
|
1143
|
+
args = {}
|
|
1144
|
+
|
|
1145
|
+
temp["pending_tool_calls"] = list(tool_queue[1:])
|
|
1146
|
+
|
|
1147
|
+
if name and name not in allow:
|
|
1148
|
+
temp["tool_results"] = {
|
|
1149
|
+
"results": [
|
|
1150
|
+
{
|
|
1151
|
+
"call_id": str(tc.get("call_id") or ""),
|
|
1152
|
+
"name": name,
|
|
1153
|
+
"success": False,
|
|
1154
|
+
"output": None,
|
|
1155
|
+
"error": f"Tool '{name}' is not allowed for this agent",
|
|
1156
|
+
}
|
|
1157
|
+
]
|
|
1158
|
+
}
|
|
1159
|
+
emit("act_blocked", {"tool": name})
|
|
1160
|
+
return StepPlan(node_id="act", next_node="observe")
|
|
1161
|
+
|
|
1162
|
+
if name == "ask_user":
|
|
1163
|
+
question = str(args.get("question") or "Please provide input:")
|
|
1164
|
+
choices = args.get("choices")
|
|
1165
|
+
choices = list(choices) if isinstance(choices, list) else None
|
|
1166
|
+
|
|
1167
|
+
msgs = context.get("messages")
|
|
1168
|
+
if isinstance(msgs, list):
|
|
1169
|
+
msgs.append(
|
|
1170
|
+
_new_message(ctx, role="assistant", content=f"[Agent question]: {question}", metadata={"kind": "ask_user_prompt"})
|
|
1171
|
+
)
|
|
1172
|
+
|
|
1173
|
+
emit("ask_user", {"question": question, "choices": choices or []})
|
|
1174
|
+
return StepPlan(
|
|
1175
|
+
node_id="act",
|
|
1176
|
+
effect=Effect(
|
|
1177
|
+
type=EffectType.ASK_USER,
|
|
1178
|
+
payload={"prompt": question, "choices": choices, "allow_free_text": True},
|
|
1179
|
+
result_key="_temp.user_response",
|
|
1180
|
+
),
|
|
1181
|
+
next_node="handle_user_response",
|
|
1182
|
+
)
|
|
236
1183
|
|
|
237
|
-
|
|
238
|
-
|
|
239
|
-
|
|
240
|
-
|
|
241
|
-
|
|
242
|
-
|
|
243
|
-
|
|
244
|
-
result_key="_temp.
|
|
245
|
-
|
|
246
|
-
|
|
247
|
-
)
|
|
1184
|
+
if name == "recall_memory":
|
|
1185
|
+
payload = dict(args)
|
|
1186
|
+
payload.setdefault("tool_name", "recall_memory")
|
|
1187
|
+
payload.setdefault("call_id", tc.get("call_id") or "memory")
|
|
1188
|
+
emit("memory_query", {"query": payload.get("query"), "span_id": payload.get("span_id")})
|
|
1189
|
+
return StepPlan(
|
|
1190
|
+
node_id="act",
|
|
1191
|
+
effect=Effect(type=EffectType.MEMORY_QUERY, payload=payload, result_key="_temp.tool_results"),
|
|
1192
|
+
next_node="observe",
|
|
1193
|
+
)
|
|
248
1194
|
|
|
249
|
-
|
|
250
|
-
|
|
251
|
-
|
|
1195
|
+
if name == "inspect_vars":
|
|
1196
|
+
payload = dict(args)
|
|
1197
|
+
payload.setdefault("tool_name", "inspect_vars")
|
|
1198
|
+
payload.setdefault("call_id", tc.get("call_id") or "vars")
|
|
1199
|
+
emit("vars_query", {"path": payload.get("path")})
|
|
1200
|
+
return StepPlan(
|
|
1201
|
+
node_id="act",
|
|
1202
|
+
effect=Effect(type=EffectType.VARS_QUERY, payload=payload, result_key="_temp.tool_results"),
|
|
1203
|
+
next_node="observe",
|
|
1204
|
+
)
|
|
252
1205
|
|
|
253
|
-
|
|
254
|
-
|
|
255
|
-
|
|
256
|
-
|
|
257
|
-
|
|
258
|
-
|
|
259
|
-
|
|
260
|
-
|
|
261
|
-
|
|
1206
|
+
if name == "remember":
|
|
1207
|
+
payload = dict(args)
|
|
1208
|
+
payload.setdefault("tool_name", "remember")
|
|
1209
|
+
payload.setdefault("call_id", tc.get("call_id") or "memory")
|
|
1210
|
+
emit("memory_tag", {"span_id": payload.get("span_id"), "tags": payload.get("tags")})
|
|
1211
|
+
return StepPlan(
|
|
1212
|
+
node_id="act",
|
|
1213
|
+
effect=Effect(type=EffectType.MEMORY_TAG, payload=payload, result_key="_temp.tool_results"),
|
|
1214
|
+
next_node="observe",
|
|
1215
|
+
)
|
|
1216
|
+
|
|
1217
|
+
if name == "remember_note":
|
|
1218
|
+
payload = dict(args)
|
|
1219
|
+
payload.setdefault("tool_name", "remember_note")
|
|
1220
|
+
payload.setdefault("call_id", tc.get("call_id") or "memory")
|
|
1221
|
+
emit("memory_note", {"note": payload.get("note"), "tags": payload.get("tags")})
|
|
1222
|
+
return StepPlan(
|
|
1223
|
+
node_id="act",
|
|
1224
|
+
effect=Effect(type=EffectType.MEMORY_NOTE, payload=payload, result_key="_temp.tool_results"),
|
|
1225
|
+
next_node="observe",
|
|
262
1226
|
)
|
|
263
|
-
|
|
264
|
-
|
|
265
|
-
|
|
266
|
-
|
|
267
|
-
|
|
268
|
-
|
|
1227
|
+
|
|
1228
|
+
if name == "compact_memory":
|
|
1229
|
+
payload = dict(args)
|
|
1230
|
+
payload.setdefault("tool_name", "compact_memory")
|
|
1231
|
+
payload.setdefault("call_id", tc.get("call_id") or "compact")
|
|
1232
|
+
emit("memory_compact", {"preserve_recent": payload.get("preserve_recent"), "mode": payload.get("compression_mode")})
|
|
1233
|
+
return StepPlan(
|
|
1234
|
+
node_id="act",
|
|
1235
|
+
effect=Effect(type=EffectType.MEMORY_COMPACT, payload=payload, result_key="_temp.tool_results"),
|
|
1236
|
+
next_node="observe",
|
|
1237
|
+
)
+
+        if name == "delegate_agent":
+            delegated_task = str(args.get("task") or "").strip()
+            delegated_context = str(args.get("context") or "").strip()
+
+            tools_raw = args.get("tools")
+            if tools_raw is None:
+                # Inherit the current allowlist, but avoid recursive delegation and avoid waiting on ask_user
+                # unless explicitly enabled.
+                child_allow = [t for t in allow if t not in {"delegate_agent", "ask_user"}]
+            else:
+                child_allow = _normalize_allowlist(tools_raw)
+
+            if not delegated_task:
+                temp["tool_results"] = {
+                    "results": [
+                        {
+                            "call_id": str(tc.get("call_id") or ""),
+                            "name": "delegate_agent",
+                            "success": False,
+                            "output": None,
+                            "error": "delegate_agent requires a non-empty task",
+                        }
+                    ]
                 }
+                return StepPlan(node_id="act", next_node="observe")
+
+            combined_task = delegated_task
+            if delegated_context:
+                combined_task = f"{delegated_task}\n\nContext:\n{delegated_context}"
+
+            sub_vars: Dict[str, Any] = {
+                "context": {"task": combined_task, "messages": []},
+                "_runtime": {
+                    "allowed_tools": list(child_allow),
+                    "system_prompt_extra": (
+                        "You are a delegated sub-agent.\n"
+                        "- Focus ONLY on the delegated task.\n"
+                        "- Use ONLY the allowed tools when needed.\n"
+                        "- Do not ask the user questions; if blocked, state assumptions and proceed.\n"
+                        "- Return a concise result suitable for the parent agent to act on.\n"
+                    ),
+                },
+                "_limits": {"max_iterations": 10},
+            }
+
+            payload = {
+                "workflow_id": str(getattr(run, "workflow_id", "") or "react_agent"),
+                "vars": sub_vars,
+                "async": False,
+                "include_traces": False,
+                # Tool-mode wrapper so the parent receives a normal tool observation (no run failure on child failure).
+                "wrap_as_tool_result": True,
+                "tool_name": "delegate_agent",
+                "call_id": str(tc.get("call_id") or ""),
+            }
+            emit("delegate_agent", {"tools": list(child_allow), "call_id": payload.get("call_id")})
+            return StepPlan(
+                node_id="act",
+                effect=Effect(type=EffectType.START_SUBWORKFLOW, payload=payload, result_key="_temp.tool_results"),
+                next_node="observe",
             )
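
The delegation path above builds a child run of the same workflow: the sub-agent gets the combined task, a trimmed tool allowlist, and a hard cap of 10 iterations, and `wrap_as_tool_result` turns any child failure into an ordinary tool observation for the parent. The default allowlist rule in isolation, with hypothetical tool names:

    # Default child allowlist: inherit the parent's tools, minus the two that
    # could recurse (delegate_agent) or block on a human (ask_user).
    allow = ["fetch_url", "read_file", "delegate_agent", "ask_user"]
    child_allow = [t for t in allow if t not in {"delegate_agent", "ask_user"}]
    assert child_allow == ["fetch_url", "read_file"]
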

+        # Unknown builtin: continue.
+        return StepPlan(node_id="act", next_node="act" if temp.get("pending_tool_calls") else "reason")
+
+        batch: List[Dict[str, Any]] = []
+        for tc in tool_queue:
+            if _is_builtin(tc):
+                break
+            batch.append(tc)
+
+        remaining = tool_queue[len(batch) :]
+        temp["pending_tool_calls"] = list(remaining)
+
+        formatted_calls: List[Dict[str, Any]] = []
+        for tc in batch:
+            emit(
+                "act",
+                {
+                    "iteration": cycle_i,
+                    "max_iterations": max_iterations,
+                    "tool": tc.get("name", ""),
+                    "args": tc.get("arguments", {}),
+                    "call_id": str(tc.get("call_id") or ""),
+                },
+            )
+            formatted_calls.append(
+                {"name": tc.get("name", ""), "arguments": tc.get("arguments", {}), "call_id": str(tc.get("call_id") or "")}
+            )
+
         return StepPlan(
             node_id="act",
-            effect=Effect(
-                type=EffectType.TOOL_CALLS,
-                payload={"tool_calls": formatted_calls},
-                result_key="_temp.tool_results",
-            ),
+            effect=Effect(type=EffectType.TOOL_CALLS, payload={"tool_calls": formatted_calls, "allowed_tools": list(allow)}, result_key="_temp.tool_results"),
             next_node="observe",
         )
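
The batching logic above executes tool calls in order but never mixes builtins into a TOOL_CALLS effect: the batch is the longest builtin-free prefix of the queue, and everything from the first builtin onward waits in `_temp.pending_tool_calls` for the next pass through `act`. A worked example with a hypothetical queue and a simplified stand-in for the adapter's `_is_builtin`:

    def _is_builtin(tc):  # simplified stand-in for illustration only
        return tc["name"] in {"inspect_vars", "remember", "remember_note",
                              "compact_memory", "delegate_agent", "ask_user"}

    tool_queue = [{"name": "read_file"}, {"name": "fetch_url"},
                  {"name": "remember"}, {"name": "read_file"}]
    batch = []
    for tc in tool_queue:
        if _is_builtin(tc):
            break
        batch.append(tc)
    remaining = tool_queue[len(batch):]

    assert [t["name"] for t in batch] == ["read_file", "fetch_url"]
    assert [t["name"] for t in remaining] == ["remember", "read_file"]
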

     def observe_node(run: RunState, ctx) -> StepPlan:
-        context,
+        context, scratchpad, _, temp, _ = ensure_react_vars(run)
         tool_results = temp.get("tool_results", {})
         if not isinstance(tool_results, dict):
             tool_results = {}
@@ -289,6 +1342,26 @@ def create_react_workflow(
         if not isinstance(results, list):
             results = []

+        if results:
+            scratchpad["used_tools"] = True
+
+        # Attach observations to the most recent cycle.
+        cycles = scratchpad.get("cycles")
+        last_cycle: Optional[Dict[str, Any]] = None
+        if isinstance(cycles, list):
+            for c in reversed(cycles):
+                if isinstance(c, dict) and int(c.get("i") or -1) == int(scratchpad.get("iteration") or -1):
+                    last_cycle = c
+                    break
+
+        def _display(v: Any) -> str:
+            if isinstance(v, dict):
+                rendered = v.get("rendered")
+                if isinstance(rendered, str) and rendered.strip():
+                    return rendered.strip()
+            return "" if v is None else str(v)
+
+        obs_list: list[dict[str, Any]] = []
         for r in results:
             if not isinstance(r, dict):
                 continue
@@ -296,26 +1369,39 @@ def create_react_workflow(
             success = bool(r.get("success"))
             output = r.get("output", "")
             error = r.get("error", "")
-
-
-
-
-            )
-
+            display = _display(output)
+            if not success:
+                display = _display(output) if isinstance(output, dict) else str(error or output)
+            rendered = logic.format_observation(name=name, output=display, success=success)
+            emit("observe", {"tool": name, "success": success, "result": rendered})
+
             context["messages"].append(
                 _new_message(
                     ctx,
                     role="tool",
                     content=rendered,
-                    metadata={
-                        "name": name,
-                        "call_id": r.get("call_id"),
-                        "success": success,
-                    },
+                    metadata={"name": name, "call_id": r.get("call_id"), "success": success},
                 )
             )

+            obs_list.append(
+                {
+                    "call_id": r.get("call_id"),
+                    "name": name,
+                    "success": success,
+                    "output": output,
+                    "error": error,
+                    "rendered": rendered,
+                }
+            )
+
+        if last_cycle is not None:
+            last_cycle["observations"] = obs_list
+
         temp.pop("tool_results", None)
+        pending = temp.get("pending_tool_calls", [])
+        if isinstance(pending, list) and pending:
+            return StepPlan(node_id="observe", next_node="act")
         temp["pending_tool_calls"] = []
         return StepPlan(node_id="observe", next_node="reason")

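
Two things worth noting in the observe node above: the structured `obs_list` records (raw `output` plus the human-readable `rendered` text) are attached to the current scratchpad cycle, and `_display` prefers a dict result's pre-rendered string over `str()` of the whole dict. The latter in isolation, with hypothetical results:

    def _display(v):
        if isinstance(v, dict):
            rendered = v.get("rendered")
            if isinstance(rendered, str) and rendered.strip():
                return rendered.strip()
        return "" if v is None else str(v)

    assert _display({"rendered": "  3 files found  ", "raw": [...]}) == "3 files found"
    assert _display({"rows": 3}) == "{'rows': 3}"   # no usable "rendered" key
    assert _display(None) == ""
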
@@ -327,9 +1413,7 @@ def create_react_workflow(
         response_text = str(user_response.get("response", "") or "")
         emit("user_response", {"response": response_text})

-        context["messages"].append(
-            _new_message(ctx, role="user", content=f"[User response]: {response_text}")
-        )
+        context["messages"].append(_new_message(ctx, role="user", content=f"[User response]: {response_text}"))
         temp.pop("user_response", None)

         if temp.get("pending_tool_calls"):
@@ -338,43 +1422,182 @@ def create_react_workflow(

     def done_node(run: RunState, ctx) -> StepPlan:
         context, scratchpad, _, temp, limits = ensure_react_vars(run)
+        task = str(context.get("task", "") or "")
         answer = str(temp.get("final_answer") or "No answer provided")
+
         emit("done", {"answer": answer})

-
+        messages = context.get("messages")
+        if isinstance(messages, list):
+            last = messages[-1] if messages else None
+            last_role = last.get("role") if isinstance(last, dict) else None
+            last_content = last.get("content") if isinstance(last, dict) else None
+            if last_role != "assistant" or str(last_content or "") != answer:
+                messages.append(_new_message(ctx, role="assistant", content=answer, metadata={"kind": "final_answer"}))
+
         iterations = int(limits.get("current_iteration", 0) or scratchpad.get("iteration", 0) or 0)
+        report = _render_final_report(task, scratchpad)

         return StepPlan(
             node_id="done",
             complete_output={
                 "answer": answer,
+                "report": report,
                 "iterations": iterations,
                 "messages": list(context.get("messages") or []),
+                "scratchpad": dict(scratchpad),
             },
         )
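
The guard above makes the final-answer append idempotent: re-entering `done`, or seeding a new run from persisted history, cannot duplicate the closing assistant message. In isolation, with hypothetical messages:

    messages = [{"role": "user", "content": "hi"},
                {"role": "assistant", "content": "All done."}]
    answer = "All done."

    last = messages[-1] if messages else None
    last_role = last.get("role") if isinstance(last, dict) else None
    last_content = last.get("content") if isinstance(last, dict) else None
    if last_role != "assistant" or str(last_content or "") != answer:
        messages.append({"role": "assistant", "content": answer})

    assert len(messages) == 2  # unchanged: the answer was already persisted
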

     def max_iterations_node(run: RunState, ctx) -> StepPlan:
-        context, scratchpad,
-
-        # Prefer _limits, fall back to scratchpad
+        context, scratchpad, runtime_ns, temp, limits = ensure_react_vars(run)
         max_iterations = int(limits.get("max_iterations", 0) or scratchpad.get("max_iterations", 25) or 25)
         if max_iterations < 1:
             max_iterations = 1
         emit("max_iterations", {"iterations": max_iterations})

-
-
+        # Deterministic conclusion: when we hit the iteration cap, run one tool-free LLM call
+        # to synthesize a final report + next steps while the scratchpad is still in context.
+        resp = temp.get("max_iterations_llm_response")
+        if not isinstance(resp, dict):
+            drained_guidance = _drain_inbox(runtime_ns)
+            conclude_directive = (
+                "You have reached the maximum allowed ReAct iterations.\n"
+                "You MUST stop using tools now and provide a best-effort conclusion.\n\n"
+                "In your response, include:\n"
+                "1) A concise progress report (what you did + key observations).\n"
+                "2) The best current answer you can give based on evidence.\n"
+                "3) Remaining uncertainties / missing info.\n"
+                "4) Next steps: exact actions to finish (files to inspect/edit, commands/tools to run, what to look for).\n\n"
+                "Rules:\n"
+                "- Do NOT call tools.\n"
+                "- Do NOT output tool-call markup (e.g. <tool_call>...</tool_call>).\n"
+                "- Do NOT mention internal scratchpads; just present the report.\n"
+                "- Prefer bullet points and concrete next steps."
+            )
+
+            task = str(context.get("task", "") or "")
+            messages_view = list(context.get("messages") or [])
+
+            req = logic.build_request(
+                task=task,
+                messages=messages_view,
+                guidance="",
+                iteration=max_iterations,
+                max_iterations=max_iterations,
+                vars=run.vars,
+            )
+
+            payload: Dict[str, Any] = {"prompt": ""}
+            sanitized_messages = _sanitize_llm_messages(messages_view)
+            if sanitized_messages:
+                payload["messages"] = sanitized_messages
+            else:
+                task_text = str(task or "").strip()
+                if task_text:
+                    payload["prompt"] = task_text
+
+            media = extract_media_from_context(context)
+            if media:
+                payload["media"] = media
+
+            sys_base = str(req.system_prompt or "").strip()
+            sys = _compose_system_prompt(runtime_ns, base=sys_base)
+            block_parts: list[str] = []
+            if drained_guidance:
+                block_parts.append(f"Host guidance:\n{drained_guidance}")
+            block_parts.append(conclude_directive)
+            sys = (f"{sys.rstrip()}\n\n## Max iterations reached\n" + "\n\n".join(block_parts)).strip()
+            scratch_txt = _render_cycles_for_conclusion_prompt(scratchpad)
+            if scratch_txt:
+                sys = f"{sys.rstrip()}\n\n## Scratchpad (ReAct cycles so far)\n{scratch_txt}".strip()
+            if sys:
+                payload["system_prompt"] = sys
+
+            eff_provider = provider if isinstance(provider, str) and provider.strip() else runtime_ns.get("provider")
+            eff_model = model if isinstance(model, str) and model.strip() else runtime_ns.get("model")
+            if isinstance(eff_provider, str) and eff_provider.strip():
+                payload["provider"] = eff_provider.strip()
+            if isinstance(eff_model, str) and eff_model.strip():
+                payload["model"] = eff_model.strip()
+
+            params: Dict[str, Any] = {}
+            max_out = _max_output_tokens(runtime_ns, limits)
+            if isinstance(max_out, int) and max_out > 0:
+                params["max_tokens"] = max_out
+            payload["params"] = runtime_llm_params(runtime_ns, extra=params, default_temperature=0.2)
+
+            return StepPlan(
+                node_id="max_iterations",
+                effect=Effect(type=EffectType.LLM_CALL, payload=payload, result_key="_temp.max_iterations_llm_response"),
+                next_node="max_iterations",
+            )
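
This is the runtime's self-looping node pattern: the node schedules an effect, names itself as `next_node`, and on re-entry branches on whether the effect's result has appeared under its `result_key`. A minimal sketch, assuming the `run.vars` layout that `ensure_react_vars` maintains above:

    from abstractruntime import Effect, EffectType, StepPlan

    def conclude_node(run, ctx):
        temp = run.vars["_temp"]  # assumed layout; the adapter goes through ensure_react_vars
        resp = temp.get("max_iterations_llm_response")
        if not isinstance(resp, dict):
            # First entry: request the wrap-up; the runtime writes the LLM
            # result to result_key, then re-enters this same node.
            return StepPlan(
                node_id="max_iterations",
                effect=Effect(type=EffectType.LLM_CALL, payload={"prompt": "..."},
                              result_key="_temp.max_iterations_llm_response"),
                next_node="max_iterations",
            )
        # Second entry: the response exists, so the run can complete.
        return StepPlan(node_id="max_iterations",
                        complete_output={"answer": str(resp.get("content") or "")})
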
+
+        # We have a conclusion LLM response. Parse it and complete the run.
+        content, tool_calls = logic.parse_response(resp)
+        answer = str(content or "").strip()
+        temp.pop("max_iterations_llm_response", None)
+
+        # If the model still emitted tool calls, or if it leaked tool-call markup as plain text,
+        # retry once with a stricter instruction.
+        tool_tags = _contains_tool_call_markup(answer)
+        if tool_calls or tool_tags:
+            retries = int(temp.get("max_iterations_conclude_retries", 0) or 0)
+            if retries < 1:
+                temp["max_iterations_conclude_retries"] = retries + 1
+                _push_inbox(
+                    runtime_ns,
+                    "You are out of iterations and tool use is disabled.\n"
+                    "Return ONLY the final report and next steps as plain text.\n"
+                    "Do NOT include any tool calls or tool-call markup (e.g. <tool_call>...</tool_call>).",
+                )
+                return StepPlan(node_id="max_iterations", next_node="max_iterations")
+            # Last resort: strip any leaked tool markup so we don't persist it as the final answer.
+            answer = _strip_tool_call_markup(answer).strip()
+
+        if not answer:
+            # Fallback: avoid returning the last tool observation as the "answer".
+            # Provide a deterministic report so users don't lose scratchpad context.
+            scratch_view = _render_cycles_for_conclusion_prompt(scratchpad)
+            parts = [
+                "Max iterations reached.",
+                "I could not produce a final assistant response in time.",
+            ]
+            if scratch_view:
+                parts.append("## Progress (from scratchpad)\n" + scratch_view)
+            parts.append(
+                "## Next steps\n"
+                "- Increase `max_iterations` and rerun, or use `/conclude` earlier to force a wrap-up.\n"
+                "- If you need me to continue, re-run with a higher iteration budget and I will pick up from the report above."
+            )
+            answer = "\n\n".join(parts).strip()
+
+        # Persist final answer into the conversation history (so it shows up in /history and seeds next runs).
+        messages = context.get("messages")
+        if isinstance(messages, list):
+            last = messages[-1] if messages else None
+            last_role = last.get("role") if isinstance(last, dict) else None
+            last_content = last.get("content") if isinstance(last, dict) else None
+            if last_role != "assistant" or str(last_content or "") != answer:
+                messages.append(_new_message(ctx, role="assistant", content=answer, metadata={"kind": "final_answer"}))
+
+        temp["final_answer"] = answer
+        report = _render_final_report(str(context.get("task") or ""), scratchpad)
+
+        iterations = int(limits.get("current_iteration", 0) or scratchpad.get("iteration", 0) or max_iterations)
         return StepPlan(
             node_id="max_iterations",
             complete_output={
-                "answer":
-                "
-                "
+                "answer": answer,
+                "report": report,
+                "iterations": iterations,
+                "messages": list(context.get("messages") or []),
+                "scratchpad": dict(scratchpad),
             },
         )
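
The `max_iterations_conclude_retries` counter above gives the model exactly one stricter retry; on the second leak the adapter stops looping and sanitizes instead of risking an endless conclude cycle. The counter logic in isolation:

    temp = {}

    # First offense: counter is 0, so push stricter guidance and loop back once.
    retries = int(temp.get("max_iterations_conclude_retries", 0) or 0)
    assert retries == 0
    temp["max_iterations_conclude_retries"] = retries + 1

    # Second offense: counter is now 1, so fall through to _strip_tool_call_markup.
    retries = int(temp.get("max_iterations_conclude_retries", 0) or 0)
    assert retries == 1
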

     return WorkflowSpec(
-        workflow_id="react_agent",
+        workflow_id=str(workflow_id or "react_agent"),
         entry_node="init",
         nodes={
             "init": init_node,
@@ -387,4 +1610,3 @@ def create_react_workflow(
             "max_iterations": max_iterations_node,
         },
     )
-
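
Finally, `workflow_id` is now caller-controlled, which is what lets the `delegate_agent` handler above start a child run of the parent's own workflow. A hedged usage sketch; the exact `create_react_workflow` keyword signature is an assumption inferred from the parameters and free variables visible in this diff, and the provider/model values are placeholders:

    spec = create_react_workflow(provider="lmstudio", model="qwen3-8b",
                                 workflow_id="react_agent")

    assert spec.entry_node == "init"
    assert "max_iterations" in spec.nodes  # the conclude node registered above
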