jaf-py 2.5.3__py3-none-any.whl → 2.5.5__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
jaf/__init__.py CHANGED
@@ -191,7 +191,7 @@ def generate_run_id() -> RunId:
     """Generate a new run ID."""
     return create_run_id(str(uuid.uuid4()))
 
-__version__ = "2.5.3"
+__version__ = "2.5.5"
 __all__ = [
     # Core types and functions
     "TraceId", "RunId", "ValidationResult", "Message", "ModelConfig",
jaf/core/engine.py CHANGED
@@ -293,15 +293,7 @@ async def _load_conversation_history(state: RunState[Ctx], config: RunConfig[Ctx
     # For HITL scenarios, append new messages to memory messages
     # This prevents duplication when resuming from interruptions
     if memory_messages:
-        combined_messages = memory_messages + [
-            msg for msg in state.messages
-            if not any(
-                mem_msg.role == msg.role and
-                mem_msg.content == msg.content and
-                getattr(mem_msg, 'tool_calls', None) == getattr(msg, 'tool_calls', None)
-                for mem_msg in memory_messages
-            )
-        ]
+        combined_messages = memory_messages + list(state.messages)
     else:
         combined_messages = list(state.messages)
 
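Note: the replacement drops the field-by-field de-duplication pass and simply concatenates the memory messages with the current run's messages. A minimal sketch of the behavioral difference, using plain strings as stand-ins for Message objects:

    # Stand-ins for Message objects; "m2" is present both in memory and in
    # the resumed run state.
    memory_messages = ["m1", "m2"]
    state_messages = ["m2", "m3"]

    # 2.5.3 filtered out state messages already present in memory;
    # 2.5.5 keeps them verbatim, so an overlapping message now appears twice.
    combined_messages = memory_messages + list(state_messages)
    assert combined_messages == ["m1", "m2", "m2", "m3"]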
@@ -535,6 +527,17 @@ async def _run_internal(
         "gpt-4o"
     )
 
+    # Apply before_llm_call callback if provided
+    if config.before_llm_call:
+        if asyncio.iscoroutinefunction(config.before_llm_call):
+            state = await config.before_llm_call(state, current_agent)
+        else:
+            result = config.before_llm_call(state, current_agent)
+            if asyncio.iscoroutine(result):
+                state = await result
+            else:
+                state = result
+
     # Emit LLM call start event
     if config.on_event:
         config.on_event(LLMCallStartEvent(data=to_event_data(LLMCallStartEventData(
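The engine invokes before_llm_call with (state, current_agent) and accepts a plain function, a coroutine function, or a plain function that returns a coroutine; whatever it yields becomes the new run state. A minimal sketch of a compatible hook, based only on the call shape above (the RunConfig field's exact type is not shown in this diff):

    # Hypothetical hook: receives the run state and the current agent and
    # must return the (possibly replaced) state. It may be sync or async.
    async def log_before_llm_call(state, agent):
        print(f"about to call the model for agent {agent.name}")
        return state

    # Assumed wiring: config = RunConfig(..., before_llm_call=log_before_llm_call)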
@@ -546,121 +549,157 @@ async def _run_internal(
         messages=state.messages
     ))))
 
-    # Get completion from model provider, prefer streaming if available
+    # Retry logic for empty LLM responses
     llm_response: Dict[str, Any]
     assistant_event_streamed = False
-
-    get_stream = getattr(config.model_provider, "get_completion_stream", None)
-    if callable(get_stream):
-        try:
-            aggregated_text = ""
-            # Working array of partial tool calls
-            partial_tool_calls: List[Dict[str, Any]] = []
-
-            async for chunk in get_stream(state, current_agent, config): # type: ignore[arg-type]
-                # Text deltas
-                delta_text = getattr(chunk, "delta", None)
-                if delta_text:
-                    aggregated_text += delta_text
-
-                # Tool call deltas
-                tcd = getattr(chunk, "tool_call_delta", None)
-                if tcd is not None:
-                    idx = getattr(tcd, "index", 0) or 0
-                    # Ensure slot exists
-                    while len(partial_tool_calls) <= idx:
-                        partial_tool_calls.append({
-                            "id": None,
-                            "type": "function",
-                            "function": {"name": None, "arguments": ""}
-                        })
-                    target = partial_tool_calls[idx]
-                    # id
-                    tc_id = getattr(tcd, "id", None)
-                    if tc_id:
-                        target["id"] = tc_id
-                    # function fields
-                    fn = getattr(tcd, "function", None)
-                    if fn is not None:
-                        fn_name = getattr(fn, "name", None)
-                        if fn_name:
-                            target["function"]["name"] = fn_name
-                        args_delta = getattr(fn, "arguments_delta", None)
-                        if args_delta:
-                            target["function"]["arguments"] += args_delta
-
-                # Emit partial assistant message when something changed
-                if delta_text or tcd is not None:
-                    assistant_event_streamed = True
-                    # Normalize tool_calls for message
-                    message_tool_calls = None
-                    if len(partial_tool_calls) > 0:
-                        message_tool_calls = []
-                        for i, tc in enumerate(partial_tool_calls):
-                            arguments = tc["function"]["arguments"]
-                            if isinstance(arguments, str):
-                                arguments = _normalize_tool_call_arguments(arguments)
-                            message_tool_calls.append({
-                                "id": tc["id"] or f"call_{i}",
+
+    for retry_attempt in range(config.max_empty_response_retries + 1):
+        # Get completion from model provider, prefer streaming if available
+        get_stream = getattr(config.model_provider, "get_completion_stream", None)
+        if callable(get_stream):
+            try:
+                aggregated_text = ""
+                # Working array of partial tool calls
+                partial_tool_calls: List[Dict[str, Any]] = []
+
+                async for chunk in get_stream(state, current_agent, config): # type: ignore[arg-type]
+                    # Text deltas
+                    delta_text = getattr(chunk, "delta", None)
+                    if delta_text:
+                        aggregated_text += delta_text
+
+                    # Tool call deltas
+                    tcd = getattr(chunk, "tool_call_delta", None)
+                    if tcd is not None:
+                        idx = getattr(tcd, "index", 0) or 0
+                        # Ensure slot exists
+                        while len(partial_tool_calls) <= idx:
+                            partial_tool_calls.append({
+                                "id": None,
                                 "type": "function",
-                                "function": {
-                                    "name": tc["function"]["name"] or "",
-                                    "arguments": arguments
-                                }
+                                "function": {"name": None, "arguments": ""}
                             })
+                        target = partial_tool_calls[idx]
+                        # id
+                        tc_id = getattr(tcd, "id", None)
+                        if tc_id:
+                            target["id"] = tc_id
+                        # function fields
+                        fn = getattr(tcd, "function", None)
+                        if fn is not None:
+                            fn_name = getattr(fn, "name", None)
+                            if fn_name:
+                                target["function"]["name"] = fn_name
+                            args_delta = getattr(fn, "arguments_delta", None)
+                            if args_delta:
+                                target["function"]["arguments"] += args_delta
+
+                    # Emit partial assistant message when something changed
+                    if delta_text or tcd is not None:
+                        assistant_event_streamed = True
+                        # Normalize tool_calls for message
+                        message_tool_calls = None
+                        if len(partial_tool_calls) > 0:
+                            message_tool_calls = []
+                            for i, tc in enumerate(partial_tool_calls):
+                                arguments = tc["function"]["arguments"]
+                                if isinstance(arguments, str):
+                                    arguments = _normalize_tool_call_arguments(arguments)
+                                message_tool_calls.append({
+                                    "id": tc["id"] or f"call_{i}",
+                                    "type": "function",
+                                    "function": {
+                                        "name": tc["function"]["name"] or "",
+                                        "arguments": arguments
+                                    }
+                                })
+
+                        partial_msg = Message(
+                            role=ContentRole.ASSISTANT,
+                            content=aggregated_text or "",
+                            tool_calls=None if not message_tool_calls else [
+                                ToolCall(
+                                    id=mc["id"],
+                                    type="function",
+                                    function=ToolCallFunction(
+                                        name=mc["function"]["name"],
+                                        arguments=_normalize_tool_call_arguments(mc["function"]["arguments"])
+                                    ),
+                                ) for mc in message_tool_calls
+                            ],
+                        )
+                        try:
+                            if config.on_event:
+                                config.on_event(AssistantMessageEvent(data=to_event_data(
+                                    AssistantMessageEventData(message=partial_msg)
+                                )))
+                        except Exception as _e:
+                            # Do not fail the run on callback errors
+                            pass
+
+                # Build final response object compatible with downstream logic
+                final_tool_calls = None
+                if len(partial_tool_calls) > 0:
+                    final_tool_calls = []
+                    for i, tc in enumerate(partial_tool_calls):
+                        arguments = tc["function"]["arguments"]
+                        if isinstance(arguments, str):
+                            arguments = _normalize_tool_call_arguments(arguments)
+                        final_tool_calls.append({
+                            "id": tc["id"] or f"call_{i}",
+                            "type": "function",
+                            "function": {
+                                "name": tc["function"]["name"] or "",
+                                "arguments": arguments
+                            }
+                        })
 
-                    partial_msg = Message(
-                        role=ContentRole.ASSISTANT,
-                        content=aggregated_text or "",
-                        tool_calls=None if not message_tool_calls else [
-                            ToolCall(
-                                id=mc["id"],
-                                type="function",
-                                function=ToolCallFunction(
-                                    name=mc["function"]["name"],
-                                    arguments=_normalize_tool_call_arguments(mc["function"]["arguments"])
-                                ),
-                            ) for mc in message_tool_calls
-                        ],
-                    )
-                    try:
-                        if config.on_event:
-                            config.on_event(AssistantMessageEvent(data=to_event_data(
-                                AssistantMessageEventData(message=partial_msg)
-                            )))
-                    except Exception as _e:
-                        # Do not fail the run on callback errors
-                        pass
-
-            # Build final response object compatible with downstream logic
-            final_tool_calls = None
-            if len(partial_tool_calls) > 0:
-                final_tool_calls = []
-                for i, tc in enumerate(partial_tool_calls):
-                    arguments = tc["function"]["arguments"]
-                    if isinstance(arguments, str):
-                        arguments = _normalize_tool_call_arguments(arguments)
-                    final_tool_calls.append({
-                        "id": tc["id"] or f"call_{i}",
-                        "type": "function",
-                        "function": {
-                            "name": tc["function"]["name"] or "",
-                            "arguments": arguments
-                        }
-                    })
-
-            llm_response = {
-                "message": {
-                    "content": aggregated_text or None,
-                    "tool_calls": final_tool_calls
+                llm_response = {
+                    "message": {
+                        "content": aggregated_text or None,
+                        "tool_calls": final_tool_calls
+                    }
                 }
-            }
-        except Exception:
-            # Fallback to non-streaming on error
-            assistant_event_streamed = False
+            except Exception:
+                # Fallback to non-streaming on error
+                assistant_event_streamed = False
+                llm_response = await config.model_provider.get_completion(state, current_agent, config)
+        else:
             llm_response = await config.model_provider.get_completion(state, current_agent, config)
-    else:
-        llm_response = await config.model_provider.get_completion(state, current_agent, config)
+
+        # Check if response has meaningful content
+        has_content = llm_response.get('message', {}).get('content')
+        has_tool_calls = llm_response.get('message', {}).get('tool_calls')
+
+        # If we got a valid response, break out of retry loop
+        if has_content or has_tool_calls:
+            break
+
+        # If this is not the last attempt, retry with exponential backoff
+        if retry_attempt < config.max_empty_response_retries:
+            delay = config.empty_response_retry_delay * (2 ** retry_attempt)
+            if config.log_empty_responses:
+                print(f"[JAF:ENGINE] Empty LLM response on attempt {retry_attempt + 1}/{config.max_empty_response_retries + 1}, retrying in {delay:.1f}s...")
+                print(f"[JAF:ENGINE] Response had message: {bool(llm_response.get('message'))}, content: {bool(has_content)}, tool_calls: {bool(has_tool_calls)}")
+            await asyncio.sleep(delay)
+        else:
+            # Last attempt failed, log detailed diagnostic info
+            if config.log_empty_responses:
+                print(f"[JAF:ENGINE] Empty LLM response after {config.max_empty_response_retries + 1} attempts")
+                print(f"[JAF:ENGINE] Agent: {current_agent.name}, Model: {model}")
+                print(f"[JAF:ENGINE] Message count: {len(state.messages)}, Turn: {state.turn_count}")
+                print(f"[JAF:ENGINE] Response structure: {json.dumps(llm_response, indent=2)[:1000]}")
+
+    # Apply after_llm_call callback if provided
+    if config.after_llm_call:
+        if asyncio.iscoroutinefunction(config.after_llm_call):
+            llm_response = await config.after_llm_call(state, llm_response)
+        else:
+            result = config.after_llm_call(state, llm_response)
+            if asyncio.iscoroutine(result):
+                llm_response = await result
+            else:
+                llm_response = result
 
     # Emit LLM call end event
     if config.on_event:
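Two behaviors worth noting in this hunk: the retry loop backs off exponentially from empty_response_retry_delay, and after_llm_call is invoked with (state, llm_response) and must return the (possibly rewritten) response dict. A short sketch of the backoff schedule the loop computes, assuming a base delay of 1.0s and two retries (the actual defaults are not visible in this diff):

    # Mirrors `delay = config.empty_response_retry_delay * (2 ** retry_attempt)`.
    empty_response_retry_delay = 1.0  # hypothetical base delay in seconds
    max_empty_response_retries = 2    # hypothetical retry budget

    for retry_attempt in range(max_empty_response_retries):
        delay = empty_response_retry_delay * (2 ** retry_attempt)
        print(f"retry {retry_attempt + 1}: sleeping {delay:.1f}s")
    # retry 1: sleeping 1.0s
    # retry 2: sleeping 2.0s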
@@ -673,6 +712,9 @@ async def _run_internal(
 
     # Check if response has message
     if not llm_response.get('message'):
+        if config.log_empty_responses:
+            print(f"[JAF:ENGINE] ERROR: No message in LLM response")
+            print(f"[JAF:ENGINE] Response structure: {json.dumps(llm_response, indent=2)[:500]}")
         return RunResult(
             final_state=state,
             outcome=ErrorOutcome(error=ModelBehaviorError(
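For context, this is the error path a caller sees when the model returns no message even after the retries above: the run ends with a ModelBehaviorError wrapped in an ErrorOutcome. A hypothetical caller-side check, assuming only the attribute shapes visible in this hunk (RunResult.outcome, ErrorOutcome.error):

    # Duck-typed check: ErrorOutcome carries an `error` attribute, as the
    # constructor call above shows; a success outcome presumably does not.
    def describe(result) -> str:
        error = getattr(result.outcome, "error", None)
        return f"run failed: {error}" if error is not None else "run completed"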