synth-ai 0.2.9.dev4__py3-none-any.whl → 0.2.9.dev7__py3-none-any.whl
This diff compares the contents of two publicly released package versions as they appear in their public registries; it is provided for informational purposes only.
Potentially problematic release: this version of synth-ai might be problematic.
- examples/common_old/backend.py +0 -1
- examples/crafter_debug_render.py +15 -6
- examples/evals_old/compare_models.py +1 -0
- examples/finetuning_old/_backup_synth_qwen/filter_traces_achievements.py +6 -2
- examples/finetuning_old/_backup_synth_qwen/react_agent_lm.py +4 -4
- examples/finetuning_old/_backup_synth_qwen/sft_kickoff.py +4 -3
- examples/finetuning_old/synth_qwen_v1/filter_traces_achievements.py +6 -2
- examples/finetuning_old/synth_qwen_v1/finetune.py +1 -1
- examples/finetuning_old/synth_qwen_v1/hello_ft_model.py +4 -4
- examples/finetuning_old/synth_qwen_v1/infer.py +1 -2
- examples/finetuning_old/synth_qwen_v1/poll.py +4 -2
- examples/finetuning_old/synth_qwen_v1/prepare_data.py +8 -8
- examples/finetuning_old/synth_qwen_v1/react_agent_lm.py +5 -4
- examples/finetuning_old/synth_qwen_v1/run_crafter_sft_job.py +11 -8
- examples/finetuning_old/synth_qwen_v1/run_ft_job.py +17 -12
- examples/finetuning_old/synth_qwen_v1/upload_data.py +1 -1
- examples/finetuning_old/synth_qwen_v1/util.py +7 -2
- examples/rl/configs/eval_base_qwen.toml +1 -1
- examples/rl/configs/rl_from_base_qwen17.toml +1 -1
- examples/rl/download_dataset.py +26 -10
- examples/rl/run_eval.py +17 -15
- examples/rl/run_rl_and_save.py +24 -7
- examples/rl/task_app/math_single_step.py +128 -11
- examples/rl/task_app/math_task_app.py +11 -3
- examples/rl_old/task_app.py +222 -53
- examples/warming_up_to_rl/analyze_trace_db.py +7 -5
- examples/warming_up_to_rl/export_trace_sft.py +141 -16
- examples/warming_up_to_rl/groq_test.py +11 -4
- examples/warming_up_to_rl/manage_secrets.py +15 -6
- examples/warming_up_to_rl/readme.md +9 -2
- examples/warming_up_to_rl/run_eval.py +108 -30
- examples/warming_up_to_rl/run_fft_and_save.py +128 -52
- examples/warming_up_to_rl/run_local_rollout.py +87 -36
- examples/warming_up_to_rl/run_local_rollout_modal.py +113 -25
- examples/warming_up_to_rl/run_local_rollout_parallel.py +80 -16
- examples/warming_up_to_rl/run_local_rollout_traced.py +125 -20
- examples/warming_up_to_rl/run_rl_and_save.py +31 -7
- examples/warming_up_to_rl/run_rollout_remote.py +37 -10
- examples/warming_up_to_rl/task_app/grpo_crafter.py +90 -27
- examples/warming_up_to_rl/task_app/grpo_crafter_task_app.py +9 -27
- examples/warming_up_to_rl/task_app/synth_envs_hosted/environment_routes.py +46 -108
- examples/warming_up_to_rl/task_app/synth_envs_hosted/envs/__init__.py +1 -1
- examples/warming_up_to_rl/task_app/synth_envs_hosted/envs/crafter/__init__.py +1 -1
- examples/warming_up_to_rl/task_app/synth_envs_hosted/envs/crafter/app.py +1 -1
- examples/warming_up_to_rl/task_app/synth_envs_hosted/envs/crafter/environment.py +50 -17
- examples/warming_up_to_rl/task_app/synth_envs_hosted/envs/crafter/policy.py +35 -21
- examples/warming_up_to_rl/task_app/synth_envs_hosted/envs/crafter/react_agent.py +8 -4
- examples/warming_up_to_rl/task_app/synth_envs_hosted/envs/crafter/shared.py +29 -26
- examples/warming_up_to_rl/task_app/synth_envs_hosted/envs/crafter/tools.py +1 -1
- examples/warming_up_to_rl/task_app/synth_envs_hosted/hosted_app.py +17 -13
- examples/warming_up_to_rl/task_app/synth_envs_hosted/inference/__init__.py +1 -1
- examples/warming_up_to_rl/task_app/synth_envs_hosted/inference/openai_client.py +106 -63
- examples/warming_up_to_rl/task_app/synth_envs_hosted/policy_routes.py +82 -84
- examples/warming_up_to_rl/task_app/synth_envs_hosted/rollout.py +76 -59
- examples/warming_up_to_rl/task_app/synth_envs_hosted/storage/__init__.py +1 -1
- examples/warming_up_to_rl/task_app/synth_envs_hosted/storage/volume.py +43 -49
- examples/warming_up_to_rl/task_app/synth_envs_hosted/test_service.py +5 -15
- synth_ai/__init__.py +1 -0
- synth_ai/api/train/builders.py +34 -10
- synth_ai/api/train/cli.py +172 -32
- synth_ai/api/train/config_finder.py +59 -4
- synth_ai/api/train/env_resolver.py +32 -14
- synth_ai/api/train/pollers.py +11 -3
- synth_ai/api/train/task_app.py +4 -1
- synth_ai/api/train/utils.py +20 -4
- synth_ai/cli/__init__.py +11 -4
- synth_ai/cli/balance.py +1 -1
- synth_ai/cli/demo.py +19 -5
- synth_ai/cli/rl_demo.py +75 -16
- synth_ai/cli/root.py +116 -37
- synth_ai/cli/task_apps.py +1286 -170
- synth_ai/cli/traces.py +1 -0
- synth_ai/cli/turso.py +73 -0
- synth_ai/core/experiment.py +0 -2
- synth_ai/demo_registry.py +67 -30
- synth_ai/demos/core/cli.py +493 -164
- synth_ai/demos/demo_task_apps/core.py +50 -6
- synth_ai/demos/demo_task_apps/crafter/configs/crafter_fft_4b.toml +2 -3
- synth_ai/demos/demo_task_apps/crafter/grpo_crafter_task_app.py +36 -28
- synth_ai/demos/demo_task_apps/math/_common.py +1 -2
- synth_ai/demos/demo_task_apps/math/deploy_modal.py +0 -2
- synth_ai/demos/demo_task_apps/math/modal_task_app.py +168 -65
- synth_ai/demos/demo_task_apps/math/task_app_entry.py +0 -1
- synth_ai/environments/examples/bandit/engine.py +12 -4
- synth_ai/environments/examples/bandit/taskset.py +4 -4
- synth_ai/environments/reproducibility/tree.py +3 -1
- synth_ai/environments/service/core_routes.py +6 -2
- synth_ai/evals/base.py +0 -2
- synth_ai/experimental/synth_oss.py +11 -12
- synth_ai/handshake.py +3 -1
- synth_ai/http_client.py +31 -7
- synth_ai/inference/__init__.py +0 -2
- synth_ai/inference/client.py +8 -4
- synth_ai/jobs/client.py +40 -10
- synth_ai/learning/client.py +33 -8
- synth_ai/learning/config.py +0 -2
- synth_ai/learning/constants.py +0 -2
- synth_ai/learning/ft_client.py +6 -3
- synth_ai/learning/health.py +9 -2
- synth_ai/learning/jobs.py +17 -5
- synth_ai/learning/prompts/hello_world_in_context_injection_ex.py +1 -3
- synth_ai/learning/prompts/random_search.py +4 -1
- synth_ai/learning/prompts/run_random_search_banking77.py +6 -1
- synth_ai/learning/rl_client.py +42 -14
- synth_ai/learning/sse.py +0 -2
- synth_ai/learning/validators.py +6 -2
- synth_ai/lm/caching/ephemeral.py +1 -3
- synth_ai/lm/core/exceptions.py +0 -2
- synth_ai/lm/core/main.py +13 -1
- synth_ai/lm/core/synth_models.py +0 -1
- synth_ai/lm/core/vendor_clients.py +4 -2
- synth_ai/lm/overrides.py +2 -2
- synth_ai/lm/vendors/core/anthropic_api.py +7 -7
- synth_ai/lm/vendors/core/openai_api.py +2 -0
- synth_ai/lm/vendors/openai_standard.py +3 -1
- synth_ai/lm/vendors/openai_standard_responses.py +6 -3
- synth_ai/lm/vendors/supported/custom_endpoint.py +1 -3
- synth_ai/lm/vendors/synth_client.py +37 -10
- synth_ai/rl/__init__.py +0 -1
- synth_ai/rl/contracts.py +0 -2
- synth_ai/rl/env_keys.py +6 -1
- synth_ai/task/__init__.py +1 -0
- synth_ai/task/apps/__init__.py +11 -11
- synth_ai/task/auth.py +29 -17
- synth_ai/task/client.py +3 -1
- synth_ai/task/contracts.py +1 -0
- synth_ai/task/datasets.py +3 -1
- synth_ai/task/errors.py +3 -2
- synth_ai/task/health.py +0 -2
- synth_ai/task/json.py +0 -1
- synth_ai/task/proxy.py +2 -5
- synth_ai/task/rubrics.py +9 -3
- synth_ai/task/server.py +31 -5
- synth_ai/task/tracing_utils.py +8 -3
- synth_ai/task/validators.py +0 -1
- synth_ai/task/vendors.py +0 -1
- synth_ai/tracing_v3/db_config.py +26 -1
- synth_ai/tracing_v3/decorators.py +1 -0
- synth_ai/tracing_v3/examples/basic_usage.py +3 -2
- synth_ai/tracing_v3/hooks.py +2 -0
- synth_ai/tracing_v3/replica_sync.py +1 -0
- synth_ai/tracing_v3/session_tracer.py +24 -3
- synth_ai/tracing_v3/storage/base.py +4 -1
- synth_ai/tracing_v3/storage/factory.py +0 -1
- synth_ai/tracing_v3/turso/manager.py +102 -38
- synth_ai/tracing_v3/turso/models.py +4 -1
- synth_ai/tracing_v3/utils.py +1 -0
- synth_ai/v0/tracing/upload.py +32 -135
- {synth_ai-0.2.9.dev4.dist-info → synth_ai-0.2.9.dev7.dist-info}/METADATA +1 -1
- {synth_ai-0.2.9.dev4.dist-info → synth_ai-0.2.9.dev7.dist-info}/RECORD +154 -156
- examples/warming_up_to_rl/task_app/synth_envs_hosted/test_stepwise_rewards.py +0 -58
- synth_ai/environments/examples/sokoban/units/astar_common.py +0 -95
- synth_ai/install_sqld.sh +0 -40
- {synth_ai-0.2.9.dev4.dist-info → synth_ai-0.2.9.dev7.dist-info}/WHEEL +0 -0
- {synth_ai-0.2.9.dev4.dist-info → synth_ai-0.2.9.dev7.dist-info}/entry_points.txt +0 -0
- {synth_ai-0.2.9.dev4.dist-info → synth_ai-0.2.9.dev7.dist-info}/licenses/LICENSE +0 -0
- {synth_ai-0.2.9.dev4.dist-info → synth_ai-0.2.9.dev7.dist-info}/top_level.txt +0 -0
examples/warming_up_to_rl/task_app/synth_envs_hosted/inference/openai_client.py

```diff
@@ -11,7 +11,7 @@ logger = logging.getLogger(__name__)
 
 class OpenAIClient:
     """Async HTTP client for OpenAI-compatible inference servers (vLLM)."""
-
+
     def __init__(
         self,
         base_url: str,
@@ -22,11 +22,13 @@ class OpenAIClient:
         self.api_key = api_key
         self.timeout_s = timeout_s
         self.headers = {}
-
+
         if api_key:
             self.headers["Authorization"] = f"Bearer {api_key}"
 
-    def _fix_model_parameters(self, request: Dict[str, Any], target_url: Optional[str] = None) -> Dict[str, Any]:
+    def _fix_model_parameters(
+        self, request: Dict[str, Any], target_url: Optional[str] = None
+    ) -> Dict[str, Any]:
         """
         Fix parameter compatibility for newer OpenAI models.
 
@@ -75,7 +77,9 @@ class OpenAIClient:
         if "max_tokens" in fixed_request:
             if "max_completion_tokens" not in fixed_request:
                 fixed_request["max_completion_tokens"] = fixed_request.pop("max_tokens")
-                logger.info(f"Converted max_tokens to max_completion_tokens for model {model}")
+                logger.info(
+                    f"Converted max_tokens to max_completion_tokens for model {model}"
+                )
             else:
                 fixed_request.pop("max_tokens")
                 logger.info(f"Removed conflicting max_tokens parameter for model {model}")
```
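The hunk above only rewraps the logging around the client's `max_tokens` compatibility fix: a request that still carries `max_tokens` has the value moved to `max_completion_tokens`, and when both keys are present the legacy one is dropped. A minimal sketch of that conversion (the standalone helper below is for illustration only, not part of the package's API):

```python
# Sketch of the max_tokens fix-up visible in the hunk above. The real
# _fix_model_parameters method carries more context (model detection,
# other parameter rewrites); this reproduces only the conversion shown.
from typing import Any, Dict


def fix_max_tokens(request: Dict[str, Any]) -> Dict[str, Any]:
    fixed_request = dict(request)
    if "max_tokens" in fixed_request:
        if "max_completion_tokens" not in fixed_request:
            # Newer OpenAI models expect max_completion_tokens; carry the value over.
            fixed_request["max_completion_tokens"] = fixed_request.pop("max_tokens")
        else:
            # Both present: drop the conflicting legacy parameter.
            fixed_request.pop("max_tokens")
    return fixed_request


print(fix_max_tokens({"model": "example-model", "max_tokens": 256}))
# -> {'model': 'example-model', 'max_completion_tokens': 256}
```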
```diff
@@ -145,7 +149,9 @@ class OpenAIClient:
             logger.info("Removed stop_after_tool_calls for OpenAI request")
         # Groq-specific requirement: when using JSON mode, one of the messages must contain the word 'json'
         low_url = url.lower()
-        if ("groq.com" in low_url or "/openai" in low_url) and isinstance(processed_request, dict):
+        if ("groq.com" in low_url or "/openai" in low_url) and isinstance(
+            processed_request, dict
+        ):
             rf = processed_request.get("response_format")
             rf_type = None
             if isinstance(rf, dict):
@@ -164,7 +170,9 @@ class OpenAIClient:
                         # Join any text segments
                         parts = []
                         for seg in content:
-                            if isinstance(seg, dict) and isinstance(seg.get("text"), str):
+                            if isinstance(seg, dict) and isinstance(
+                                seg.get("text"), str
+                            ):
                                 parts.append(seg["text"])
                         text = "\n".join(parts)
                         if isinstance(text, str) and ("json" in text.lower()):
@@ -174,13 +182,17 @@ class OpenAIClient:
                         continue
                 if not has_json_word:
                     try:
-                        instruction = "Respond in strict JSON only. Output a single valid JSON object."
+                        instruction = (
+                            "Respond in strict JSON only. Output a single valid JSON object."
+                        )
                         if not isinstance(msgs, list):
                             msgs = []
                         # Prepend a system message to satisfy Groq requirement without changing user intent
                         prepend = {"role": "system", "content": instruction}
                         processed_request["messages"] = [prepend] + list(msgs)
-                        logger.info("Injected JSON-mode system instruction for Groq response_format compliance")
+                        logger.info(
+                            "Injected JSON-mode system instruction for Groq response_format compliance"
+                        )
                     except Exception:
                         pass
             except Exception:
```
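These hunks rewrap the Groq JSON-mode guard: when JSON `response_format` is requested, at least one message must contain the word "json", so the client scans message content (including list-form segments) and prepends a system instruction if the word is missing. A simplified sketch of the same check, assuming plain string content only:

```python
# Sketch of the Groq JSON-mode guard from the hunks above; the packaged
# client also flattens list-form content segments before this check.
from typing import Any, Dict, List


def ensure_json_word(messages: List[Dict[str, Any]]) -> List[Dict[str, Any]]:
    has_json_word = any(
        isinstance(m.get("content"), str) and "json" in m["content"].lower()
        for m in messages
    )
    if has_json_word:
        return messages
    instruction = "Respond in strict JSON only. Output a single valid JSON object."
    # Prepend a system message to satisfy the requirement without changing user intent.
    return [{"role": "system", "content": instruction}, *messages]
```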
```diff
@@ -194,7 +206,7 @@ class OpenAIClient:
                     headers=headers,
                 )
                 response.raise_for_status()
-
+
                 # Rich response diagnostics
                 content_type = response.headers.get("content-type")
                 body_text = response.text
@@ -203,12 +215,14 @@ class OpenAIClient:
                 )
                 if body_text:
                     preview_len = min(800, len(body_text))
-                    logger.info(f"Inference response preview ({preview_len} bytes): {body_text[:preview_len]}")
+                    logger.info(
+                        f"Inference response preview ({preview_len} bytes): {body_text[:preview_len]}"
+                    )
 
                 result = response.json()
                 logger.info(f"Inference response parsed_type={type(result).__name__}")
                 return result
-
+
         except httpx.TimeoutException:
             logger.error(f"Request to {url} timed out after {timeout}s")
             raise
@@ -217,12 +231,14 @@ class OpenAIClient:
             text = e.response.text if e.response is not None else str(e)
             # Log full body for debugging remote failures
             try:
-                logger.error(
-
-
-
-
-
+                logger.error(
+                    {
+                        "openai_http_error": True,
+                        "status": status,
+                        "url": url,
+                        "body": text,
+                    }
+                )
             except Exception:
                 logger.error(f"HTTP error from {url}: {status} - {text}")
             # For 4xx/5xx, print full sanitized request to aid debugging (especially Groq 400s)
@@ -230,13 +246,15 @@ class OpenAIClient:
             redacted_headers = dict(headers)
             if "Authorization" in redacted_headers:
                 redacted_headers["Authorization"] = "***REDACTED***"
-            logger.error(
-
-
-
-
-
-
+            logger.error(
+                {
+                    "request_debug": True,
+                    "status": status,
+                    "target": url,
+                    "headers": redacted_headers,
+                    "payload": processed_request,
+                }
+            )
         except Exception:
             pass
         # Special case: token budget exceeded (OpenAI-compatible error schema)
@@ -270,23 +288,38 @@ class OpenAIClient:
         try:
             tools_arr = processed_request.get("tools") or []
             if isinstance(tools_arr, list) and tools_arr:
-                f = tools_arr[0].get("function") if isinstance(tools_arr[0], dict) else None
-                cand = (f or {}).get("name") if isinstance(f, dict) else None
+                f = (
+                    tools_arr[0].get("function")
+                    if isinstance(tools_arr[0], dict)
+                    else None
+                )
+                cand = (
+                    (f or {}).get("name")
+                    if isinstance(f, dict)
+                    else None
+                )
                 if isinstance(cand, str) and cand:
                     func_name = cand
         except Exception:
             pass
-        processed_request["tool_choice"] = {"type": "function", "function": {"name": func_name}}
+        processed_request["tool_choice"] = {
+            "type": "function",
+            "function": {"name": func_name},
+        }
         processed_request["parallel_tool_calls"] = False
-        logger.warning(
-
-
-
-
-
+        logger.warning(
+            {
+                "token_budget_recovery": True,
+                "messages_tokens": messages_tokens,
+                "model_limit": model_limit,
+                "retry_max_tokens": new_max,
+            }
+        )
         # Retry once with reduced budget
         async with httpx.AsyncClient(timeout=timeout) as client2:
-            r2 = await client2.post(url, json=processed_request, headers=headers)
+            r2 = await client2.post(
+                url, json=processed_request, headers=headers
+            )
             r2.raise_for_status()
             return r2.json()
     except Exception:
@@ -302,14 +335,17 @@ class OpenAIClient:
                         err = e.response.json()
                     except Exception:
                         err = {"error": "unprocessable", "detail": (text or "")[:200]}
-                    logger.warning(
-
-
-
+                    logger.warning(
+                        {
+                            "inference_422_recovered": True,
+                            "detail": err,
+                        }
+                    )
                 except Exception:
                     pass
                 # Return a minimal OpenAI-compatible response with no tool_calls/content
                 import time as _t
+
                 return {
                     "id": f"cmpl-{int(_t.time())}",
                     "object": "chat.completion",
@@ -328,7 +364,7 @@ class OpenAIClient:
         except Exception as e:
             logger.error(f"Unexpected error calling {url}: {e}")
             raise
-
+
     async def check_health(
         self,
         base_url: Optional[str] = None,
@@ -336,17 +372,17 @@ class OpenAIClient:
     ) -> Dict[str, Any]:
         """
         Check if the inference service is healthy.
-
+
         Args:
             base_url: Override base URL for this request
             timeout_s: Override timeout for this request
-
+
         Returns:
             Health status dict with 'status' field
         """
         url = (base_url or self.base_url).rstrip("/") + "/health"
         timeout = timeout_s or 10.0
-
+
         try:
             async with httpx.AsyncClient(timeout=timeout) as client:
                 response = await client.get(url, headers=self.headers)
@@ -364,7 +400,7 @@ class OpenAIClient:
                 return {"status": "unhealthy", "error": str(e)}
             except Exception as e:
                 return {"status": "unhealthy", "error": str(e)}
-
+
     async def generate_with_retries(
         self,
         request: Dict[str, Any],
@@ -376,7 +412,7 @@ class OpenAIClient:
     ) -> Dict[str, Any]:
         """
         Generate with exponential backoff retries for transient errors.
-
+
         Args:
             request: OpenAI-compatible chat completion request
             base_url: Override base URL
@@ -384,13 +420,13 @@ class OpenAIClient:
             max_retries: Maximum number of retry attempts
            backoff_factor: Exponential backoff multiplier
             extra_headers: Additional headers to include (e.g., X-Policy-Name)
-
+
         Returns:
             OpenAI-compatible chat completion response
         """
         last_error = None
         wait_time = 1.0
-
+
         for attempt in range(max_retries + 1):
             try:
                 # Apply parameter fixes to the request
@@ -417,7 +453,9 @@ class OpenAIClient:
                         retry_after = response_data.get("retry_after", 1)
                         # Use the suggested retry_after time instead of exponential backoff for overload
                         wait_time = max(wait_time, float(retry_after))
-                        logger.warning(f"Inference service overloaded (400). {response_data} Retrying after {wait_time}s...")
+                        logger.warning(
+                            f"Inference service overloaded (400). {response_data} Retrying after {wait_time}s..."
+                        )
                     else:
                         # This is a different type of 400 error, don't retry
                         try:
@@ -428,13 +466,15 @@ class OpenAIClient:
                                 redacted_headers["Authorization"] = "***REDACTED***"
                             except Exception:
                                 redacted_headers = {}
-                            logger.error(
-
-
-
-
-
-
+                            logger.error(
+                                {
+                                    "non_overload_400": True,
+                                    "target": (base_url or self.base_url),
+                                    "payload": processed_request,
+                                    "headers": redacted_headers,
+                                    "body": e.response.text if e.response is not None else None,
+                                }
+                            )
                         except Exception:
                             pass
                         raise RuntimeError(
@@ -443,11 +483,13 @@ class OpenAIClient:
                     except Exception:
                         # If we can't parse the response, don't retry 400 errors
                         try:
-                            logger.error(
-
-
-
-
+                            logger.error(
+                                {
+                                    "non_overload_400_unparsed": True,
+                                    "target": (base_url or self.base_url),
+                                    "payload": processed_request,
+                                }
+                            )
                         except Exception:
                             pass
                         raise RuntimeError(
@@ -472,7 +514,7 @@ class OpenAIClient:
                 )
             except httpx.TimeoutException as e:
                 last_error = e
-
+
                 if attempt < max_retries:
                     logger.warning(
                         f"Inference request failed (attempt {attempt + 1}/{max_retries + 1}), "
@@ -480,7 +522,7 @@ class OpenAIClient:
                     )
                     await asyncio.sleep(wait_time)
                     wait_time *= backoff_factor
-
+
         raise last_error
 
 
@@ -490,11 +532,11 @@ def create_inference_client(
 ) -> OpenAIClient:
     """
     Create an inference client using TaskApp configuration.
-
+
     Args:
         task_app: TaskApp instance with vllm_base_url
         api_key: Optional API key for authentication
-
+
     Returns:
         Configured OpenAIClient instance
     """
@@ -502,6 +544,7 @@ def create_inference_client(
     if api_key is None:
        try:
            import os as _os  # local import to avoid module-level side effects
+
            api_key = _os.getenv("OPENAI_API_KEY") or getattr(task_app, "openai_api_key", None)
        except Exception:
            api_key = None
```