PyPI - synth-ai - Versions diffs - 0.2.4.dev6__py3-none-any.whl → 0.2.4.dev8__py3-none-any.whl - Mend

synth-ai 0.2.4.dev6__py3-none-any.whl → 0.2.4.dev8__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (256)

synth_ai/__init__.py +18 -9
synth_ai/cli/__init__.py +10 -5
synth_ai/cli/balance.py +25 -32
synth_ai/cli/calc.py +2 -3
synth_ai/cli/demo.py +3 -5
synth_ai/cli/legacy_root_backup.py +58 -32
synth_ai/cli/man.py +22 -19
synth_ai/cli/recent.py +9 -8
synth_ai/cli/root.py +58 -13
synth_ai/cli/status.py +13 -6
synth_ai/cli/traces.py +45 -21
synth_ai/cli/watch.py +40 -37
synth_ai/config/base_url.py +47 -2
synth_ai/core/experiment.py +1 -2
synth_ai/environments/__init__.py +2 -6
synth_ai/environments/environment/artifacts/base.py +3 -1
synth_ai/environments/environment/db/sqlite.py +1 -1
synth_ai/environments/environment/registry.py +19 -20
synth_ai/environments/environment/resources/sqlite.py +2 -3
synth_ai/environments/environment/rewards/core.py +3 -2
synth_ai/environments/environment/tools/__init__.py +6 -4
synth_ai/environments/examples/crafter_classic/__init__.py +1 -1
synth_ai/environments/examples/crafter_classic/engine.py +13 -13
synth_ai/environments/examples/crafter_classic/engine_deterministic_patch.py +1 -0
synth_ai/environments/examples/crafter_classic/engine_helpers/action_map.py +2 -1
synth_ai/environments/examples/crafter_classic/engine_helpers/serialization.py +2 -1
synth_ai/environments/examples/crafter_classic/engine_serialization_patch_v3.py +3 -2
synth_ai/environments/examples/crafter_classic/environment.py +16 -15
synth_ai/environments/examples/crafter_classic/taskset.py +2 -2
synth_ai/environments/examples/crafter_classic/trace_hooks_v3.py +2 -3
synth_ai/environments/examples/crafter_classic/world_config_patch_simple.py +2 -1
synth_ai/environments/examples/crafter_custom/crafter/__init__.py +2 -2
synth_ai/environments/examples/crafter_custom/crafter/config.py +2 -2
synth_ai/environments/examples/crafter_custom/crafter/env.py +1 -5
synth_ai/environments/examples/crafter_custom/crafter/objects.py +1 -2
synth_ai/environments/examples/crafter_custom/crafter/worldgen.py +1 -2
synth_ai/environments/examples/crafter_custom/dataset_builder.py +5 -5
synth_ai/environments/examples/crafter_custom/environment.py +13 -13
synth_ai/environments/examples/crafter_custom/run_dataset.py +5 -5
synth_ai/environments/examples/enron/art_helpers/email_search_tools.py +2 -2
synth_ai/environments/examples/enron/art_helpers/local_email_db.py +5 -4
synth_ai/environments/examples/enron/art_helpers/types_enron.py +2 -1
synth_ai/environments/examples/enron/engine.py +18 -14
synth_ai/environments/examples/enron/environment.py +12 -11
synth_ai/environments/examples/enron/taskset.py +7 -7
synth_ai/environments/examples/minigrid/__init__.py +6 -6
synth_ai/environments/examples/minigrid/engine.py +6 -6
synth_ai/environments/examples/minigrid/environment.py +6 -6
synth_ai/environments/examples/minigrid/puzzle_loader.py +3 -2
synth_ai/environments/examples/minigrid/taskset.py +13 -13
synth_ai/environments/examples/nethack/achievements.py +1 -1
synth_ai/environments/examples/nethack/engine.py +8 -7
synth_ai/environments/examples/nethack/environment.py +10 -9
synth_ai/environments/examples/nethack/helpers/__init__.py +8 -9
synth_ai/environments/examples/nethack/helpers/action_mapping.py +1 -1
synth_ai/environments/examples/nethack/helpers/nle_wrapper.py +2 -1
synth_ai/environments/examples/nethack/helpers/observation_utils.py +1 -1
synth_ai/environments/examples/nethack/helpers/recording_wrapper.py +3 -4
synth_ai/environments/examples/nethack/helpers/trajectory_recorder.py +6 -5
synth_ai/environments/examples/nethack/helpers/visualization/replay_viewer.py +5 -5
synth_ai/environments/examples/nethack/helpers/visualization/visualizer.py +7 -6
synth_ai/environments/examples/nethack/taskset.py +5 -5
synth_ai/environments/examples/red/engine.py +9 -8
synth_ai/environments/examples/red/engine_helpers/reward_components.py +2 -1
synth_ai/environments/examples/red/engine_helpers/reward_library/__init__.py +7 -7
synth_ai/environments/examples/red/engine_helpers/reward_library/adaptive_rewards.py +2 -1
synth_ai/environments/examples/red/engine_helpers/reward_library/battle_rewards.py +2 -1
synth_ai/environments/examples/red/engine_helpers/reward_library/composite_rewards.py +2 -1
synth_ai/environments/examples/red/engine_helpers/reward_library/economy_rewards.py +2 -1
synth_ai/environments/examples/red/engine_helpers/reward_library/efficiency_rewards.py +2 -1
synth_ai/environments/examples/red/engine_helpers/reward_library/exploration_rewards.py +2 -1
synth_ai/environments/examples/red/engine_helpers/reward_library/novelty_rewards.py +2 -1
synth_ai/environments/examples/red/engine_helpers/reward_library/pallet_town_rewards.py +2 -1
synth_ai/environments/examples/red/engine_helpers/reward_library/pokemon_rewards.py +2 -1
synth_ai/environments/examples/red/engine_helpers/reward_library/social_rewards.py +2 -1
synth_ai/environments/examples/red/engine_helpers/reward_library/story_rewards.py +2 -1
synth_ai/environments/examples/red/engine_helpers/screen_analysis.py +3 -2
synth_ai/environments/examples/red/engine_helpers/state_extraction.py +2 -1
synth_ai/environments/examples/red/environment.py +18 -15
synth_ai/environments/examples/red/taskset.py +5 -3
synth_ai/environments/examples/sokoban/engine.py +16 -13
synth_ai/environments/examples/sokoban/engine_helpers/room_utils.py +3 -2
synth_ai/environments/examples/sokoban/engine_helpers/vendored/__init__.py +2 -1
synth_ai/environments/examples/sokoban/engine_helpers/vendored/envs/__init__.py +1 -1
synth_ai/environments/examples/sokoban/engine_helpers/vendored/envs/boxoban_env.py +7 -5
synth_ai/environments/examples/sokoban/engine_helpers/vendored/envs/render_utils.py +1 -1
synth_ai/environments/examples/sokoban/engine_helpers/vendored/envs/room_utils.py +2 -1
synth_ai/environments/examples/sokoban/engine_helpers/vendored/envs/sokoban_env.py +5 -4
synth_ai/environments/examples/sokoban/engine_helpers/vendored/envs/sokoban_env_fixed_targets.py +3 -2
synth_ai/environments/examples/sokoban/engine_helpers/vendored/envs/sokoban_env_pull.py +2 -1
synth_ai/environments/examples/sokoban/engine_helpers/vendored/envs/sokoban_env_two_player.py +5 -4
synth_ai/environments/examples/sokoban/engine_helpers/vendored/envs/sokoban_env_variations.py +1 -1
synth_ai/environments/examples/sokoban/environment.py +15 -14
synth_ai/environments/examples/sokoban/generate_verified_puzzles.py +5 -3
synth_ai/environments/examples/sokoban/puzzle_loader.py +3 -2
synth_ai/environments/examples/sokoban/taskset.py +13 -10
synth_ai/environments/examples/tictactoe/engine.py +6 -6
synth_ai/environments/examples/tictactoe/environment.py +8 -7
synth_ai/environments/examples/tictactoe/taskset.py +6 -5
synth_ai/environments/examples/verilog/engine.py +4 -3
synth_ai/environments/examples/verilog/environment.py +11 -10
synth_ai/environments/examples/verilog/taskset.py +14 -12
synth_ai/environments/examples/wordle/__init__.py +5 -5
synth_ai/environments/examples/wordle/engine.py +32 -25
synth_ai/environments/examples/wordle/environment.py +21 -16
synth_ai/environments/examples/wordle/helpers/generate_instances_wordfreq.py +6 -6
synth_ai/environments/examples/wordle/taskset.py +20 -12
synth_ai/environments/reproducibility/core.py +1 -1
synth_ai/environments/reproducibility/tree.py +21 -21
synth_ai/environments/service/app.py +3 -2
synth_ai/environments/service/core_routes.py +104 -110
synth_ai/environments/service/external_registry.py +1 -2
synth_ai/environments/service/registry.py +1 -1
synth_ai/environments/stateful/core.py +1 -2
synth_ai/environments/stateful/engine.py +1 -1
synth_ai/environments/tasks/api.py +4 -4
synth_ai/environments/tasks/core.py +14 -12
synth_ai/environments/tasks/filters.py +6 -4
synth_ai/environments/tasks/utils.py +13 -11
synth_ai/evals/base.py +2 -3
synth_ai/experimental/synth_oss.py +4 -4
synth_ai/http.py +102 -0
synth_ai/inference/__init__.py +7 -0
synth_ai/inference/client.py +20 -0
synth_ai/jobs/client.py +246 -0
synth_ai/learning/__init__.py +24 -0
synth_ai/learning/client.py +149 -0
synth_ai/learning/config.py +43 -0
synth_ai/learning/constants.py +29 -0
synth_ai/learning/ft_client.py +59 -0
synth_ai/learning/gateway.py +1 -3
synth_ai/learning/health.py +43 -0
synth_ai/learning/jobs.py +205 -0
synth_ai/learning/prompts/banking77_injection_eval.py +15 -10
synth_ai/learning/prompts/hello_world_in_context_injection_ex.py +26 -14
synth_ai/learning/prompts/mipro.py +61 -52
synth_ai/learning/prompts/random_search.py +42 -43
synth_ai/learning/prompts/run_mipro_banking77.py +32 -20
synth_ai/learning/prompts/run_random_search_banking77.py +71 -52
synth_ai/learning/rl_client.py +256 -0
synth_ai/learning/sse.py +58 -0
synth_ai/learning/validators.py +48 -0
synth_ai/lm/__init__.py +5 -5
synth_ai/lm/caching/ephemeral.py +9 -9
synth_ai/lm/caching/handler.py +20 -20
synth_ai/lm/caching/persistent.py +10 -10
synth_ai/lm/config.py +3 -3
synth_ai/lm/constants.py +7 -7
synth_ai/lm/core/all.py +17 -3
synth_ai/lm/core/exceptions.py +0 -2
synth_ai/lm/core/main.py +26 -41
synth_ai/lm/core/main_v3.py +33 -10
synth_ai/lm/core/synth_models.py +48 -0
synth_ai/lm/core/vendor_clients.py +26 -22
synth_ai/lm/injection.py +7 -8
synth_ai/lm/overrides.py +21 -19
synth_ai/lm/provider_support/__init__.py +1 -1
synth_ai/lm/provider_support/anthropic.py +15 -15
synth_ai/lm/provider_support/openai.py +23 -21
synth_ai/lm/structured_outputs/handler.py +34 -32
synth_ai/lm/structured_outputs/inject.py +24 -27
synth_ai/lm/structured_outputs/rehabilitate.py +19 -15
synth_ai/lm/tools/base.py +17 -16
synth_ai/lm/unified_interface.py +17 -18
synth_ai/lm/vendors/base.py +20 -18
synth_ai/lm/vendors/core/anthropic_api.py +36 -27
synth_ai/lm/vendors/core/gemini_api.py +31 -36
synth_ai/lm/vendors/core/mistral_api.py +19 -19
synth_ai/lm/vendors/core/openai_api.py +42 -13
synth_ai/lm/vendors/openai_standard.py +158 -101
synth_ai/lm/vendors/openai_standard_responses.py +74 -61
synth_ai/lm/vendors/retries.py +9 -1
synth_ai/lm/vendors/supported/custom_endpoint.py +38 -28
synth_ai/lm/vendors/supported/deepseek.py +10 -10
synth_ai/lm/vendors/supported/grok.py +8 -8
synth_ai/lm/vendors/supported/ollama.py +2 -1
synth_ai/lm/vendors/supported/openrouter.py +11 -9
synth_ai/lm/vendors/synth_client.py +425 -75
synth_ai/lm/warmup.py +8 -7
synth_ai/rl/__init__.py +30 -0
synth_ai/rl/contracts.py +32 -0
synth_ai/rl/env_keys.py +137 -0
synth_ai/rl/secrets.py +19 -0
synth_ai/scripts/verify_rewards.py +100 -0
synth_ai/task/__init__.py +10 -0
synth_ai/task/contracts.py +120 -0
synth_ai/task/health.py +28 -0
synth_ai/task/validators.py +12 -0
synth_ai/tracing/__init__.py +22 -10
synth_ai/tracing_v1/__init__.py +22 -20
synth_ai/tracing_v3/__init__.py +7 -7
synth_ai/tracing_v3/abstractions.py +56 -52
synth_ai/tracing_v3/config.py +4 -2
synth_ai/tracing_v3/db_config.py +6 -8
synth_ai/tracing_v3/decorators.py +29 -30
synth_ai/tracing_v3/examples/basic_usage.py +12 -12
synth_ai/tracing_v3/hooks.py +24 -22
synth_ai/tracing_v3/llm_call_record_helpers.py +85 -98
synth_ai/tracing_v3/lm_call_record_abstractions.py +2 -4
synth_ai/tracing_v3/migration_helper.py +3 -5
synth_ai/tracing_v3/replica_sync.py +30 -32
synth_ai/tracing_v3/session_tracer.py +158 -31
synth_ai/tracing_v3/storage/__init__.py +1 -1
synth_ai/tracing_v3/storage/base.py +8 -7
synth_ai/tracing_v3/storage/config.py +4 -4
synth_ai/tracing_v3/storage/factory.py +4 -4
synth_ai/tracing_v3/storage/utils.py +9 -9
synth_ai/tracing_v3/turso/__init__.py +3 -3
synth_ai/tracing_v3/turso/daemon.py +9 -9
synth_ai/tracing_v3/turso/manager.py +278 -48
synth_ai/tracing_v3/turso/models.py +77 -19
synth_ai/tracing_v3/utils.py +5 -5
synth_ai/v0/tracing/abstractions.py +28 -28
synth_ai/v0/tracing/base_client.py +9 -9
synth_ai/v0/tracing/client_manager.py +7 -7
synth_ai/v0/tracing/config.py +7 -7
synth_ai/v0/tracing/context.py +6 -6
synth_ai/v0/tracing/decorators.py +6 -5
synth_ai/v0/tracing/events/manage.py +1 -1
synth_ai/v0/tracing/events/store.py +5 -4
synth_ai/v0/tracing/immediate_client.py +4 -5
synth_ai/v0/tracing/local.py +3 -3
synth_ai/v0/tracing/log_client_base.py +4 -5
synth_ai/v0/tracing/retry_queue.py +5 -6
synth_ai/v0/tracing/trackers.py +25 -25
synth_ai/v0/tracing/upload.py +6 -0
synth_ai/v0/tracing_v1/__init__.py +1 -1
synth_ai/v0/tracing_v1/abstractions.py +28 -28
synth_ai/v0/tracing_v1/base_client.py +9 -9
synth_ai/v0/tracing_v1/client_manager.py +7 -7
synth_ai/v0/tracing_v1/config.py +7 -7
synth_ai/v0/tracing_v1/context.py +6 -6
synth_ai/v0/tracing_v1/decorators.py +7 -6
synth_ai/v0/tracing_v1/events/manage.py +1 -1
synth_ai/v0/tracing_v1/events/store.py +5 -4
synth_ai/v0/tracing_v1/immediate_client.py +4 -5
synth_ai/v0/tracing_v1/local.py +3 -3
synth_ai/v0/tracing_v1/log_client_base.py +4 -5
synth_ai/v0/tracing_v1/retry_queue.py +5 -6
synth_ai/v0/tracing_v1/trackers.py +25 -25
synth_ai/v0/tracing_v1/upload.py +25 -24
synth_ai/zyk/__init__.py +1 -0
synth_ai-0.2.4.dev8.dist-info/METADATA +635 -0
synth_ai-0.2.4.dev8.dist-info/RECORD +317 -0
synth_ai/tui/__init__.py +0 -1
synth_ai/tui/__main__.py +0 -13
synth_ai/tui/cli/__init__.py +0 -1
synth_ai/tui/cli/query_experiments.py +0 -165
synth_ai/tui/cli/query_experiments_v3.py +0 -165
synth_ai/tui/dashboard.py +0 -329
synth_ai-0.2.4.dev6.dist-info/METADATA +0 -203
synth_ai-0.2.4.dev6.dist-info/RECORD +0 -299
{synth_ai-0.2.4.dev6.dist-info → synth_ai-0.2.4.dev8.dist-info}/WHEEL +0 -0
{synth_ai-0.2.4.dev6.dist-info → synth_ai-0.2.4.dev8.dist-info}/entry_points.txt +0 -0
{synth_ai-0.2.4.dev6.dist-info → synth_ai-0.2.4.dev8.dist-info}/licenses/LICENSE +0 -0
{synth_ai-0.2.4.dev6.dist-info → synth_ai-0.2.4.dev8.dist-info}/top_level.txt +0 -0

synth_ai/lm/warmup.py CHANGED Viewed

@@ -3,13 +3,14 @@ Model warmup utilities for Synth backend.
 Handles model preloading and warmup polling.
 """
-import httpx
 import asyncio
 import logging
 import sys
 import time
-from typing import Optional, Dict, Any
 from datetime import datetime, timedelta
+import httpx
 from .config import SynthConfig
 logger = logging.getLogger(__name__)
@@ -19,7 +20,7 @@ class WarmupStatus:
     """Track warmup status for models with TTL."""
     def __init__(self):
-        self._warmed_models: Dict[str, datetime] = {}
+        self._warmed_models: dict[str, datetime] = {}
         self._ttl = timedelta(minutes=10)  # Consider models warm for 10 minutes
     def is_warm(self, model_name: str) -> bool:
@@ -47,11 +48,11 @@ _warmup_status = WarmupStatus()
 async def warmup_synth_model(
     model_name: str,
-    config: Optional[SynthConfig] = None,
-    max_attempts: Optional[int] = None,
+    config: SynthConfig | None = None,
+    max_attempts: int | None = None,
     force: bool = False,
     verbose: bool = True,
-    gpu_preference: Optional[str] = None,
+    gpu_preference: str | None = None,
 ) -> bool:
     """
     Warm up a model on the Synth backend using fire-and-forget approach.
@@ -161,7 +162,7 @@ async def warmup_synth_model(
                 )
                 sys.stdout.flush()
                 await asyncio.sleep(1.0)
-            except Exception as e:
+            except Exception:
                 # Continue polling; update spinner line with error label
                 elapsed = int(time.time() - start_time)
                 wheel = spinner[spin_idx % len(spinner)]

synth_ai/rl/__init__.py ADDED Viewed

@@ -0,0 +1,30 @@
+from .contracts import (
+    RolloutEnvSpec,
+    RolloutPolicySpec,
+    RolloutRecordConfig,
+    RolloutSafetyConfig,
+    RolloutRequest,
+    RolloutStep,
+    RolloutTrajectory,
+    RolloutMetrics,
+    RolloutResponse,
+)
+from .env_keys import MAX_ENVIRONMENT_API_KEY_BYTES, encrypt_for_backend, setup_environment_api_key
+from .secrets import mint_environment_api_key
+__all__ = [
+    "RolloutEnvSpec",
+    "RolloutPolicySpec",
+    "RolloutRecordConfig",
+    "RolloutSafetyConfig",
+    "RolloutRequest",
+    "RolloutStep",
+    "RolloutTrajectory",
+    "RolloutMetrics",
+    "RolloutResponse",
+    "encrypt_for_backend",
+    "setup_environment_api_key",
+    "mint_environment_api_key",
+    "MAX_ENVIRONMENT_API_KEY_BYTES",
+]

synth_ai/rl/contracts.py ADDED Viewed

@@ -0,0 +1,32 @@
+from __future__ import annotations
+"""
+Compatibility layer: re-export Task App rollout contracts from synth_ai.task.contracts
+so existing imports continue to work while consolidating under synth_ai.task.
+"""
+from synth_ai.task.contracts import (
+    RolloutEnvSpec,
+    RolloutPolicySpec,
+    RolloutRecordConfig,
+    RolloutSafetyConfig,
+    RolloutRequest,
+    RolloutStep,
+    RolloutTrajectory,
+    RolloutMetrics,
+    RolloutResponse,
+)
+__all__ = [
+    "RolloutEnvSpec",
+    "RolloutPolicySpec",
+    "RolloutRecordConfig",
+    "RolloutSafetyConfig",
+    "RolloutRequest",
+    "RolloutStep",
+    "RolloutTrajectory",
+    "RolloutMetrics",
+    "RolloutResponse",
+]

synth_ai/rl/env_keys.py ADDED Viewed

@@ -0,0 +1,137 @@
+from __future__ import annotations
+"""Helpers for uploading RL environment credentials to the backend."""
+import base64
+import binascii
+import json
+from typing import Any, Dict
+import os
+import requests
+from nacl.public import PublicKey, SealedBox
+__all__ = ["encrypt_for_backend", "setup_environment_api_key", "MAX_ENVIRONMENT_API_KEY_BYTES"]
+MAX_ENVIRONMENT_API_KEY_BYTES = 8 * 1024
+_ALGORITHM = "libsodium.sealedbox.v1"
+def encrypt_for_backend(pubkey_b64: str, secret: str | bytes) -> str:
+    """Encrypt ``secret`` for storage by the backend using libsodium sealed boxes."""
+    if not isinstance(pubkey_b64, str) or not pubkey_b64.strip():
+        raise ValueError("public key must be a non-empty base64 string")
+    try:
+        key_bytes = base64.b64decode(pubkey_b64, validate=True)
+    except binascii.Error as exc:  # pragma: no cover - defensive guard
+        raise ValueError("public key must be base64-encoded") from exc
+    if len(key_bytes) != 32:
+        raise ValueError("public key must be 32 bytes for X25519")
+    if isinstance(secret, str):
+        secret_bytes = secret.encode("utf-8")
+    elif isinstance(secret, bytes):
+        secret_bytes = secret
+    else:  # pragma: no cover - type guard
+        raise TypeError("secret must be str or bytes")
+    if not secret_bytes:
+        raise ValueError("secret must not be empty")
+    box = SealedBox(PublicKey(key_bytes))
+    ciphertext = box.encrypt(secret_bytes)
+    return base64.b64encode(ciphertext).decode("ascii")
+def setup_environment_api_key(
+    backend_base: str,
+    synth_api_key: str,
+    token: str | None = None,
+    *,
+    timeout: float = 15.0,
+) -> Dict[str, Any]:
+    """Upload an ENVIRONMENT_API_KEY to the backend."""
+    backend = backend_base.rstrip("/")
+    if not backend:
+        raise ValueError("backend_base must be provided")
+    if not synth_api_key:
+        raise ValueError("synth_api_key must be provided")
+    # Require caller-provided plaintext. If not provided, read from ENVIRONMENT_API_KEY.
+    plaintext = token if token is not None else os.getenv("ENVIRONMENT_API_KEY", "").strip()
+    if not plaintext:
+        raise ValueError("ENVIRONMENT_API_KEY must be set (or pass token=...) to upload")
+    if not isinstance(plaintext, str):  # pragma: no cover - defensive guard
+        raise TypeError("token must be a string")
+    token_bytes = plaintext.encode("utf-8")
+    if not token_bytes:
+        raise ValueError("ENVIRONMENT_API_KEY token must not be empty")
+    if len(token_bytes) > MAX_ENVIRONMENT_API_KEY_BYTES:
+        raise ValueError("ENVIRONMENT_API_KEY token exceeds 8 KiB limit")
+    headers = {"Authorization": f"Bearer {synth_api_key}"}
+    pub_url = f"{backend}/api/v1/crypto/public-key"
+    response = requests.get(pub_url, headers=headers, timeout=timeout)
+    _raise_with_detail(response)
+    try:
+        doc = response.json()
+    except ValueError as exc:  # pragma: no cover - backend invariant
+        raise RuntimeError("backend returned invalid JSON for public key") from exc
+    if not isinstance(doc, dict):
+        raise RuntimeError("backend public key response must be an object")
+    pubkey = doc.get("public_key")
+    if not isinstance(pubkey, str) or not pubkey:
+        raise RuntimeError("backend response missing public_key")
+    # The backend currently returns a single algorithm identifier; keep a guard in
+    # case future versions change the value and we need to surface that to callers.
+    alg = doc.get("alg")
+    if alg is not None and alg != _ALGORITHM:
+        raise RuntimeError(f"unsupported sealed box algorithm: {alg}")
+    ciphertext_b64 = encrypt_for_backend(pubkey, token_bytes)
+    body = {"name": "ENVIRONMENT_API_KEY", "ciphertext_b64": ciphertext_b64}
+    post_url = f"{backend}/api/v1/env-keys"
+    response2 = requests.post(post_url, headers={**headers, "Content-Type": "application/json"}, json=body, timeout=timeout)
+    _raise_with_detail(response2)
+    try:
+        upload_doc = response2.json()
+    except ValueError:
+        upload_doc = {}
+    if not isinstance(upload_doc, dict):
+        upload_doc = {}
+    return {
+        "stored": True,
+        "id": upload_doc.get("id"),
+        "name": upload_doc.get("name"),
+        "updated_at": upload_doc.get("updated_at"),
+    }
+def _raise_with_detail(response: requests.Response) -> None:
+    try:
+        response.raise_for_status()
+    except requests.HTTPError as exc:
+        detail_snippet: str | None = None
+        try:
+            detail = response.json()
+            detail_snippet = json.dumps(detail, separators=(",", ":"))[:200]
+        except Exception:
+            body = response.text if response.text is not None else ""
+            detail_snippet = body[:200] if body else None
+        message = str(exc)
+        if detail_snippet:
+            message = f"{message} | body={detail_snippet}"
+        raise requests.HTTPError(message, request=exc.request, response=exc.response) from None

synth_ai/rl/secrets.py ADDED Viewed

@@ -0,0 +1,19 @@
+from __future__ import annotations
+"""Helpers for generating RL environment credentials."""
+import secrets
+__all__ = ["mint_environment_api_key"]
+def mint_environment_api_key() -> str:
+    """Mint a random ENVIRONMENT_API_KEY value.
+    The current format is 64 hexadecimal characters (256 bits of entropy), which
+    matches the shell helpers used by the RL examples. This keeps the token easy
+    to copy while remaining suitably strong for authentication.
+    """
+    # secrets.token_hex(32) → 32 random bytes rendered as 64 hex characters.
+    return secrets.token_hex(32)

synth_ai/scripts/verify_rewards.py ADDED Viewed

@@ -0,0 +1,100 @@
+#!/usr/bin/env python3
+"""
+Verify reward persistence in a traces database.
+Usage:
+  uv run python -m synth_ai.scripts.verify_rewards --db /path/to/db.sqlite --min-reward 1
+"""
+import argparse
+import asyncio
+import os
+from typing import Dict
+from sqlalchemy import text
+from synth_ai.tracing_v3.turso.manager import AsyncSQLTraceManager
+async def verify(db_path: str, min_reward: int) -> int:
+    db_url = db_path
+    if not db_url.startswith("sqlite+aiosqlite:///"):
+        db_url = f"sqlite+aiosqlite:///{os.path.abspath(db_path)}"
+    mgr = AsyncSQLTraceManager(db_url=db_url)
+    await mgr.initialize()
+    try:
+        async with mgr.session() as session:
+            # Sessions with outcome_rewards
+            q_good = text(
+                """
+                SELECT session_id, MAX(total_reward) as total_reward
+                FROM outcome_rewards
+                GROUP BY session_id
+                """
+            )
+            res = await session.execute(q_good)
+            outcomes = {row[0]: int(row[1]) for row in res.fetchall()}
+            # Sessions without outcome_rewards
+            q_missing = text(
+                """
+                SELECT s.session_id
+                FROM session_traces s
+                LEFT JOIN outcome_rewards o ON s.session_id = o.session_id
+                WHERE o.session_id IS NULL
+                """
+            )
+            res2 = await session.execute(q_missing)
+            missing = [row[0] for row in res2.fetchall()]
+            # Aggregate event_rewards per session (informational)
+            q_event = text(
+                """
+                SELECT session_id, COALESCE(SUM(reward_value), 0.0) as sum_rewards
+                FROM event_rewards
+                GROUP BY session_id
+                """
+            )
+            res3 = await session.execute(q_event)
+            event_sums: Dict[str, float] = {row[0]: float(row[1]) for row in res3.fetchall()}
+        print(f"Sessions with outcome_rewards: {len(outcomes)}")
+        print(f"Sessions missing outcome_rewards: {len(missing)}")
+        if missing:
+            print("Missing session_ids:", ", ".join(missing[:10]) + (" ..." if len(missing) > 10 else ""))
+        # Threshold check
+        qualifying = {sid: r for sid, r in outcomes.items() if r >= min_reward}
+        print(f"Sessions with total_reward >= {min_reward}: {len(qualifying)}")
+        # Show a small comparison snapshot
+        sample = list(qualifying.items())[:5]
+        for sid, tot in sample:
+            er = event_sums.get(sid, 0.0)
+            print(f"  {sid}: outcome={tot}, sum(event_rewards)={er:.2f}")
+        # Exit non-zero if any sessions are missing outcome rewards
+        if missing:
+            return 2
+        if min_reward > 0 and not qualifying:
+            return 3
+        return 0
+    finally:
+        await mgr.close()
+def main() -> int:
+    ap = argparse.ArgumentParser(description="Verify reward persistence in traces DB")
+    ap.add_argument("--db", required=True, help="Path to traces SQLite DB (aiosqlite)")
+    ap.add_argument("--min-reward", type=int, default=0, help="Minimum total_reward to consider qualifying")
+    args = ap.parse_args()
+    return asyncio.run(verify(args.db, args.min_reward))
+if __name__ == "__main__":
+    raise SystemExit(main())

synth_ai/task/__init__.py ADDED Viewed

@@ -0,0 +1,10 @@
+from .validators import validate_task_app_url
+from .health import task_app_health
+from .contracts import TaskAppContract, TaskAppEndpoints
+__all__ = [
+    "validate_task_app_url",
+    "task_app_health",
+    "TaskAppContract",
+    "TaskAppEndpoints",
+]

synth_ai/task/contracts.py ADDED Viewed

@@ -0,0 +1,120 @@
+from __future__ import annotations
+from dataclasses import dataclass
+from typing import Optional, Any, Dict, List
+from pydantic import BaseModel
+@dataclass(frozen=True)
+class TaskAppEndpoints:
+    """Canonical Task App endpoint shapes used by RL trainers.
+    The Task App is an HTTP service (often deployed on Modal) that exposes:
+    - Health: GET /health
+      • Requires header X-API-Key (when ENVIRONMENT_API_KEY is configured)
+      • Returns { healthy: true }
+    - Environment lifecycle:
+      • POST /env/{env_name}/initialize → { env_id, observation }
+      • POST /env/{env_name}/step      → { observation, reward, done, info }
+      • POST /env/{env_name}/terminate → { ok: true }
+    - Rollout (optional, unified schema):
+      • POST /rollout → { run_id, trajectories[], metrics, ... }
+    - Proxy (optional):
+      • POST /proxy/v1/chat/completions (for direct OpenAI calls from Task App)
+    """
+    health: str = "/health"
+    rollout: str = "/rollout"
+    proxy_chat_completions: str = "/proxy/v1/chat/completions"
+    env_initialize: str = "/env/{env_name}/initialize"
+    env_step: str = "/env/{env_name}/step"
+    env_terminate: str = "/env/{env_name}/terminate"
+@dataclass(frozen=True)
+class TaskAppContract:
+    """Requirements and expectations for a Task App used by RL trainers.
+    - Auth: ENVIRONMENT_API_KEY must be set in the Task App environment; requests include X-API-Key.
+    - Health: /health returns 200 and JSON; may verify X-API-Key header.
+    - Env API: initialize/step/terminate are present for the target env (e.g., CrafterClassic).
+    - Rollout API: optional; provides a single-call rollout for convenience/testing.
+    - Inference routing: policy config passes an inference_url (Synth backend or OpenAI proxy).
+    - URL: base must be reachable via HTTPS and should be under .modal.run in production.
+    """
+    base_url: str
+    env_name: Optional[str] = None
+    requires_api_key_header: bool = True
+# --- Unified rollout schema used by Task App services and SDK utilities ---
+class RolloutEnvSpec(BaseModel):
+    env_id: Optional[str] = None
+    env_name: Optional[str] = None
+    config: Dict[str, Any] = {}
+    seed: Optional[int] = None
+class RolloutPolicySpec(BaseModel):
+    policy_id: Optional[str] = None
+    policy_name: Optional[str] = None
+    config: Dict[str, Any] = {}
+class RolloutRecordConfig(BaseModel):
+    trajectories: bool = True
+    logprobs: bool = False
+    value: bool = False
+class RolloutSafetyConfig(BaseModel):
+    max_ops: int = 100000
+    max_time_s: float = 3600.0
+class RolloutRequest(BaseModel):
+    run_id: str
+    env: RolloutEnvSpec
+    policy: RolloutPolicySpec
+    ops: List[Dict[str, Any]] | List[str]
+    record: RolloutRecordConfig = RolloutRecordConfig()
+    on_done: str = "reset"
+    safety: RolloutSafetyConfig = RolloutSafetyConfig()
+    training_session_id: Optional[str] = None
+    synth_base_url: Optional[str] = None
+class RolloutStep(BaseModel):
+    obs: Dict[str, Any]
+    tool_calls: List[Dict[str, Any]]
+    reward: Optional[float] = None
+    done: bool = False
+    truncated: Optional[bool] = None
+    info: Optional[Dict[str, Any]] = None
+class RolloutTrajectory(BaseModel):
+    env_id: str
+    policy_id: str
+    steps: List[RolloutStep]
+    final: Optional[Dict[str, Any]] = None
+    length: int
+class RolloutMetrics(BaseModel):
+    episode_returns: List[float]
+    mean_return: float
+    num_steps: int
+    num_episodes: int = 0
+class RolloutResponse(BaseModel):
+    run_id: str
+    trajectories: List[RolloutTrajectory]
+    branches: Dict[str, List[str]] = {}
+    metrics: RolloutMetrics
+    aborted: bool = False
+    ops_executed: int = 0

synth_ai/task/health.py ADDED Viewed

@@ -0,0 +1,28 @@
+from __future__ import annotations
+from typing import Any, Dict
+import aiohttp
+async def task_app_health(task_app_url: str) -> Dict[str, Any]:
+    """Probe a Task App base URL for basic reachability.
+    Behavior:
+    - Try HEAD first (follows redirects)
+    - Fallback to GET if HEAD is unsupported
+    - Returns {ok: bool, status?: int, error?: str}
+    """
+    try:
+        async with aiohttp.ClientSession() as session:
+            async with session.head(task_app_url, allow_redirects=True) as r:
+                if 200 <= r.status < 400:
+                    return {"ok": True, "status": r.status}
+        async with aiohttp.ClientSession() as session:
+            async with session.get(task_app_url, allow_redirects=True) as r2:
+                if 200 <= r2.status < 400:
+                    return {"ok": True, "status": r2.status}
+        return {"ok": False, "status": None}
+    except Exception as e:
+        return {"ok": False, "error": f"{type(e).__name__}: {e}"}

synth_ai/task/validators.py ADDED Viewed

@@ -0,0 +1,12 @@
+from __future__ import annotations
+from urllib.parse import urlparse
+def validate_task_app_url(url: str, *, name: str = "TASK_APP_BASE_URL") -> None:
+    """Validate a Task App base URL (scheme + host present)."""
+    p = urlparse(url)
+    if p.scheme not in ("http", "https") or not p.netloc:
+        raise ValueError(f"Invalid {name}: malformed: {url}")

synth_ai/tracing/__init__.py CHANGED Viewed

@@ -1,18 +1,30 @@
-import sys as _sys
 import importlib as _importlib
+import sys as _sys
-_pkg = _importlib.import_module('synth_ai.v0.tracing')
+_pkg = _importlib.import_module("synth_ai.v0.tracing")
 _sys.modules[__name__] = _pkg
 _SUBMODULES = [
-    'abstractions', 'base_client', 'client_manager', 'config', 'context',
-    'decorators', 'immediate_client', 'local', 'log_client_base', 'retry_queue',
-    'trackers', 'upload', 'utils'
+    "abstractions",
+    "base_client",
+    "client_manager",
+    "config",
+    "context",
+    "decorators",
+    "immediate_client",
+    "local",
+    "log_client_base",
+    "retry_queue",
+    "trackers",
+    "upload",
+    "utils",
 ]
 for _m in _SUBMODULES:
-    _sys.modules[f'{__name__}.{_m}'] = _importlib.import_module(f'synth_ai.v0.tracing.{_m}')
+    _sys.modules[f"{__name__}.{_m}"] = _importlib.import_module(f"synth_ai.v0.tracing.{_m}")
-_events_pkg = _importlib.import_module('synth_ai.v0.tracing.events')
-_sys.modules[f'{__name__}.events'] = _events_pkg
-for _m in ['manage', 'scope', 'store']:
-    _sys.modules[f'{__name__}.events.{_m}'] = _importlib.import_module(f'synth_ai.v0.tracing.events.{_m}')
+_events_pkg = _importlib.import_module("synth_ai.v0.tracing.events")
+_sys.modules[f"{__name__}.events"] = _events_pkg
+for _m in ["manage", "scope", "store"]:
+    _sys.modules[f"{__name__}.events.{_m}"] = _importlib.import_module(
+        f"synth_ai.v0.tracing.events.{_m}"
+    )

synth_ai/tracing_v1/__init__.py CHANGED Viewed

@@ -1,31 +1,33 @@
-import sys as _sys
 import importlib as _importlib
+import sys as _sys
 # Forward top-level package
-_pkg = _importlib.import_module('synth_ai.v0.tracing_v1')
+_pkg = _importlib.import_module("synth_ai.v0.tracing_v1")
 _sys.modules[__name__] = _pkg
 # Explicitly forward submodules so `synth_ai.tracing_v1.X` works
 _SUBMODULES = [
-    'abstractions',
-    'base_client',
-    'client_manager',
-    'config',
-    'context',
-    'decorators',
-    'immediate_client',
-    'local',
-    'log_client_base',
-    'retry_queue',
-    'trackers',
-    'upload',
-    'utils',
+    "abstractions",
+    "base_client",
+    "client_manager",
+    "config",
+    "context",
+    "decorators",
+    "immediate_client",
+    "local",
+    "log_client_base",
+    "retry_queue",
+    "trackers",
+    "upload",
+    "utils",
 ]
 for _m in _SUBMODULES:
-    _sys.modules[f'{__name__}.{_m}'] = _importlib.import_module(f'synth_ai.v0.tracing_v1.{_m}')
+    _sys.modules[f"{__name__}.{_m}"] = _importlib.import_module(f"synth_ai.v0.tracing_v1.{_m}")
 # Forward events package and its submodules
-_events_pkg = _importlib.import_module('synth_ai.v0.tracing_v1.events')
-_sys.modules[f'{__name__}.events'] = _events_pkg
-for _m in ['manage', 'scope', 'store']:
-    _sys.modules[f'{__name__}.events.{_m}'] = _importlib.import_module(f'synth_ai.v0.tracing_v1.events.{_m}')
+_events_pkg = _importlib.import_module("synth_ai.v0.tracing_v1.events")
+_sys.modules[f"{__name__}.events"] = _events_pkg
+for _m in ["manage", "scope", "store"]:
+    _sys.modules[f"{__name__}.events.{_m}"] = _importlib.import_module(
+        f"synth_ai.v0.tracing_v1.events.{_m}"
+    )

synth_ai/tracing_v3/__init__.py CHANGED Viewed

@@ -1,7 +1,7 @@
 """Tracing v3 - Turso/sqld based tracing implementation.
 This module provides a modern, async-first tracing system for capturing and storing
-detailed execution traces from AI systems. It's designed to handle high-throughput
+detailed execution traces from AI systems. It's designed to handle high-throughput
 scenarios with proper async/await patterns throughout.
 Architecture Overview:
@@ -49,10 +49,10 @@ Key Features:
 Usage Example:
 -------------
     from synth_ai.tracing_v3 import SessionTracer
     tracer = SessionTracer()
     await tracer.initialize()
     async with tracer.session() as session_id:
         async with tracer.timestep("step1", turn_number=1):
             # Record events during execution
@@ -70,17 +70,17 @@ The system uses environment variables for configuration:
 See `config.py` for full configuration options.
 """
-from .session_tracer import SessionTracer
 from .abstractions import (
-    SessionTrace,
-    SessionTimeStep,
     BaseEvent,
-    RuntimeEvent,
     EnvironmentEvent,
+    RuntimeEvent,
     SessionEventMarkovBlanketMessage,
+    SessionTimeStep,
+    SessionTrace,
     TimeRecord,
 )
 from .config import TursoConfig
+from .session_tracer import SessionTracer
 __all__ = [
     "SessionTracer",

synth-ai 0.2.4.dev6__py3-none-any.whl → 0.2.4.dev8__py3-none-any.whl

synth-ai 0.2.4.dev6__py3-none-any.whl → 0.2.4.dev8__py3-none-any.whl