PyPI - synth-ai - Versions diffs - 0.2.13.dev2__py3-none-any.whl → 0.2.16__py3-none-any.whl - Mend

synth-ai 0.2.13.dev2__py3-none-any.whl → 0.2.16__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.

This version of synth-ai might be problematic. Click here for more details.

Files changed (293)

examples/README.md +1 -0
examples/multi_step/SFT_README.md +147 -0
examples/multi_step/configs/README_verilog_rl.md +77 -0
examples/multi_step/configs/VERILOG_REWARDS.md +90 -0
examples/multi_step/configs/VERILOG_RL_CHECKLIST.md +183 -0
examples/multi_step/configs/crafter_eval_synth_qwen4b.toml +35 -0
examples/multi_step/configs/crafter_eval_text_only_groq_qwen32b.toml +36 -0
examples/multi_step/configs/crafter_rl_stepwise_hosted_judge.toml +12 -11
examples/multi_step/configs/crafter_sft_qwen30b_lora.toml +62 -0
examples/multi_step/configs/crafter_synth_backend.md +40 -0
examples/multi_step/configs/verilog_eval_groq_qwen32b.toml +31 -0
examples/multi_step/configs/verilog_eval_synth_qwen8b.toml +33 -0
examples/multi_step/configs/verilog_rl_lora.toml +190 -0
examples/multi_step/convert_traces_to_sft.py +84 -0
examples/multi_step/judges/crafter_backend_judge.py +220 -0
examples/multi_step/judges/verilog_backend_judge.py +234 -0
examples/multi_step/readme.md +48 -0
examples/multi_step/run_sft_qwen30b.sh +45 -0
examples/multi_step/verilog_rl_lora.md +218 -0
examples/qwen_coder/configs/coder_lora_30b.toml +3 -2
examples/qwen_coder/configs/coder_lora_4b.toml +2 -1
examples/qwen_coder/configs/coder_lora_small.toml +2 -1
examples/qwen_vl/BUGS_AND_FIXES.md +232 -0
examples/qwen_vl/IMAGE_VALIDATION_COMPLETE.md +271 -0
examples/qwen_vl/IMAGE_VALIDATION_SUMMARY.md +260 -0
examples/qwen_vl/INFERENCE_SFT_TESTS.md +412 -0
examples/qwen_vl/NEXT_STEPS_2B.md +325 -0
examples/qwen_vl/QUICKSTART.md +327 -0
examples/qwen_vl/QUICKSTART_RL_VISION.md +110 -0
examples/qwen_vl/README.md +154 -0
examples/qwen_vl/RL_VISION_COMPLETE.md +475 -0
examples/qwen_vl/RL_VISION_TESTING.md +333 -0
examples/qwen_vl/SDK_VISION_INTEGRATION.md +328 -0
examples/qwen_vl/SETUP_COMPLETE.md +275 -0
examples/qwen_vl/VISION_TESTS_COMPLETE.md +490 -0
examples/qwen_vl/VLM_PIPELINE_COMPLETE.md +242 -0
examples/qwen_vl/__init__.py +2 -0
examples/qwen_vl/collect_data_via_cli.md +423 -0
examples/qwen_vl/collect_vision_traces.py +368 -0
examples/qwen_vl/configs/crafter_rl_vision_qwen3vl4b.toml +127 -0
examples/qwen_vl/configs/crafter_vlm_sft_example.toml +60 -0
examples/qwen_vl/configs/eval_gpt4o_mini_vision.toml +43 -0
examples/qwen_vl/configs/eval_gpt4o_vision_proper.toml +29 -0
examples/qwen_vl/configs/eval_gpt5nano_vision.toml +45 -0
examples/qwen_vl/configs/eval_qwen2vl_vision.toml +44 -0
examples/qwen_vl/configs/filter_qwen2vl_sft.toml +50 -0
examples/qwen_vl/configs/filter_vision_sft.toml +53 -0
examples/qwen_vl/configs/filter_vision_test.toml +8 -0
examples/qwen_vl/configs/sft_qwen3_vl_2b_test.toml +54 -0
examples/qwen_vl/crafter_gpt5nano_agent.py +308 -0
examples/qwen_vl/crafter_qwen_vl_agent.py +300 -0
examples/qwen_vl/run_vision_comparison.sh +62 -0
examples/qwen_vl/run_vision_sft_pipeline.sh +175 -0
examples/qwen_vl/test_image_validation.py +201 -0
examples/qwen_vl/test_sft_vision_data.py +110 -0
examples/rl/README.md +1 -1
examples/rl/configs/eval_base_qwen.toml +17 -0
examples/rl/configs/eval_rl_qwen.toml +13 -0
examples/rl/configs/rl_from_base_qwen.toml +37 -0
examples/rl/configs/rl_from_base_qwen17.toml +76 -0
examples/rl/configs/rl_from_ft_qwen.toml +37 -0
examples/rl/run_eval.py +436 -0
examples/rl/run_rl_and_save.py +111 -0
examples/rl/task_app/README.md +22 -0
examples/rl/task_app/math_single_step.py +990 -0
examples/rl/task_app/math_task_app.py +111 -0
examples/sft/README.md +5 -5
examples/sft/configs/crafter_fft_qwen0p6b.toml +4 -2
examples/sft/configs/crafter_lora_qwen0p6b.toml +4 -3
examples/sft/evaluate.py +4 -4
examples/sft/export_dataset.py +7 -4
examples/sft/generate_traces.py +2 -0
examples/swe/task_app/README.md +1 -1
examples/swe/task_app/grpo_swe_mini.py +1 -1
examples/swe/task_app/grpo_swe_mini_task_app.py +0 -12
examples/swe/task_app/hosted/envs/mini_swe/environment.py +13 -13
examples/swe/task_app/hosted/policy_routes.py +0 -2
examples/swe/task_app/hosted/rollout.py +2 -8
examples/task_apps/IMAGE_ONLY_EVAL_QUICKSTART.md +258 -0
examples/task_apps/crafter/CREATE_SFT_DATASET.md +273 -0
examples/task_apps/crafter/EVAL_IMAGE_ONLY_RESULTS.md +152 -0
examples/task_apps/crafter/FILTER_COMMAND_STATUS.md +174 -0
examples/task_apps/crafter/FILTER_COMMAND_SUCCESS.md +268 -0
examples/task_apps/crafter/QUERY_EXAMPLES.md +203 -0
examples/task_apps/crafter/README_IMAGE_ONLY_EVAL.md +316 -0
examples/task_apps/crafter/eval_image_only_gpt4o.toml +28 -0
examples/task_apps/crafter/eval_text_only_groq_llama.toml +36 -0
examples/task_apps/crafter/filter_sft_dataset.toml +16 -0
examples/task_apps/crafter/task_app/__init__.py +3 -0
examples/task_apps/crafter/task_app/grpo_crafter.py +309 -14
examples/task_apps/crafter/task_app/synth_envs_hosted/envs/crafter/environment.py +10 -0
examples/task_apps/crafter/task_app/synth_envs_hosted/envs/crafter/policy.py +75 -4
examples/task_apps/crafter/task_app/synth_envs_hosted/envs/crafter/react_agent.py +17 -2
examples/task_apps/crafter/task_app/synth_envs_hosted/inference/openai_client.py +55 -3
examples/task_apps/crafter/task_app/synth_envs_hosted/policy_routes.py +114 -32
examples/task_apps/crafter/task_app/synth_envs_hosted/rollout.py +127 -27
examples/task_apps/crafter/task_app/synth_envs_hosted/utils.py +156 -0
examples/task_apps/enron/__init__.py +1 -0
examples/task_apps/enron/filter_sft.toml +5 -0
examples/task_apps/enron/tests/__init__.py +2 -0
examples/task_apps/enron/tests/integration/__init__.py +2 -0
examples/task_apps/enron/tests/integration/test_enron_eval.py +2 -0
examples/task_apps/enron/tests/unit/__init__.py +2 -0
examples/task_apps/pokemon_red/EVAL_IMAGE_ONLY_COMPLETE.md +283 -0
examples/task_apps/pokemon_red/EVAL_IMAGE_ONLY_STATUS.md +155 -0
examples/task_apps/pokemon_red/README_IMAGE_ONLY_EVAL.md +415 -0
examples/task_apps/pokemon_red/eval_image_only_gpt4o.toml +29 -0
examples/task_apps/pokemon_red/pallet_town_rl_config.toml +2 -0
examples/task_apps/pokemon_red/task_app.py +199 -6
examples/task_apps/pokemon_red/test_pallet_town_rewards.py +2 -0
examples/task_apps/sokoban/filter_sft.toml +5 -0
examples/task_apps/sokoban/tests/__init__.py +2 -0
examples/task_apps/sokoban/tests/integration/__init__.py +2 -0
examples/task_apps/sokoban/tests/unit/__init__.py +2 -0
examples/task_apps/verilog/eval_groq_qwen32b.toml +8 -4
examples/task_apps/verilog/filter_sft.toml +5 -0
examples/task_apps/verilog/task_app/grpo_verilog.py +258 -23
examples/task_apps/verilog/tests/__init__.py +2 -0
examples/task_apps/verilog/tests/integration/__init__.py +2 -0
examples/task_apps/verilog/tests/integration/test_verilog_eval.py +2 -0
examples/task_apps/verilog/tests/unit/__init__.py +2 -0
examples/vlm/README.md +3 -3
examples/vlm/configs/crafter_vlm_gpt4o.toml +2 -0
examples/vlm/crafter_openai_vlm_agent.py +3 -5
examples/vlm/filter_image_rows.py +1 -1
examples/vlm/run_crafter_vlm_benchmark.py +2 -2
examples/warming_up_to_rl/_utils.py +92 -0
examples/warming_up_to_rl/analyze_trace_db.py +1 -1
examples/warming_up_to_rl/configs/crafter_fft.toml +2 -0
examples/warming_up_to_rl/configs/crafter_fft_4b.toml +2 -0
examples/warming_up_to_rl/configs/eval_fft_qwen4b.toml +2 -0
examples/warming_up_to_rl/configs/eval_groq_qwen32b.toml +2 -0
examples/warming_up_to_rl/configs/eval_modal_qwen4b.toml +2 -1
examples/warming_up_to_rl/configs/rl_from_base_qwen4b.toml +2 -1
examples/warming_up_to_rl/configs/rl_from_ft.toml +2 -0
examples/warming_up_to_rl/export_trace_sft.py +174 -60
examples/warming_up_to_rl/groq_test.py +2 -0
examples/warming_up_to_rl/readme.md +63 -132
examples/warming_up_to_rl/run_fft_and_save.py +1 -1
examples/warming_up_to_rl/run_local_rollout.py +2 -0
examples/warming_up_to_rl/run_local_rollout_modal.py +2 -0
examples/warming_up_to_rl/run_local_rollout_parallel.py +2 -0
examples/warming_up_to_rl/run_local_rollout_traced.py +2 -0
examples/warming_up_to_rl/run_rl_and_save.py +1 -1
examples/warming_up_to_rl/run_rollout_remote.py +2 -0
examples/warming_up_to_rl/task_app/README.md +42 -0
examples/warming_up_to_rl/task_app/grpo_crafter.py +696 -0
examples/warming_up_to_rl/task_app/grpo_crafter_task_app.py +135 -0
examples/warming_up_to_rl/task_app/synth_envs_hosted/README.md +173 -0
examples/warming_up_to_rl/task_app/synth_envs_hosted/__init__.py +5 -0
examples/warming_up_to_rl/task_app/synth_envs_hosted/branching.py +143 -0
examples/warming_up_to_rl/task_app/synth_envs_hosted/environment_routes.py +1226 -0
examples/warming_up_to_rl/task_app/synth_envs_hosted/envs/__init__.py +1 -0
examples/warming_up_to_rl/task_app/synth_envs_hosted/envs/crafter/__init__.py +6 -0
examples/warming_up_to_rl/task_app/synth_envs_hosted/envs/crafter/app.py +1 -0
examples/warming_up_to_rl/task_app/synth_envs_hosted/envs/crafter/environment.py +522 -0
examples/warming_up_to_rl/task_app/synth_envs_hosted/envs/crafter/policy.py +478 -0
examples/warming_up_to_rl/task_app/synth_envs_hosted/envs/crafter/react_agent.py +108 -0
examples/warming_up_to_rl/task_app/synth_envs_hosted/envs/crafter/shared.py +305 -0
examples/warming_up_to_rl/task_app/synth_envs_hosted/envs/crafter/tools.py +47 -0
examples/warming_up_to_rl/task_app/synth_envs_hosted/hosted_app.py +204 -0
examples/warming_up_to_rl/task_app/synth_envs_hosted/inference/__init__.py +5 -0
examples/warming_up_to_rl/task_app/synth_envs_hosted/inference/openai_client.py +618 -0
examples/warming_up_to_rl/task_app/synth_envs_hosted/main.py +100 -0
examples/warming_up_to_rl/task_app/synth_envs_hosted/policy_routes.py +1081 -0
examples/warming_up_to_rl/task_app/synth_envs_hosted/registry.py +195 -0
examples/warming_up_to_rl/task_app/synth_envs_hosted/rollout.py +1861 -0
examples/warming_up_to_rl/task_app/synth_envs_hosted/storage/__init__.py +5 -0
examples/warming_up_to_rl/task_app/synth_envs_hosted/storage/volume.py +211 -0
examples/warming_up_to_rl/task_app/synth_envs_hosted/test_agents.py +161 -0
examples/warming_up_to_rl/task_app/synth_envs_hosted/test_service.py +137 -0
examples/warming_up_to_rl/task_app/synth_envs_hosted/utils.py +62 -0
synth_ai/__init__.py +44 -30
synth_ai/_utils/__init__.py +47 -0
synth_ai/_utils/base_url.py +10 -0
synth_ai/_utils/http.py +10 -0
synth_ai/_utils/prompts.py +10 -0
synth_ai/_utils/task_app_state.py +12 -0
synth_ai/_utils/user_config.py +10 -0
synth_ai/api/models/supported.py +145 -7
synth_ai/api/train/__init__.py +13 -1
synth_ai/api/train/cli.py +30 -7
synth_ai/api/train/config_finder.py +18 -11
synth_ai/api/train/env_resolver.py +13 -10
synth_ai/cli/__init__.py +66 -49
synth_ai/cli/_modal_wrapper.py +9 -6
synth_ai/cli/_typer_patch.py +0 -2
synth_ai/cli/_validate_task_app.py +22 -4
synth_ai/cli/legacy_root_backup.py +3 -1
synth_ai/cli/lib/__init__.py +10 -0
synth_ai/cli/lib/task_app_discovery.py +7 -0
synth_ai/cli/lib/task_app_env.py +518 -0
synth_ai/cli/recent.py +1 -0
synth_ai/cli/setup.py +266 -0
synth_ai/cli/task_app_deploy.py +16 -0
synth_ai/cli/task_app_list.py +25 -0
synth_ai/cli/task_app_modal_serve.py +16 -0
synth_ai/cli/task_app_serve.py +18 -0
synth_ai/cli/task_apps.py +392 -141
synth_ai/cli/train.py +18 -0
synth_ai/cli/tui.py +62 -0
synth_ai/demos/__init__.py +10 -0
synth_ai/demos/core/__init__.py +28 -1
synth_ai/demos/crafter/__init__.py +1 -0
synth_ai/demos/crafter/crafter_fft_4b.toml +55 -0
synth_ai/demos/crafter/grpo_crafter_task_app.py +185 -0
synth_ai/demos/crafter/rl_from_base_qwen4b.toml +74 -0
synth_ai/demos/demo_registry.py +176 -0
synth_ai/demos/demo_task_apps/crafter/grpo_crafter_task_app.py +1 -1
synth_ai/demos/math/__init__.py +1 -0
synth_ai/demos/math/_common.py +16 -0
synth_ai/demos/math/app.py +38 -0
synth_ai/demos/math/config.toml +76 -0
synth_ai/demos/math/deploy_modal.py +54 -0
synth_ai/demos/math/modal_task_app.py +702 -0
synth_ai/demos/math/task_app_entry.py +51 -0
synth_ai/environments/environment/core.py +7 -1
synth_ai/environments/examples/bandit/engine.py +0 -1
synth_ai/environments/examples/bandit/environment.py +0 -1
synth_ai/environments/examples/crafter_classic/environment.py +1 -1
synth_ai/environments/examples/verilog/engine.py +76 -10
synth_ai/environments/examples/wordle/environment.py +0 -1
synth_ai/evals/base.py +16 -5
synth_ai/evals/client.py +1 -1
synth_ai/inference/client.py +1 -1
synth_ai/learning/client.py +1 -1
synth_ai/learning/health.py +1 -1
synth_ai/learning/jobs.py +1 -1
synth_ai/learning/rl/client.py +1 -1
synth_ai/learning/rl/env_keys.py +1 -1
synth_ai/learning/rl/secrets.py +1 -1
synth_ai/learning/sft/client.py +1 -1
synth_ai/learning/sft/data.py +407 -4
synth_ai/learning/validators.py +4 -1
synth_ai/task/__init__.py +11 -1
synth_ai/task/apps/__init__.py +5 -2
synth_ai/task/config.py +259 -0
synth_ai/task/contracts.py +15 -2
synth_ai/task/rubrics/__init__.py +4 -2
synth_ai/task/rubrics/loaders.py +27 -4
synth_ai/task/rubrics/scoring.py +3 -0
synth_ai/task/rubrics.py +219 -0
synth_ai/task/trace_correlation_helpers.py +328 -0
synth_ai/task/tracing_utils.py +14 -3
synth_ai/task/validators.py +145 -2
synth_ai/tracing_v3/config.py +15 -13
synth_ai/tracing_v3/constants.py +21 -0
synth_ai/tracing_v3/db_config.py +3 -1
synth_ai/tracing_v3/decorators.py +10 -7
synth_ai/tracing_v3/session_tracer.py +10 -0
synth_ai/tracing_v3/turso/daemon.py +2 -2
synth_ai/tracing_v3/turso/native_manager.py +108 -77
synth_ai/tracing_v3/utils.py +1 -1
synth_ai/tui/__init__.py +5 -0
synth_ai/tui/__main__.py +13 -0
synth_ai/tui/cli/__init__.py +1 -0
synth_ai/tui/cli/query_experiments.py +164 -0
synth_ai/tui/cli/query_experiments_v3.py +164 -0
synth_ai/tui/dashboard.py +911 -0
synth_ai/utils/__init__.py +101 -0
synth_ai/utils/base_url.py +94 -0
synth_ai/utils/cli.py +131 -0
synth_ai/utils/env.py +287 -0
synth_ai/utils/http.py +169 -0
synth_ai/utils/modal.py +308 -0
synth_ai/utils/process.py +212 -0
synth_ai/utils/prompts.py +39 -0
synth_ai/utils/sqld.py +122 -0
synth_ai/utils/task_app_discovery.py +882 -0
synth_ai/utils/task_app_env.py +186 -0
synth_ai/utils/task_app_state.py +318 -0
synth_ai/utils/user_config.py +137 -0
synth_ai/v0/config/__init__.py +1 -5
synth_ai/v0/config/base_url.py +1 -7
synth_ai/v0/tracing/config.py +1 -1
synth_ai/v0/tracing/decorators.py +1 -1
synth_ai/v0/tracing/upload.py +1 -1
synth_ai/v0/tracing_v1/config.py +1 -1
synth_ai/v0/tracing_v1/decorators.py +1 -1
synth_ai/v0/tracing_v1/upload.py +1 -1
{synth_ai-0.2.13.dev2.dist-info → synth_ai-0.2.16.dist-info}/METADATA +85 -31
{synth_ai-0.2.13.dev2.dist-info → synth_ai-0.2.16.dist-info}/RECORD +286 -135
synth_ai/cli/man.py +0 -106
synth_ai/compound/cais.py +0 -0
synth_ai/core/experiment.py +0 -13
synth_ai/core/system.py +0 -15
synth_ai/demo_registry.py +0 -295
synth_ai/handshake.py +0 -109
synth_ai/http.py +0 -26
{synth_ai-0.2.13.dev2.dist-info → synth_ai-0.2.16.dist-info}/WHEEL +0 -0
{synth_ai-0.2.13.dev2.dist-info → synth_ai-0.2.16.dist-info}/entry_points.txt +0 -0
{synth_ai-0.2.13.dev2.dist-info → synth_ai-0.2.16.dist-info}/licenses/LICENSE +0 -0
{synth_ai-0.2.13.dev2.dist-info → synth_ai-0.2.16.dist-info}/top_level.txt +0 -0

synth_ai/tracing_v3/turso/daemon.py CHANGED Viewed

@@ -30,7 +30,7 @@ class SqldDaemon:
         self.db_path = db_path or CONFIG.sqld_db_path
         self.http_port = http_port or CONFIG.sqld_http_port
         self.binary_path = binary_path or self._find_binary()
-        self.process: subprocess.Popen | None = None
+        self.process: subprocess.Popen[str] | None = None
     def _find_binary(self) -> str:
         """Find sqld binary in PATH."""
@@ -84,7 +84,7 @@ class SqldDaemon:
                 pass
             # Check if process crashed
-            if self.process.poll() is not None:
+            if self.process and self.process.poll() is not None:
                 stdout, stderr = self.process.communicate()
                 raise RuntimeError(
                     f"sqld daemon failed to start:\nstdout: {stdout}\nstderr: {stderr}"

synth_ai/tracing_v3/turso/native_manager.py CHANGED Viewed

@@ -370,8 +370,20 @@ class NativeLibsqlTraceManager(TraceStorage):
     async def insert_session_trace(self, trace: SessionTrace) -> str:
         await self.initialize()
-        if await self._session_exists(trace.session_id):
+        import logging as _logging
+        _logger = _logging.getLogger(__name__)
+        _logger.info(f"[TRACE_DEBUG] insert_session_trace START: session_id={trace.session_id}, {len(trace.markov_blanket_message_history)} messages")
+        session_exists = await self._session_exists(trace.session_id)
+        _logger.info(f"[TRACE_DEBUG] Session exists: {session_exists}")
+        step_id_map: dict[str, int] = {}
+        if session_exists:
+            _logger.warning(f"[TRACE_DEBUG] Session {trace.session_id} already exists, skipping events/timesteps, only updating messages!")
+            # Don't return early - we need to save messages!
+            # Just update metadata
             async with self._op_lock:
                 conn = self._conn
                 assert conn is not None
@@ -380,87 +392,102 @@ class NativeLibsqlTraceManager(TraceStorage):
                     (_json_dumps(trace.metadata or {}), trace.session_id),
                 )
                 conn.commit()
-            return trace.session_id
+            # Skip events and timesteps to ensure idempotency
+        else:
+            created_at = trace.created_at or datetime.now(UTC)
-        created_at = trace.created_at or datetime.now(UTC)
+            async with self._op_lock:
+                conn = self._conn
+                assert conn is not None
+                conn.execute(
+                    """
+                    INSERT INTO session_traces (
+                        session_id,
+                        created_at,
+                        num_timesteps,
+                        num_events,
+                        num_messages,
+                        metadata
+                    )
+                    VALUES (?, ?, 0, 0, 0, ?)
+                    """,
+                    (
+                        trace.session_id,
+                        created_at.isoformat(),
+                        _json_dumps(trace.metadata or {}),
+                    ),
+                )
+                conn.commit()
+                _logger.info("[TRACE_DEBUG] Session row inserted")
-        async with self._op_lock:
-            conn = self._conn
-            assert conn is not None
-            conn.execute(
-                """
-                INSERT INTO session_traces (
-                    session_id,
-                    created_at,
-                    num_timesteps,
-                    num_events,
-                    num_messages,
-                    metadata
+            # Only insert timesteps and events if this is a new session
+            for step in trace.session_time_steps:
+                step_db_id = await self.ensure_timestep(
+                    trace.session_id,
+                    step_id=step.step_id,
+                    step_index=step.step_index,
+                    turn_number=step.turn_number,
+                    started_at=step.timestamp,
+                    completed_at=step.completed_at,
+                    metadata=step.step_metadata or {},
                 )
-                VALUES (?, ?, 0, 0, 0, ?)
-                """,
-                (
+                step_id_map[step.step_id] = step_db_id
+            for event in trace.event_history:
+                step_ref = None
+                metadata = event.metadata or {}
+                if isinstance(metadata, dict):
+                    step_ref = metadata.get("step_id")
+                timestep_db_id = step_id_map.get(step_ref) if step_ref else None
+                await self.insert_event_row(
                     trace.session_id,
-                    created_at.isoformat(),
-                    _json_dumps(trace.metadata or {}),
-                ),
-            )
-            conn.commit()
-        step_id_map: dict[str, int] = {}
-        for step in trace.session_time_steps:
-            step_db_id = await self.ensure_timestep(
-                trace.session_id,
-                step_id=step.step_id,
-                step_index=step.step_index,
-                turn_number=step.turn_number,
-                started_at=step.timestamp,
-                completed_at=step.completed_at,
-                metadata=step.step_metadata or {},
-            )
-            step_id_map[step.step_id] = step_db_id
+                    timestep_db_id=timestep_db_id,
+                    event=event,
+                    metadata_override=event.metadata or {},
+                )
-        for event in trace.event_history:
-            step_ref = None
-            metadata = event.metadata or {}
-            if isinstance(metadata, dict):
+        import logging as _logging
+        _logger = _logging.getLogger(__name__)
+        _logger.info(f"[TRACE_DEBUG] insert_session_trace: saving {len(trace.markov_blanket_message_history)} messages (session_exists={session_exists})")
+        # Only insert messages if this is a new session (for idempotency)
+        if not session_exists:
+            for idx, msg in enumerate(trace.markov_blanket_message_history):
+                metadata = dict(getattr(msg, "metadata", {}) or {})
                 step_ref = metadata.get("step_id")
-            timestep_db_id = step_id_map.get(step_ref) if step_ref else None
-            await self.insert_event_row(
-                trace.session_id,
-                timestep_db_id=timestep_db_id,
-                event=event,
-                metadata_override=event.metadata or {},
-            )
-        for msg in trace.markov_blanket_message_history:
-            metadata = dict(getattr(msg, "metadata", {}) or {})
-            step_ref = metadata.get("step_id")
-            content_value = msg.content
-            if isinstance(msg.content, SessionMessageContent):
-                if msg.content.json_payload:
-                    metadata.setdefault("json_payload", msg.content.json_payload)
-                    content_value = msg.content.json_payload
-                else:
-                    content_value = msg.content.as_text()
-                    if msg.content.text:
-                        metadata.setdefault("text", msg.content.text)
-            elif not isinstance(content_value, str):
+                content_value = msg.content
+                if isinstance(msg.content, SessionMessageContent):
+                    if msg.content.json_payload:
+                        metadata.setdefault("json_payload", msg.content.json_payload)
+                        content_value = msg.content.json_payload
+                    else:
+                        content_value = msg.content.as_text()
+                        if msg.content.text:
+                            metadata.setdefault("text", msg.content.text)
+                elif not isinstance(content_value, str):
+                    try:
+                        content_value = json.dumps(content_value, ensure_ascii=False)
+                    except (TypeError, ValueError):
+                        content_value = str(content_value)
+                _logger.info(f"[TRACE_DEBUG]   Message {idx+1}: type={msg.message_type}, content_len={len(str(content_value))}")
                 try:
-                    content_value = json.dumps(content_value, ensure_ascii=False)
-                except (TypeError, ValueError):
-                    content_value = str(content_value)
-            await self.insert_message_row(
-                trace.session_id,
-                timestep_db_id=step_id_map.get(step_ref) if step_ref else None,
-                message_type=msg.message_type,
-                content=content_value,
-                event_time=msg.time_record.event_time,
-                message_time=msg.time_record.message_time,
-                metadata=metadata,
-            )
+                    await self.insert_message_row(
+                        trace.session_id,
+                        timestep_db_id=step_id_map.get(step_ref) if step_ref else None,
+                        message_type=msg.message_type,
+                        content=content_value,
+                        event_time=msg.time_record.event_time,
+                        message_time=msg.time_record.message_time,
+                        metadata=metadata,
+                    )
+                    _logger.info(f"[TRACE_DEBUG]   Message {idx+1}: saved successfully")
+                except Exception as exc:
+                    _logger.error(f"[TRACE_DEBUG]   Message {idx+1}: FAILED TO SAVE: {exc}", exc_info=True)
+                    raise
+        else:
+            _logger.info("[TRACE_DEBUG] Skipping message insertion for existing session (idempotency)")
         async with self._op_lock:
             conn = self._conn
@@ -904,7 +931,11 @@ class NativeLibsqlTraceManager(TraceStorage):
         if isinstance(event, LMCAISEvent):
             call_records = None
             if getattr(event, "call_records", None):
-                call_records = [asdict(record) for record in event.call_records]
+                # Handle both dataclass instances and dicts (from deserialization)
+                call_records = [
+                    asdict(record) if not isinstance(record, dict) else record
+                    for record in event.call_records
+                ]
             payload.update(
                 {
                     "event_type": "cais",

synth_ai/tracing_v3/utils.py CHANGED Viewed

@@ -10,7 +10,7 @@ from typing import Any
 def iso_now() -> str:
-    """Get current UTC time as ISO format string."""
+    """Get current timezone.utc time as ISO format string."""
     return datetime.now(UTC).isoformat()

synth_ai/tui/__init__.py ADDED Viewed

@@ -0,0 +1,5 @@
+"""Text User Interface utilities for synth-ai."""
+from .dashboard import main
+__all__ = ["main"]

synth_ai/tui/__main__.py ADDED Viewed

@@ -0,0 +1,13 @@
+#!/usr/bin/env python3
+"""
+Entry point for Synth AI TUI dashboard.
+Usage:
+    python -m synth_ai.tui
+    python -m synth_ai.tui --url sqlite+aiosqlite:///path/to/db
+"""
+from .dashboard import main
+if __name__ == "__main__":
+    main()

synth_ai/tui/cli/__init__.py ADDED Viewed

@@ -0,0 +1 @@
+"""Command Line Interface tools for synth-ai."""

synth_ai/tui/cli/query_experiments.py ADDED Viewed

@@ -0,0 +1,164 @@
+#!/usr/bin/env python3
+"""
+Query experiments and sessions from Turso/sqld using v3 tracing.
+"""
+import argparse
+import asyncio
+from synth_ai.tracing_v3.turso import NativeLibsqlTraceManager
+async def list_experiments(db_url: str):
+    """List all experiments in the database."""
+    db = NativeLibsqlTraceManager(db_url)
+    await db.initialize()
+    try:
+        df = await db.query_traces("""
+            SELECT
+                e.experiment_id,
+                e.name,
+                e.description,
+                e.created_at,
+                COUNT(DISTINCT st.session_id) as num_sessions,
+                COUNT(DISTINCT ev.id) as num_events,
+                SUM(CASE WHEN ev.event_type = 'cais' THEN ev.cost_usd ELSE 0 END) / 100.0 as total_cost,
+                SUM(CASE WHEN ev.event_type = 'cais' THEN ev.total_tokens ELSE 0 END) as total_tokens
+            FROM experiments e
+            LEFT JOIN session_traces st ON e.experiment_id = st.experiment_id
+            LEFT JOIN events ev ON st.session_id = ev.session_id
+            GROUP BY e.experiment_id, e.name, e.description, e.created_at
+            ORDER BY e.created_at DESC
+        """)
+        if df.empty:
+            print("No experiments found in database.")
+            return
+        print(f"\n{'=' * 100}")
+        print(f"{'Experiments in ' + db_url:^100}")
+        print(f"{'=' * 100}\n")
+        for _, row in df.iterrows():
+            print(f"🧪 {row['name']} (id: {row['experiment_id'][:8]}...)")
+            print(f"   Created: {row['created_at']}")
+            print(f"   Description: {row['description']}")
+            print(f"   Sessions: {row['num_sessions']}")
+            print(f"   Events: {row['num_events']:,}")
+            if row["total_cost"] and row["total_cost"] > 0:
+                print(f"   Cost: ${row['total_cost']:.4f}")
+            if row["total_tokens"] and row["total_tokens"] > 0:
+                print(f"   Tokens: {int(row['total_tokens']):,}")
+            print()
+    finally:
+        await db.close()
+async def show_experiment_details(db_url: str, experiment_id: str):
+    """Show detailed information about a specific experiment."""
+    db = NativeLibsqlTraceManager(db_url)
+    await db.initialize()
+    try:
+        # Get experiment info
+        exp_df = await db.query_traces(
+            """
+            SELECT * FROM experiments WHERE experiment_id LIKE :exp_id
+        """,
+            {"exp_id": f"{experiment_id}%"},
+        )
+        if exp_df.empty:
+            print(f"No experiment found matching ID: {experiment_id}")
+            return
+        exp = exp_df.iloc[0]
+        print(f"\n{'=' * 100}")
+        print(f"Experiment: {exp['name']} ({exp['experiment_id']})")
+        print(f"{'=' * 100}\n")
+        # Get session statistics
+        sessions_df = await db.get_sessions_by_experiment(exp["experiment_id"])
+        if sessions_df:
+            print(f"Sessions: {len(sessions_df)}")
+            # Get aggregated stats
+            stats_df = await db.query_traces(
+                """
+                SELECT
+                    COUNT(DISTINCT ev.id) as total_events,
+                    COUNT(DISTINCT m.id) as total_messages,
+                    SUM(CASE WHEN ev.event_type = 'cais' THEN ev.cost_usd ELSE 0 END) / 100.0 as total_cost,
+                    SUM(CASE WHEN ev.event_type = 'cais' THEN ev.total_tokens ELSE 0 END) as total_tokens
+                FROM session_traces st
+                LEFT JOIN events ev ON st.session_id = ev.session_id
+                LEFT JOIN messages m ON st.session_id = m.session_id
+                WHERE st.experiment_id = :exp_id
+            """,
+                {"exp_id": exp["experiment_id"]},
+            )
+            if not stats_df.empty:
+                stats = stats_df.iloc[0]
+                print(f"Total events: {int(stats['total_events']):,}")
+                print(f"Total messages: {int(stats['total_messages']):,}")
+                print(f"Total cost: ${stats['total_cost']:.4f}")
+                print(f"Total tokens: {int(stats['total_tokens']):,}")
+            # Show session list
+            print("\nSession list:")
+            for sess in sessions_df:
+                print(f"  - {sess['session_id']} ({sess['created_at']})")
+                print(
+                    f"    Timesteps: {sess['num_timesteps']}, Events: {sess['num_events']}, Messages: {sess['num_messages']}"
+                )
+    finally:
+        await db.close()
+async def show_model_usage(db_url: str, model_name: str | None = None):
+    """Show model usage statistics."""
+    db = NativeLibsqlTraceManager(db_url)
+    await db.initialize()
+    try:
+        df = await db.get_model_usage(model_name=model_name)
+        if df.empty:
+            print("No model usage data found.")
+            return
+        print(f"\n{'=' * 100}")
+        print(f"{'Model Usage Statistics':^100}")
+        print(f"{'=' * 100}\n")
+        print(df.to_string(index=False))
+    finally:
+        await db.close()
+async def main():
+    parser = argparse.ArgumentParser(description="Query experiments from Turso/sqld (v3)")
+    parser.add_argument(
+        "-u", "--url", default="sqlite+libsql://http://127.0.0.1:8080", help="Turso database URL"
+    )
+    parser.add_argument(
+        "-e", "--experiment", help="Show details for specific experiment ID (can be partial)"
+    )
+    parser.add_argument("-m", "--model", help="Show usage for specific model")
+    parser.add_argument("--usage", action="store_true", help="Show model usage statistics")
+    args = parser.parse_args()
+    if args.usage or args.model:
+        await show_model_usage(args.url, args.model)
+    elif args.experiment:
+        await show_experiment_details(args.url, args.experiment)
+    else:
+        await list_experiments(args.url)
+if __name__ == "__main__":
+    asyncio.run(main())

synth_ai/tui/cli/query_experiments_v3.py ADDED Viewed

@@ -0,0 +1,164 @@
+#!/usr/bin/env python3
+"""
+Query experiments and sessions from Turso/sqld using v3 tracing.
+"""
+import argparse
+import asyncio
+from synth_ai.tracing_v3.turso import NativeLibsqlTraceManager
+async def list_experiments(db_url: str):
+    """List all experiments in the database."""
+    db = NativeLibsqlTraceManager(db_url)
+    await db.initialize()
+    try:
+        df = await db.query_traces("""
+            SELECT
+                e.experiment_id,
+                e.name,
+                e.description,
+                e.created_at,
+                COUNT(DISTINCT st.session_id) as num_sessions,
+                COUNT(DISTINCT ev.id) as num_events,
+                SUM(CASE WHEN ev.event_type = 'cais' THEN ev.cost_usd ELSE 0 END) / 100.0 as total_cost,
+                SUM(CASE WHEN ev.event_type = 'cais' THEN ev.total_tokens ELSE 0 END) as total_tokens
+            FROM experiments e
+            LEFT JOIN session_traces st ON e.experiment_id = st.experiment_id
+            LEFT JOIN events ev ON st.session_id = ev.session_id
+            GROUP BY e.experiment_id, e.name, e.description, e.created_at
+            ORDER BY e.created_at DESC
+        """)
+        if df.empty:
+            print("No experiments found in database.")
+            return
+        print(f"\n{'=' * 100}")
+        print(f"{'Experiments in ' + db_url:^100}")
+        print(f"{'=' * 100}\n")
+        for _, row in df.iterrows():
+            print(f"🧪 {row['name']} (id: {row['experiment_id'][:8]}...)")
+            print(f"   Created: {row['created_at']}")
+            print(f"   Description: {row['description']}")
+            print(f"   Sessions: {row['num_sessions']}")
+            print(f"   Events: {row['num_events']:,}")
+            if row["total_cost"] and row["total_cost"] > 0:
+                print(f"   Cost: ${row['total_cost']:.4f}")
+            if row["total_tokens"] and row["total_tokens"] > 0:
+                print(f"   Tokens: {int(row['total_tokens']):,}")
+            print()
+    finally:
+        await db.close()
+async def show_experiment_details(db_url: str, experiment_id: str):
+    """Show detailed information about a specific experiment."""
+    db = NativeLibsqlTraceManager(db_url)
+    await db.initialize()
+    try:
+        # Get experiment info
+        exp_df = await db.query_traces(
+            """
+            SELECT * FROM experiments WHERE experiment_id LIKE :exp_id
+        """,
+            {"exp_id": f"{experiment_id}%"},
+        )
+        if exp_df.empty:
+            print(f"No experiment found matching ID: {experiment_id}")
+            return
+        exp = exp_df.iloc[0]
+        print(f"\n{'=' * 100}")
+        print(f"Experiment: {exp['name']} ({exp['experiment_id']})")
+        print(f"{'=' * 100}\n")
+        # Get session statistics
+        sessions_df = await db.get_sessions_by_experiment(exp["experiment_id"])
+        if sessions_df:
+            print(f"Sessions: {len(sessions_df)}")
+            # Get aggregated stats
+            stats_df = await db.query_traces(
+                """
+                SELECT
+                    COUNT(DISTINCT ev.id) as total_events,
+                    COUNT(DISTINCT m.id) as total_messages,
+                    SUM(CASE WHEN ev.event_type = 'cais' THEN ev.cost_usd ELSE 0 END) / 100.0 as total_cost,
+                    SUM(CASE WHEN ev.event_type = 'cais' THEN ev.total_tokens ELSE 0 END) as total_tokens
+                FROM session_traces st
+                LEFT JOIN events ev ON st.session_id = ev.session_id
+                LEFT JOIN messages m ON st.session_id = m.session_id
+                WHERE st.experiment_id = :exp_id
+            """,
+                {"exp_id": exp["experiment_id"]},
+            )
+            if not stats_df.empty:
+                stats = stats_df.iloc[0]
+                print(f"Total events: {int(stats['total_events']):,}")
+                print(f"Total messages: {int(stats['total_messages']):,}")
+                print(f"Total cost: ${stats['total_cost']:.4f}")
+                print(f"Total tokens: {int(stats['total_tokens']):,}")
+            # Show session list
+            print("\nSession list:")
+            for sess in sessions_df:
+                print(f"  - {sess['session_id']} ({sess['created_at']})")
+                print(
+                    f"    Timesteps: {sess['num_timesteps']}, Events: {sess['num_events']}, Messages: {sess['num_messages']}"
+                )
+    finally:
+        await db.close()
+async def show_model_usage(db_url: str, model_name: str | None = None):
+    """Show model usage statistics."""
+    db = NativeLibsqlTraceManager(db_url)
+    await db.initialize()
+    try:
+        df = await db.get_model_usage(model_name=model_name)
+        if df.empty:
+            print("No model usage data found.")
+            return
+        print(f"\n{'=' * 100}")
+        print(f"{'Model Usage Statistics':^100}")
+        print(f"{'=' * 100}\n")
+        print(df.to_string(index=False))
+    finally:
+        await db.close()
+async def main():
+    parser = argparse.ArgumentParser(description="Query experiments from Turso/sqld (v3)")
+    parser.add_argument(
+        "-u", "--url", default="sqlite+libsql://http://127.0.0.1:8080", help="Turso database URL"
+    )
+    parser.add_argument(
+        "-e", "--experiment", help="Show details for specific experiment ID (can be partial)"
+    )
+    parser.add_argument("-m", "--model", help="Show usage for specific model")
+    parser.add_argument("--usage", action="store_true", help="Show model usage statistics")
+    args = parser.parse_args()
+    if args.usage or args.model:
+        await show_model_usage(args.url, args.model)
+    elif args.experiment:
+        await show_experiment_details(args.url, args.experiment)
+    else:
+        await list_experiments(args.url)
+# Run the async CLI entry point only when this file is executed as a script.
+if __name__ == "__main__":
+    asyncio.run(main())

synth-ai 0.2.13.dev2__py3-none-any.whl → 0.2.16__py3-none-any.whl

Potentially problematic release.

synth-ai 0.2.13.dev2__py3-none-any.whl → 0.2.16__py3-none-any.whl