synth-ai 0.2.8.dev11__tar.gz → 0.2.8.dev13__tar.gz
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- {synth_ai-0.2.8.dev11/synth_ai.egg-info → synth_ai-0.2.8.dev13}/PKG-INFO +3 -2
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/pyproject.toml +4 -2
- synth_ai-0.2.8.dev13/synth_ai/api/train/__init__.py +5 -0
- synth_ai-0.2.8.dev13/synth_ai/api/train/builders.py +165 -0
- synth_ai-0.2.8.dev13/synth_ai/api/train/cli.py +429 -0
- synth_ai-0.2.8.dev13/synth_ai/api/train/config_finder.py +120 -0
- synth_ai-0.2.8.dev13/synth_ai/api/train/env_resolver.py +302 -0
- synth_ai-0.2.8.dev13/synth_ai/api/train/pollers.py +66 -0
- synth_ai-0.2.8.dev13/synth_ai/api/train/task_app.py +128 -0
- synth_ai-0.2.8.dev13/synth_ai/api/train/utils.py +232 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/cli/__init__.py +23 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/cli/rl_demo.py +2 -2
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/cli/root.py +2 -1
- synth_ai-0.2.8.dev13/synth_ai/cli/task_apps.py +520 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/demos/demo_task_apps/math/modal_task_app.py +31 -25
- synth_ai-0.2.8.dev13/synth_ai/task/__init__.py +103 -0
- synth_ai-0.2.8.dev13/synth_ai/task/apps/__init__.py +88 -0
- synth_ai-0.2.8.dev13/synth_ai/task/apps/grpo_crafter.py +438 -0
- synth_ai-0.2.8.dev13/synth_ai/task/apps/math_single_step.py +852 -0
- synth_ai-0.2.8.dev13/synth_ai/task/auth.py +132 -0
- synth_ai-0.2.8.dev13/synth_ai/task/client.py +148 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/task/contracts.py +29 -14
- synth_ai-0.2.8.dev13/synth_ai/task/datasets.py +105 -0
- synth_ai-0.2.8.dev13/synth_ai/task/errors.py +49 -0
- synth_ai-0.2.8.dev13/synth_ai/task/json.py +77 -0
- synth_ai-0.2.8.dev13/synth_ai/task/proxy.py +258 -0
- synth_ai-0.2.8.dev13/synth_ai/task/rubrics.py +212 -0
- synth_ai-0.2.8.dev13/synth_ai/task/server.py +398 -0
- synth_ai-0.2.8.dev13/synth_ai/task/tracing_utils.py +79 -0
- synth_ai-0.2.8.dev13/synth_ai/task/vendors.py +61 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/tracing_v3/session_tracer.py +13 -5
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/tracing_v3/storage/base.py +10 -12
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/tracing_v3/turso/manager.py +20 -6
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13/synth_ai.egg-info}/PKG-INFO +3 -2
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai.egg-info/SOURCES.txt +22 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai.egg-info/requires.txt +3 -1
- synth_ai-0.2.8.dev11/synth_ai/task/__init__.py +0 -10
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/LICENSE +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/MANIFEST.in +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/README.md +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/setup.cfg +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/__init__.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/__main__.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/cli/balance.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/cli/calc.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/cli/demo.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/cli/legacy_root_backup.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/cli/man.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/cli/recent.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/cli/status.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/cli/traces.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/cli/watch.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/compound/cais.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/config/base_url.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/core/experiment.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/core/system.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/demos/core/__init__.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/demos/core/cli.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/demos/demo_task_apps/__init__.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/demos/demo_task_apps/core.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/demos/demo_task_apps/math/__init__.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/demos/demo_task_apps/math/_common.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/demos/demo_task_apps/math/app.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/demos/demo_task_apps/math/config.toml +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/demos/demo_task_apps/math/deploy_modal.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/demos/demo_task_apps/math/deploy_task_app.sh +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/__init__.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/environment/__init__.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/environment/artifacts/__init__.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/environment/artifacts/base.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/environment/core.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/environment/db/__init__.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/environment/db/sqlite.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/environment/registry.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/environment/resources/sqlite.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/environment/results.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/environment/rewards/__init__.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/environment/rewards/core.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/environment/shared_engine.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/environment/tools/__init__.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/examples/__init__.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/examples/bandit/__init__.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/examples/bandit/engine.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/examples/bandit/environment.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/examples/bandit/taskset.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/examples/crafter_classic/__init__.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/examples/crafter_classic/agent_demos/analyze_semantic_words_markdown.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/examples/crafter_classic/agent_demos/crafter_comprehensive_evaluation.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/examples/crafter_classic/agent_demos/crafter_evaluation_browser.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/examples/crafter_classic/agent_demos/crafter_evaluation_config.toml +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/examples/crafter_classic/agent_demos/crafter_evaluation_framework.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/examples/crafter_classic/agent_demos/crafter_modal_ft/crafter_synth_config.toml +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/examples/crafter_classic/agent_demos/crafter_modal_ft/filter_config_modal.toml +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/examples/crafter_classic/agent_demos/crafter_modal_ft/filter_traces_sft_turso.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/examples/crafter_classic/agent_demos/crafter_modal_ft/kick_off_ft_modal.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/examples/crafter_classic/agent_demos/crafter_modal_ft/old/analyze_action_results.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/examples/crafter_classic/agent_demos/crafter_modal_ft/old/analyze_agent_actions.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/examples/crafter_classic/agent_demos/crafter_modal_ft/old/analyze_latest_run.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/examples/crafter_classic/agent_demos/crafter_modal_ft/old/analyze_lm_traces.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/examples/crafter_classic/agent_demos/crafter_modal_ft/old/analyze_no_rewards.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/examples/crafter_classic/agent_demos/crafter_modal_ft/old/analyze_trace_issue.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/examples/crafter_classic/agent_demos/crafter_modal_ft/old/check_db_schema.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/examples/crafter_classic/agent_demos/crafter_modal_ft/old/check_latest_results.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/examples/crafter_classic/agent_demos/crafter_modal_ft/old/debug_agent_responses.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/examples/crafter_classic/agent_demos/crafter_modal_ft/old/quick_trace_check.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/examples/crafter_classic/agent_demos/crafter_openai_ft/compare_experiments.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/examples/crafter_classic/agent_demos/crafter_openai_ft/filter_traces_sft_turso.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/examples/crafter_classic/agent_demos/crafter_openai_ft/kick_off_ft_oai.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/examples/crafter_classic/agent_demos/crafter_openai_ft/multi_model_config.toml +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/examples/crafter_classic/agent_demos/crafter_openai_ft/old/analyze_enhanced_hooks.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/examples/crafter_classic/agent_demos/crafter_openai_ft/old/analyze_hook_events.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/examples/crafter_classic/agent_demos/crafter_openai_ft/old/analyze_hook_results.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/examples/crafter_classic/agent_demos/crafter_openai_ft/old/check_hook_storage.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/examples/crafter_classic/agent_demos/crafter_openai_ft/old/check_seeds.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/examples/crafter_classic/agent_demos/crafter_openai_ft/old/compare_seed_performance.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/examples/crafter_classic/agent_demos/crafter_openai_ft/old/custom_eval_pipelines.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/examples/crafter_classic/agent_demos/crafter_openai_ft/old/plot_hook_frequency.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/examples/crafter_classic/agent_demos/crafter_openai_ft/old/seed_analysis_summary.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/examples/crafter_classic/agent_demos/crafter_openai_ft/run_rollouts_for_models_and_compare_v3.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/examples/crafter_classic/agent_demos/crafter_quick_evaluation.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/examples/crafter_classic/agent_demos/crafter_react_agent.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/examples/crafter_classic/agent_demos/crafter_trace_evaluation.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/examples/crafter_classic/agent_demos/example_v3_usage.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/examples/crafter_classic/agent_demos/old/compare_traces.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/examples/crafter_classic/agent_demos/old/crafter_comprehensive_evaluation.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/examples/crafter_classic/agent_demos/old/crafter_env_serialization.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/examples/crafter_classic/agent_demos/old/crafter_evaluation_browser.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/examples/crafter_classic/agent_demos/old/crafter_quick_evaluation.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/examples/crafter_classic/agent_demos/old/crafter_trace_evaluation.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/examples/crafter_classic/agent_demos/old/debug_player_loss.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/examples/crafter_classic/agent_demos/old/diagnose_service.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/examples/crafter_classic/agent_demos/old/diagnose_slowness.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/examples/crafter_classic/agent_demos/old/eval_by_difficulty.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/examples/crafter_classic/agent_demos/old/eval_example.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/examples/crafter_classic/agent_demos/old/explore_saved_states.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/examples/crafter_classic/agent_demos/old/filter_traces_sft.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/examples/crafter_classic/agent_demos/old/filter_traces_sft_OLD.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/examples/crafter_classic/agent_demos/old/generate_ft_data_gemini.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/examples/crafter_classic/agent_demos/old/generate_ft_data_modal.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/examples/crafter_classic/agent_demos/old/generate_ft_metadata.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/examples/crafter_classic/agent_demos/old/kick_off_ft_gemini.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/examples/crafter_classic/agent_demos/old/kick_off_ft_modal.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/examples/crafter_classic/agent_demos/old/prepare_vertex_ft.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/examples/crafter_classic/agent_demos/old/profile_env_slowness.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/examples/crafter_classic/agent_demos/old/replicate_issue.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/examples/crafter_classic/agent_demos/old/run_and_eval.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/examples/crafter_classic/agent_demos/old/run_comparison.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/examples/crafter_classic/agent_demos/old/run_qwen_rollouts.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/examples/crafter_classic/agent_demos/old/trace_eval_OLD.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/examples/crafter_classic/agent_demos/old/validate_openai_format.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/examples/crafter_classic/config_logging.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/examples/crafter_classic/debug_translation.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/examples/crafter_classic/engine.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/examples/crafter_classic/engine_deterministic_patch.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/examples/crafter_classic/engine_helpers/action_map.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/examples/crafter_classic/engine_helpers/serialization.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/examples/crafter_classic/engine_serialization_patch_v3.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/examples/crafter_classic/environment.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/examples/crafter_classic/taskset.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/examples/crafter_classic/trace_hooks_v3.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/examples/crafter_classic/world_config_patch_simple.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/examples/crafter_custom/__init__.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/examples/crafter_custom/agent_demos/__init__.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/examples/crafter_custom/agent_demos/trace_eval.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/examples/crafter_custom/crafter/__init__.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/examples/crafter_custom/crafter/config.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/examples/crafter_custom/crafter/constants.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/examples/crafter_custom/crafter/engine.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/examples/crafter_custom/crafter/env.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/examples/crafter_custom/crafter/objects.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/examples/crafter_custom/crafter/recorder.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/examples/crafter_custom/crafter/worldgen.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/examples/crafter_custom/dataset_builder.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/examples/crafter_custom/environment.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/examples/crafter_custom/old/analyze_diamond_issue.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/examples/crafter_custom/old/analyze_diamond_spawning.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/examples/crafter_custom/old/compare_worlds.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/examples/crafter_custom/old/dataset_stats.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/examples/crafter_custom/old/diamond_spawning_summary.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/examples/crafter_custom/old/example_dataset_usage.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/examples/crafter_custom/run_dataset.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/examples/enron/art_helpers/email_search_tools.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/examples/enron/art_helpers/local_email_db.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/examples/enron/art_helpers/types_enron.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/examples/enron/engine.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/examples/enron/environment.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/examples/enron/taskset.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/examples/enron/units/keyword_stats.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/examples/minigrid/__init__.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/examples/minigrid/agent_demos/minigrid_evaluation_framework.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/examples/minigrid/agent_demos/minigrid_quick_evaluation.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/examples/minigrid/agent_demos/minigrid_react_agent.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/examples/minigrid/agent_demos/minigrid_trace_evaluation.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/examples/minigrid/engine.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/examples/minigrid/environment.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/examples/minigrid/environment_mapping.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/examples/minigrid/puzzle_loader.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/examples/minigrid/taskset.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/examples/nethack/__init__.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/examples/nethack/achievements.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/examples/nethack/agent_demos/nethack_evaluation_framework.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/examples/nethack/agent_demos/nethack_quick_evaluation.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/examples/nethack/agent_demos/nethack_react_agent.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/examples/nethack/engine.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/examples/nethack/environment.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/examples/nethack/helpers/__init__.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/examples/nethack/helpers/action_mapping.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/examples/nethack/helpers/nle_wrapper.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/examples/nethack/helpers/observation_utils.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/examples/nethack/helpers/recording_wrapper.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/examples/nethack/helpers/trajectory_recorder.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/examples/nethack/helpers/visualization/replay_viewer.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/examples/nethack/helpers/visualization/visualizer.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/examples/nethack/taskset.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/examples/red/__init__.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/examples/red/agent_demos/__init__.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/examples/red/config_logging.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/examples/red/engine.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/examples/red/engine_helpers/__init__.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/examples/red/engine_helpers/memory_map.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/examples/red/engine_helpers/reward_components.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/examples/red/engine_helpers/reward_library/__init__.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/examples/red/engine_helpers/reward_library/adaptive_rewards.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/examples/red/engine_helpers/reward_library/battle_rewards.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/examples/red/engine_helpers/reward_library/composite_rewards.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/examples/red/engine_helpers/reward_library/economy_rewards.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/examples/red/engine_helpers/reward_library/efficiency_rewards.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/examples/red/engine_helpers/reward_library/exploration_rewards.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/examples/red/engine_helpers/reward_library/novelty_rewards.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/examples/red/engine_helpers/reward_library/pallet_town_rewards.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/examples/red/engine_helpers/reward_library/pokemon_rewards.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/examples/red/engine_helpers/reward_library/social_rewards.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/examples/red/engine_helpers/reward_library/story_rewards.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/examples/red/engine_helpers/screen_analysis.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/examples/red/engine_helpers/state_extraction.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/examples/red/environment.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/examples/red/taskset.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/examples/red/units/__init__.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/examples/sokoban/__init__.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/examples/sokoban/agent_demos/sokoban_full_eval.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/examples/sokoban/engine.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/examples/sokoban/engine_helpers/__init__.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/examples/sokoban/engine_helpers/room_utils.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/examples/sokoban/engine_helpers/vendored/__init__.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/examples/sokoban/engine_helpers/vendored/envs/__init__.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/examples/sokoban/engine_helpers/vendored/envs/boxoban_env.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/examples/sokoban/engine_helpers/vendored/envs/render_utils.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/examples/sokoban/engine_helpers/vendored/envs/room_utils.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/examples/sokoban/engine_helpers/vendored/envs/sokoban_env.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/examples/sokoban/engine_helpers/vendored/envs/sokoban_env_fixed_targets.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/examples/sokoban/engine_helpers/vendored/envs/sokoban_env_pull.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/examples/sokoban/engine_helpers/vendored/envs/sokoban_env_two_player.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/examples/sokoban/engine_helpers/vendored/envs/sokoban_env_variations.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/examples/sokoban/environment.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/examples/sokoban/generate_verified_puzzles.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/examples/sokoban/puzzle_loader.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/examples/sokoban/taskset.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/examples/sokoban/units/astar_common.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/examples/tictactoe/__init__.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/examples/tictactoe/engine.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/examples/tictactoe/environment.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/examples/tictactoe/taskset.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/examples/verilog/__init__.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/examples/verilog/engine.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/examples/verilog/environment.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/examples/verilog/taskset.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/examples/wordle/__init__.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/examples/wordle/engine.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/examples/wordle/environment.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/examples/wordle/helpers/generate_instances_wordfreq.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/examples/wordle/taskset.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/reproducibility/core.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/reproducibility/helpers.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/reproducibility/tree.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/service/app.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/service/core_routes.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/service/external_registry.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/service/registry.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/stateful/__init__.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/stateful/core.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/stateful/engine.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/stateful/state.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/tasks/api.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/tasks/core.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/tasks/filters.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/tasks/utils.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/v0_observability/history.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/environments/v0_observability/log.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/evals/base.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/experimental/synth_oss.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/handshake.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/http.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/http_client.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/inference/__init__.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/inference/client.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/install_sqld.sh +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/jobs/client.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/learning/__init__.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/learning/client.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/learning/config.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/learning/constants.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/learning/core.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/learning/filtering.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/learning/ft_client.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/learning/gateway.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/learning/health.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/learning/jobs.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/learning/offline/dpo.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/learning/offline/providers.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/learning/offline/sft.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/learning/offline/shared.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/learning/online/grpo.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/learning/online/irft.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/learning/prompts/banking77_injection_eval.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/learning/prompts/gepa.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/learning/prompts/hello_world_in_context_injection_ex.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/learning/prompts/mipro.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/learning/prompts/random_search.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/learning/prompts/run_mipro_banking77.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/learning/prompts/run_random_search_banking77.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/learning/rl_client.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/learning/sse.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/learning/validators.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/lm/__init__.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/lm/caching/__init__.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/lm/caching/constants.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/lm/caching/dbs.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/lm/caching/ephemeral.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/lm/caching/handler.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/lm/caching/initialize.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/lm/caching/persistent.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/lm/config.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/lm/constants.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/lm/core/__init__.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/lm/core/all.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/lm/core/exceptions.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/lm/core/main.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/lm/core/main_v3.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/lm/core/synth_models.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/lm/core/vendor_clients.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/lm/cost/__init__.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/lm/cost/monitor.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/lm/cost/statefulness.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/lm/injection.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/lm/overrides.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/lm/provider_support/__init__.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/lm/provider_support/anthropic.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/lm/provider_support/openai.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/lm/provider_support/suppress_logging.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/lm/structured_outputs/__init__.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/lm/structured_outputs/handler.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/lm/structured_outputs/inject.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/lm/structured_outputs/rehabilitate.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/lm/tools/__init__.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/lm/tools/base.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/lm/unified_interface.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/lm/vendors/__init__.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/lm/vendors/base.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/lm/vendors/core/__init__.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/lm/vendors/core/anthropic_api.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/lm/vendors/core/gemini_api.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/lm/vendors/core/mistral_api.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/lm/vendors/core/openai_api.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/lm/vendors/core/synth_dev_api.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/lm/vendors/local/__init__.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/lm/vendors/local/ollama.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/lm/vendors/openai_standard.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/lm/vendors/openai_standard_responses.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/lm/vendors/retries.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/lm/vendors/supported/__init__.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/lm/vendors/supported/custom_endpoint.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/lm/vendors/supported/deepseek.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/lm/vendors/supported/grok.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/lm/vendors/supported/groq.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/lm/vendors/supported/ollama.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/lm/vendors/supported/openrouter.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/lm/vendors/supported/together.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/lm/vendors/synth_client.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/lm/warmup.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/rl/__init__.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/rl/contracts.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/rl/env_keys.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/rl/secrets.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/scripts/verify_rewards.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/task/health.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/task/validators.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/tracing/__init__.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/tracing_v1/__init__.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/tracing_v3/__init__.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/tracing_v3/abstractions.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/tracing_v3/config.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/tracing_v3/db_config.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/tracing_v3/decorators.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/tracing_v3/examples/basic_usage.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/tracing_v3/hooks.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/tracing_v3/llm_call_record_helpers.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/tracing_v3/lm_call_record_abstractions.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/tracing_v3/migration_helper.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/tracing_v3/replica_sync.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/tracing_v3/storage/__init__.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/tracing_v3/storage/config.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/tracing_v3/storage/exceptions.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/tracing_v3/storage/factory.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/tracing_v3/storage/types.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/tracing_v3/storage/utils.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/tracing_v3/turso/__init__.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/tracing_v3/turso/daemon.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/tracing_v3/turso/models.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/tracing_v3/utils.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/v0/tracing/__init__.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/v0/tracing/abstractions.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/v0/tracing/base_client.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/v0/tracing/client_manager.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/v0/tracing/config.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/v0/tracing/context.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/v0/tracing/decorators.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/v0/tracing/events/__init__.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/v0/tracing/events/manage.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/v0/tracing/events/scope.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/v0/tracing/events/store.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/v0/tracing/immediate_client.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/v0/tracing/local.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/v0/tracing/log_client_base.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/v0/tracing/retry_queue.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/v0/tracing/trackers.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/v0/tracing/upload.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/v0/tracing/utils.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/v0/tracing_v1/__init__.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/v0/tracing_v1/abstractions.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/v0/tracing_v1/base_client.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/v0/tracing_v1/client_manager.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/v0/tracing_v1/config.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/v0/tracing_v1/context.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/v0/tracing_v1/decorators.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/v0/tracing_v1/events/__init__.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/v0/tracing_v1/events/manage.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/v0/tracing_v1/events/scope.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/v0/tracing_v1/events/store.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/v0/tracing_v1/immediate_client.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/v0/tracing_v1/local.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/v0/tracing_v1/log_client_base.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/v0/tracing_v1/retry_queue.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/v0/tracing_v1/trackers.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/v0/tracing_v1/upload.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/v0/tracing_v1/utils.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai/zyk/__init__.py +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai.egg-info/dependency_links.txt +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai.egg-info/entry_points.txt +0 -0
- {synth_ai-0.2.8.dev11 → synth_ai-0.2.8.dev13}/synth_ai.egg-info/top_level.txt +0 -0
|
@@ -1,6 +1,6 @@
|
|
|
1
1
|
Metadata-Version: 2.4
|
|
2
2
|
Name: synth-ai
|
|
3
|
-
Version: 0.2.8.dev11
|
|
3
|
+
Version: 0.2.8.dev13
|
|
4
4
|
Summary: RL as a service SDK - Core AI functionality and tracing
|
|
5
5
|
Author-email: Synth AI <josh@usesynth.ai>
|
|
6
6
|
License-Expression: MIT
|
|
@@ -35,7 +35,6 @@ Requires-Dist: numpy>=2.2.3
|
|
|
35
35
|
Requires-Dist: networkx>=3.4.2
|
|
36
36
|
Requires-Dist: redis>=6.2.0
|
|
37
37
|
Requires-Dist: duckdb>=1.0.0
|
|
38
|
-
Requires-Dist: pandas>=2.2.3
|
|
39
38
|
Requires-Dist: ty>=0.0.1a5
|
|
40
39
|
Requires-Dist: toml>=0.10.2
|
|
41
40
|
Requires-Dist: sqlalchemy>=2.0.42
|
|
@@ -70,6 +69,8 @@ Requires-Dist: datasets>=4.0.0; extra == "research"
|
|
|
70
69
|
Provides-Extra: all
|
|
71
70
|
Requires-Dist: crafter>=1.8.3; extra == "all"
|
|
72
71
|
Requires-Dist: datasets>=4.0.0; extra == "all"
|
|
72
|
+
Provides-Extra: analytics
|
|
73
|
+
Requires-Dist: pandas>=2.2.3; extra == "analytics"
|
|
73
74
|
Dynamic: license-file
|
|
74
75
|
|
|
75
76
|
# Synth-AI
|
|
@@ -1,6 +1,6 @@
|
|
|
1
1
|
[project]
|
|
2
2
|
name = "synth-ai"
|
|
3
|
-
version = "0.2.8.dev11"
|
|
3
|
+
version = "0.2.8.dev13"
|
|
4
4
|
description = "RL as a service SDK - Core AI functionality and tracing"
|
|
5
5
|
authors = [{name = "Synth AI", email = "josh@usesynth.ai"}]
|
|
6
6
|
license = "MIT"
|
|
@@ -37,7 +37,6 @@ dependencies = [
|
|
|
37
37
|
"networkx>=3.4.2",
|
|
38
38
|
"redis>=6.2.0",
|
|
39
39
|
"duckdb>=1.0.0",
|
|
40
|
-
"pandas>=2.2.3",
|
|
41
40
|
"ty>=0.0.1a5", # Type annotations helper
|
|
42
41
|
"toml>=0.10.2",
|
|
43
42
|
"sqlalchemy>=2.0.42",
|
|
@@ -84,6 +83,9 @@ all = [
|
|
|
84
83
|
"crafter>=1.8.3",
|
|
85
84
|
"datasets>=4.0.0",
|
|
86
85
|
]
|
|
86
|
+
analytics = [
|
|
87
|
+
"pandas>=2.2.3",
|
|
88
|
+
]
|
|
87
89
|
|
|
88
90
|
[project.urls]
|
|
89
91
|
Homepage = "https://github.com/synth-laboratories/synth-ai"
|
|
@@ -0,0 +1,165 @@
|
|
|
1
|
+
from __future__ import annotations
|
|
2
|
+
|
|
3
|
+
from dataclasses import dataclass
|
|
4
|
+
from pathlib import Path
|
|
5
|
+
from typing import Any
|
|
6
|
+
|
|
7
|
+
import click
|
|
8
|
+
|
|
9
|
+
from .utils import ensure_api_base, load_toml, TrainError
|
|
10
|
+
|
|
11
|
+
|
|
12
|
+
@dataclass(slots=True)
|
|
13
|
+
class RLBuildResult:
|
|
14
|
+
payload: dict[str, Any]
|
|
15
|
+
task_url: str
|
|
16
|
+
idempotency: str | None
|
|
17
|
+
|
|
18
|
+
|
|
19
|
+
@dataclass(slots=True)
|
|
20
|
+
class SFTBuildResult:
|
|
21
|
+
payload: dict[str, Any]
|
|
22
|
+
train_file: Path
|
|
23
|
+
validation_file: Path | None
|
|
24
|
+
|
|
25
|
+
|
|
26
|
+
def build_rl_payload(
    *,
    config_path: Path,
    task_url: str,
    overrides: dict[str, Any],
    idempotency: str | None,
) -> RLBuildResult:
    """Assemble the job-creation payload for an RL training run.

    Args:
        config_path: TOML file read with ``load_toml``.
        task_url: Task app URL used when ``overrides`` does not supply one.
        overrides: Optional ``task_url``, ``model`` and ``backend`` entries
            that take precedence over the values found in the TOML.
        idempotency: Carried through unchanged onto the result.

    Returns:
        An ``RLBuildResult`` holding the payload and the effective task URL.

    Raises:
        click.ClickException: If no task URL can be determined, or if the
            configuration does not end up with exactly one of
            ``[model].source`` and ``[model].base``.
    """

    def _clean(value: Any) -> str:
        # Falsy values count as "not provided"; non-string TOML scalars are
        # stringified instead of failing on ``.strip()``.
        return str(value).strip() if value else ""

    # Shallow copy so the top-level write-back below always targets a plain
    # dict. NOTE(review): assumes ``load_toml`` returns a mapping -- confirm.
    data = dict(load_toml(config_path))
    services = data.get("services")
    if not isinstance(services, dict):
        services = {}
    model_cfg = data.get("model")
    if not isinstance(model_cfg, dict):
        model_cfg = {}

    # Precedence: explicit override, then the ``task_url`` argument, then the
    # TOML. Every candidate is stripped *before* selection so that a blank
    # value falls through to the next source instead of winning and then
    # collapsing to an empty URL.
    url_candidates = (overrides.get("task_url"), task_url, services.get("task_url"))
    final_task_url = next((url for url in map(_clean, url_candidates) if url), "")
    if not final_task_url:
        raise click.ClickException("Task app URL required (provide --task-url or set services.task_url in TOML)")

    # A model override always acts as the source and discards any TOML base.
    override_model = _clean(overrides.get("model"))
    if override_model:
        model_source, model_base = override_model, ""
    else:
        model_source = _clean(model_cfg.get("source"))
        model_base = _clean(model_cfg.get("base"))
    if bool(model_source) == bool(model_base):
        raise click.ClickException("Model section must specify exactly one of [model].source or [model].base")

    # Force TOML services.task_url to the effective endpoint to avoid split URLs.
    # ``services`` is either the table from the config or a fresh dict, so
    # these assignments cannot fail and need no exception guard.
    services["task_url"] = final_task_url
    data["services"] = services

    payload: dict[str, Any] = {
        "job_type": "rl",
        "compute": data.get("compute", {}),
        "data": {
            "endpoint_base_url": final_task_url.rstrip("/"),
            "config": data,
        },
        "tags": {"source": "train-cli"},
    }
    if model_source:
        payload["data"]["model"] = model_source
    if model_base:
        payload["data"]["base_model"] = model_base

    backend = overrides.get("backend")
    if backend:
        payload.setdefault("metadata", {})["backend_base_url"] = ensure_api_base(str(backend))

    return RLBuildResult(payload=payload, task_url=final_task_url, idempotency=idempotency)
|
|
78
|
+
|
|
79
|
+
|
|
80
|
+
def build_sft_payload(
    *,
    config_path: Path,
    dataset_override: Path | None,
) -> SFTBuildResult:
    """Assemble the job-creation payload for an offline SFT run.

    Args:
        config_path: TOML file read with ``load_toml``; relative dataset
            paths are interpreted against its parent directory.
        dataset_override: Dataset path that takes precedence over
            ``[job].data`` / ``[job].data_path`` when given.

    Returns:
        An ``SFTBuildResult`` with the payload, the resolved training file
        and the resolved validation file (``None`` when absent or missing).

    Raises:
        TrainError: If no dataset is configured or the dataset does not exist.
    """

    def _table(container: dict[str, Any], name: str) -> dict[str, Any]:
        # A section is used only when it really is a table; anything else
        # is treated as empty.
        value = container.get(name)
        return value if isinstance(value, dict) else {}

    def _anchored(raw: Any) -> Path:
        # Relative paths are resolved against the config file's directory.
        candidate = Path(raw)
        if not candidate.is_absolute():
            candidate = config_path.parent / candidate
        return candidate.resolve()

    data = load_toml(config_path)
    job_cfg = _table(data, "job")
    data_cfg = _table(data, "data")
    hp_cfg = _table(data, "hyperparameters")
    train_cfg = _table(data, "training")
    compute_cfg = _table(data, "compute")

    # Training dataset: CLI override first, then the two supported TOML keys.
    raw_dataset = dataset_override or job_cfg.get("data") or job_cfg.get("data_path")
    if not raw_dataset:
        raise TrainError("Dataset not specified; pass --dataset or set [job].data")
    dataset_path = _anchored(raw_dataset)
    if not dataset_path.exists():
        raise TrainError(f"Dataset not found: {dataset_path}")

    # Validation dataset is optional; a missing file only produces a warning.
    validation_file = None
    raw_validation = data_cfg.get("validation_path")
    if isinstance(raw_validation, str) and raw_validation:
        vpath = _anchored(raw_validation)
        if vpath.exists():
            validation_file = vpath
        else:
            click.echo(f"[WARN] Validation dataset {vpath} missing; continuing without validation")

    # Hyperparameters: n_epochs always present, the rest copied when configured.
    passthrough_keys = (
        "batch_size",
        "global_batch",
        "per_device_batch",
        "gradient_accumulation_steps",
        "sequence_length",
        "learning_rate",
        "warmup_ratio",
        "train_kind",
    )
    hp_block: dict[str, Any] = {"n_epochs": int(hp_cfg.get("n_epochs", 1))}
    hp_block.update((name, hp_cfg[name]) for name in passthrough_keys if name in hp_cfg)
    if isinstance(hp_cfg.get("parallelism"), dict):
        hp_block["parallelism"] = hp_cfg["parallelism"]

    training_block = {name: value for name, value in train_cfg.items() if name in ("mode", "use_qlora")}
    effective = {
        "compute": {name: compute_cfg[name] for name in ("gpu_type", "gpu_count", "nodes") if name in compute_cfg},
        "data": {"topology": _table(data_cfg, "topology")},
        "training": training_block,
    }

    # A [training.validation] table (even an empty one) switches on the
    # evaluation-related hyperparameters with their defaults.
    validation_cfg = train_cfg.get("validation")
    if isinstance(validation_cfg, dict):
        hp_block["evaluation_strategy"] = validation_cfg.get("evaluation_strategy", "steps")
        hp_block["eval_steps"] = int(validation_cfg.get("eval_steps", 0) or 0)
        hp_block["save_best_model_at_end"] = bool(validation_cfg.get("save_best_model_at_end", True))
        hp_block["metric_for_best_model"] = validation_cfg.get("metric_for_best_model", "val.loss")
        hp_block["greater_is_better"] = bool(validation_cfg.get("greater_is_better", False))
        training_block["validation"] = {"enabled": bool(validation_cfg.get("enabled", True))}

    return SFTBuildResult(
        payload={
            "model": job_cfg.get("model") or data.get("model"),
            "training_file_id": None,  # populated after upload
            "training_type": "sft_offline",
            "hyperparameters": hp_block,
            "metadata": {"effective_config": effective},
        },
        train_file=dataset_path,
        validation_file=validation_file,
    )
|
|
158
|
+
|
|
159
|
+
|
|
160
|
+
# Public names exported by a star-import of this module.
__all__ = ["RLBuildResult", "SFTBuildResult", "build_rl_payload", "build_sft_payload"]
|
|
@@ -0,0 +1,429 @@
|
|
|
1
|
+
from __future__ import annotations
|
|
2
|
+
|
|
3
|
+
import os
|
|
4
|
+
from pathlib import Path
|
|
5
|
+
from typing import Any, Dict
|
|
6
|
+
|
|
7
|
+
import click
|
|
8
|
+
|
|
9
|
+
from .builders import RLBuildResult, SFTBuildResult, build_rl_payload, build_sft_payload
|
|
10
|
+
from .config_finder import discover_configs, prompt_for_config
|
|
11
|
+
from .env_resolver import KeySpec, resolve_env
|
|
12
|
+
from .pollers import RLJobPoller, SFTJobPoller
|
|
13
|
+
from .task_app import check_task_app_health
|
|
14
|
+
from .utils import (
|
|
15
|
+
TrainError,
|
|
16
|
+
REPO_ROOT,
|
|
17
|
+
ensure_api_base,
|
|
18
|
+
http_post,
|
|
19
|
+
http_get,
|
|
20
|
+
limit_jsonl_examples,
|
|
21
|
+
mask_value,
|
|
22
|
+
post_multipart,
|
|
23
|
+
preview_json,
|
|
24
|
+
sleep,
|
|
25
|
+
validate_sft_jsonl,
|
|
26
|
+
)
|
|
27
|
+
|
|
28
|
+
|
|
29
|
+
def _discover_dataset_candidates(config_path: Path, limit: int = 50) -> list[Path]:
|
|
30
|
+
search_dirs: list[Path] = [
|
|
31
|
+
config_path.parent,
|
|
32
|
+
config_path.parent / "datasets",
|
|
33
|
+
REPO_ROOT / "traces",
|
|
34
|
+
REPO_ROOT / "datasets",
|
|
35
|
+
]
|
|
36
|
+
|
|
37
|
+
candidates: list[Path] = []
|
|
38
|
+
seen: set[Path] = set()
|
|
39
|
+
for directory in search_dirs:
|
|
40
|
+
if not directory.exists() or not directory.is_dir():
|
|
41
|
+
continue
|
|
42
|
+
for path in directory.rglob("*.jsonl"):
|
|
43
|
+
try:
|
|
44
|
+
resolved = path.resolve()
|
|
45
|
+
except OSError:
|
|
46
|
+
continue
|
|
47
|
+
if resolved in seen:
|
|
48
|
+
continue
|
|
49
|
+
seen.add(resolved)
|
|
50
|
+
if resolved.stat().st_size == 0:
|
|
51
|
+
continue
|
|
52
|
+
candidates.append(resolved)
|
|
53
|
+
if len(candidates) >= limit:
|
|
54
|
+
return candidates
|
|
55
|
+
return candidates
|
|
56
|
+
|
|
57
|
+
|
|
58
|
+
def prompt_for_dataset(config_path: Path) -> Path:
    """Ask the user to pick a dataset JSONL file and return its resolved path.

    Discovered candidates are offered as a numbered menu, with a manual
    entry option and an abort option; with no candidates the user is asked
    for a path directly. The question repeats until an existing ``.jsonl``
    path is supplied.

    Raises:
        click.ClickException: If the user selects the abort option.
    """
    options = _discover_dataset_candidates(config_path)

    def _ask_once() -> Path | None:
        # One round of interaction; None means the answer was rejected and
        # the menu has to be shown again.
        if not options:
            return _prompt_manual_dataset()

        click.echo("Select dataset JSONL file:")
        for number, option in enumerate(options, start=1):
            click.echo(f" {number}) {option}")
        click.echo(" m) Enter path manually")
        click.echo(" 0) Abort")

        answer = click.prompt("Choice", default="m").strip().lower()
        if answer == "0":
            raise click.ClickException("Aborted by user")
        if answer in {"m", "manual"}:
            return _prompt_manual_dataset()

        try:
            picked = int(answer)
        except ValueError:
            click.echo("Invalid selection; try again")
            return None
        if not 1 <= picked <= len(options):
            click.echo("Invalid selection; try again")
            return None
        return options[picked - 1]

    while True:
        selected = _ask_once()
        if selected is None:
            continue
        if selected.exists() and selected.suffix == ".jsonl":
            return selected.resolve()
        click.echo("File not found or not a .jsonl; please try again.")
|
|
88
|
+
|
|
89
|
+
|
|
90
|
+
def _prompt_manual_dataset() -> Path:
    """Prompt for a dataset path and return it with ``~`` expanded.

    The returned path is not checked for existence.
    """
    typed: str = click.prompt("Enter dataset JSONL path", type=str)
    return Path(typed.strip()).expanduser()
|
|
93
|
+
|
|
94
|
+
|
|
95
|
+
@click.command("train")
@click.option(
    "--config",
    "config_paths",
    multiple=True,
    type=click.Path(),
    help="Path to training TOML (repeatable)",
)
@click.option(
    "--type",
    "train_type",
    type=click.Choice(["auto", "rl", "sft"]),
    default="auto",
)
@click.option(
    "--env-file",
    "env_files",
    multiple=True,
    type=click.Path(),
    help=".env file(s) to preload (skips selection prompt)",
)
@click.option("--task-url", default=None, help="Override task app base URL (RL only)")
@click.option(
    "--dataset",
    "dataset_path",
    type=click.Path(),
    default=None,
    help="Override dataset JSONL path (SFT)",
)
@click.option(
    "--backend",
    default=lambda: os.getenv("BACKEND_BASE_URL", "http://localhost:8000/api"),
    help="Backend base URL",
)
@click.option("--model", default=None, help="Override model identifier")
@click.option("--idempotency", default=None, help="Idempotency-Key header for job creation")
@click.option("--dry-run", is_flag=True, help="Preview payload without submitting")
@click.option("--poll/--no-poll", default=True, help="Poll job status until terminal state")
@click.option(
    "--poll-timeout",
    default=3600.0,
    type=float,
    help="Maximum seconds to poll before timing out",
)
@click.option(
    "--poll-interval",
    default=5.0,
    type=float,
    help="Seconds between poll attempts",
)
@click.option(
    "--examples",
    "examples_limit",
    type=int,
    default=None,
    help="Limit SFT training to the first N examples",
)
def train_command(
    config_paths: tuple[str, ...],
    train_type: str,
    env_files: tuple[str, ...],
    task_url: str | None,
    dataset_path: str | None,
    backend: str,
    model: str | None,
    idempotency: str | None,
    dry_run: bool,
    poll: bool,
    poll_timeout: float,
    poll_interval: float,
    examples_limit: int | None,
) -> None:
    """Interactive launcher for RL / SFT jobs."""
    # Flow: choose a config, settle on the job type, resolve the required
    # environment values, then hand over to the RL or SFT handler.

    # "auto" means no type filter is applied while discovering configs.
    requested_type = None if train_type == "auto" else train_type
    candidates = discover_configs(list(config_paths), requested_type=requested_type)
    selection = prompt_for_config(candidates, requested_type=requested_type)

    effective_type = selection.train_type if requested_type is None else train_type
    if effective_type not in {"rl", "sft"}:
        effective_type = click.prompt(
            "Detected config type is ambiguous. Enter type",
            type=click.Choice(["rl", "sft"]),
        )
    is_rl = effective_type == "rl"

    cfg_path = selection.path
    click.echo(f"Using config: {cfg_path} ({effective_type})")

    # Both job types need the backend key; RL additionally needs the task
    # app's key and URL (the URL is optional when --task-url was passed).
    required_keys: list[KeySpec] = [KeySpec("SYNTH_API_KEY", "Synth API key for backend")]
    if is_rl:
        required_keys.append(
            KeySpec(
                "ENVIRONMENT_API_KEY",
                "Environment API key for task app",
                allow_modal_secret=True,
                modal_secret_pattern="env",
            )
        )
        required_keys.append(
            KeySpec(
                "TASK_APP_URL",
                "Task app base URL",
                secret=False,
                allow_modal_app=True,
                optional=bool(task_url),
            )
        )

    env_path, env_values = resolve_env(
        config_path=cfg_path,
        explicit_env_paths=env_files,
        required_keys=required_keys,
    )
    click.echo(f"Using env file: {env_path}")

    # Values from the resolved env file win over the process environment.
    synth_key = env_values.get("SYNTH_API_KEY") or os.environ.get("SYNTH_API_KEY")
    if not synth_key:
        raise click.ClickException("SYNTH_API_KEY required")

    backend_base = ensure_api_base(backend)
    click.echo(f"Backend base: {backend_base} (key {mask_value(synth_key)})")

    if is_rl:
        handle_rl(
            cfg_path=cfg_path,
            backend_base=backend_base,
            synth_key=synth_key,
            task_url_override=task_url,
            model_override=model,
            idempotency=idempotency,
            dry_run=dry_run,
            poll=poll,
            poll_timeout=poll_timeout,
            poll_interval=poll_interval,
        )
        return

    dataset_override_path = None
    if dataset_path:
        dataset_override_path = Path(dataset_path).expanduser().resolve()
    handle_sft(
        cfg_path=cfg_path,
        backend_base=backend_base,
        synth_key=synth_key,
        dataset_override=dataset_override_path,
        dry_run=dry_run,
        poll=poll,
        poll_timeout=poll_timeout,
        poll_interval=poll_interval,
        examples_limit=examples_limit,
    )
|
|
199
|
+
|
|
200
|
+
|
|
201
|
+
def _wait_for_training_file(backend_base: str, api_key: str, file_id: str, *, timeout: float = 120.0) -> None:
    """Block until the backend reports an uploaded training file as usable.

    Polls ``GET {backend_base}/learning/files/{file_id}`` with a bearer token,
    pausing about two seconds between attempts. A 200 response whose
    ``status`` / ``state`` / ``storage_state`` field (first non-empty one,
    defaulting to ``"ready"`` when none is present) is one of ``ready``,
    ``uploaded``, ``stored`` or ``complete`` ends the wait. A 404 is treated
    as "not visible yet" and polled again; any other status code is reported
    as a warning and polled again.

    Args:
        backend_base: Backend API base URL the file endpoint is appended to.
        api_key: Key sent as ``Authorization: Bearer <key>``.
        file_id: Identifier of the uploaded file to check.
        timeout: Maximum wall-clock seconds to keep polling.

    Raises:
        click.ClickException: If the file is not ready before ``timeout``
            seconds have passed.
    """
    # Local import so this block does not depend on the module's import list.
    from time import monotonic

    url = f"{backend_base}/learning/files/{file_id}"
    headers = {"Authorization": f"Bearer {api_key}"}
    interval = 2.0
    ready_states = {"ready", "uploaded", "stored", "complete"}
    # Use a wall-clock deadline: each request may itself take up to 30s, and
    # that time has to count against the caller's budget, not only the sleeps.
    deadline = monotonic() + timeout

    while True:
        resp = http_get(url, headers=headers, timeout=30.0)
        if resp.status_code == 200:
            try:
                data = resp.json()
            except Exception:
                # Unparseable body: fall through to the "ready" default below.
                data = {}
            if not isinstance(data, dict):
                # Valid JSON that is not an object (list, null, ...) has no
                # status fields to read; treat it like an empty object.
                data = {}
            status = str(data.get("status") or data.get("state") or data.get("storage_state") or "ready").lower()
            if status in ready_states:
                return
        elif resp.status_code != 404:
            # 404 means the object may simply not be visible yet; anything
            # else is unexpected but still worth another attempt.
            click.echo(f"[WARN] Unexpected response while checking training file {file_id}: {resp.status_code}")

        remaining = deadline - monotonic()
        if remaining <= 0:
            raise click.ClickException(f"Training file {file_id} not ready after {timeout:.0f}s")
        # Never sleep past the deadline.
        sleep(min(interval, remaining))
|
|
226
|
+
|
|
227
|
+
|
|
228
|
+
def handle_rl(
    *,
    cfg_path: Path,
    backend_base: str,
    synth_key: str,
    task_url_override: str | None,
    model_override: str | None,
    idempotency: str | None,
    dry_run: bool,
    poll: bool,
    poll_timeout: float,
    poll_interval: float,
) -> None:
    """Verify the task app, then create (and optionally poll) an RL job.

    Steps, in order:

    1. Build the job payload from ``cfg_path`` via ``build_rl_payload``.
    2. Ask the backend (``POST {backend_base}/rl/verify_task_app``) to verify
       the task app URL; abort unless the report has a truthy ``any_ok``.
    3. Run a direct health check against the task app using
       ``ENVIRONMENT_API_KEY`` from the process environment.
    4. Print the payload preview and, unless ``dry_run`` is set, submit it to
       ``POST {backend_base}/rl/jobs``.
    5. Unless ``poll`` is false, poll the job with ``RLJobPoller`` and print
       the final status and payload.

    Args:
        cfg_path: Path to the RL config file.
        backend_base: Backend API base URL.
        synth_key: API key sent as a bearer token to the backend.
        task_url_override: Task app URL; falls back to the ``TASK_APP_URL``
            environment variable when empty.
        model_override: Model override forwarded to the payload builder.
        idempotency: Optional idempotency key forwarded to the builder.
        dry_run: When true, stop after printing the payload preview.
        poll: When false, return right after the job is created.
        poll_timeout: Timeout handed to ``RLJobPoller``.
        poll_interval: Interval handed to ``RLJobPoller``.

    Raises:
        click.ClickException: On verification failure, missing
            ``ENVIRONMENT_API_KEY``, failing health check, failed job
            creation, or a creation response without a job id.
    """
    overrides: Dict[str, Any] = {"backend": backend_base, "task_url": task_url_override, "model": model_override}
    build = build_rl_payload(
        config_path=cfg_path,
        task_url=task_url_override or os.environ.get("TASK_APP_URL", ""),
        overrides=overrides,
        idempotency=idempotency,
    )

    # Backend-side verification: try ALL org environment keys against /health and /task_info
    verify_url = f"{backend_base}/rl/verify_task_app"
    verify_headers = {"Authorization": f"Bearer {synth_key}", "Content-Type": "application/json"}
    try:
        vresp = http_post(verify_url, headers=verify_headers, json_body={"endpoint_base_url": build.task_url})
        try:
            vjs = vresp.json()
        except Exception:
            # Non-JSON body: keep a short excerpt so the report stays useful.
            vjs = {"status": vresp.status_code, "text": (vresp.text or "")[:400]}
    except Exception as _ve:
        raise click.ClickException(f"Task app verification call failed: {type(_ve).__name__}: {_ve}") from _ve
    if not isinstance(vjs, dict):
        # Valid JSON that is not an object (list, null, ...): wrap it so the
        # `.get` lookups below cannot raise and the body still gets reported.
        vjs = {"status": vresp.status_code, "body": vjs}

    if vresp.status_code >= 400:
        click.echo("Task app verification error:\n" + preview_json(vjs, limit=800))
        raise click.ClickException(f"Verification failed with status {vresp.status_code}")
    if not bool(vjs.get("any_ok")):
        click.echo("Task app verification failed; no auth combination succeeded. Full report:")
        click.echo(preview_json(vjs, limit=1200))
        raise click.ClickException("Task app verification failed (auth)")

    # Print concise summary. This is purely cosmetic, so an oddly shaped
    # report must never abort a run whose verification already succeeded.
    try:
        cands = vjs.get("candidates_first15") or []
        attempts = vjs.get("attempts") or []
        statuses = [a.get("status") for a in attempts]
        click.echo(f"Verification OK (candidates={cands}, statuses={statuses})")
    except Exception:
        pass

    env_key = os.environ.get("ENVIRONMENT_API_KEY")
    if not env_key:
        raise click.ClickException("ENVIRONMENT_API_KEY required for RL flow")

    click.echo("Performing task app health check…")
    health = check_task_app_health(build.task_url, env_key)
    if not health.ok:
        click.echo(f"Task app health check failed: {health.detail}")
        raise click.ClickException("Aborting due to failing health check")
    click.echo("Task app healthy")

    create_url = f"{backend_base}/rl/jobs"
    headers = {"Authorization": f"Bearer {synth_key}", "Content-Type": "application/json"}
    if build.idempotency:
        headers["Idempotency-Key"] = build.idempotency

    click.echo(f"POST {create_url}")
    click.echo("Payload preview:\n" + preview_json(build.payload, limit=800))
    if dry_run:
        click.echo("Dry run enabled; skipping submission")
        return

    resp = http_post(create_url, headers=headers, json_body=build.payload)
    try:
        js = resp.json()
    except Exception:
        # `or ""` guards against a missing/None text attribute, matching the
        # verification path above.
        js = {"status": resp.status_code, "text": (resp.text or "")[:400]}
    click.echo(f"Response {resp.status_code}: {preview_json(js, limit=400)}")
    if resp.status_code not in (200, 201):
        raise click.ClickException("Job creation failed")
    # A non-object JSON body cannot carry a job id; report it as missing
    # instead of failing with AttributeError on `.get`.
    job_id = (js.get("job_id") or js.get("id")) if isinstance(js, dict) else None
    if not job_id:
        raise click.ClickException("Response missing job id")

    if not poll:
        click.echo(f"Created job {job_id} (polling disabled)")
        return

    poller = RLJobPoller(backend_base, synth_key, interval=poll_interval, timeout=poll_timeout)
    outcome = poller.poll_job(job_id)
    click.echo(f"Final status: {outcome.status}")
    click.echo(preview_json(outcome.payload, limit=600))
|
|
320
|
+
|
|
321
|
+
|
|
322
|
+
def _sft_json_object(resp: Any) -> Dict[str, Any]:
    """Return the response's JSON body when it is a JSON object, else ``{}``.

    Bodies without an ``application/json`` content type, bodies that fail to
    parse, and JSON values that are not objects all yield an empty dict so
    callers can use ``in`` / ``.get`` without further checks.
    """
    if not resp.headers.get("content-type", "").startswith("application/json"):
        return {}
    try:
        data = resp.json()
    except ValueError:
        # JSON decode errors from common HTTP clients derive from ValueError.
        return {}
    return data if isinstance(data, dict) else {}


def handle_sft(
    *,
    cfg_path: Path,
    backend_base: str,
    synth_key: str,
    dataset_override: Path | None,
    dry_run: bool,
    poll: bool,
    poll_timeout: float,
    poll_interval: float,
    examples_limit: int | None,
) -> None:
    """Validate and upload SFT datasets, then create, start and poll a job.

    Steps, in order:

    1. Build the payload with ``build_sft_payload``; on ``TrainError`` print
       the message and prompt for a dataset until the build succeeds.
    2. When ``examples_limit`` is given, train on a truncated copy produced
       by ``limit_jsonl_examples`` (removed again when this function exits).
    3. Validate the training file and, if it is a ``.jsonl`` file, the
       validation file.
    4. Upload the files to ``{backend_base}/learning/files`` (skipped on a
       dry run) and wait for the training file to become ready.
    5. Print the job payload and, unless ``dry_run`` is set, create the job
       at ``{backend_base}/learning/jobs`` and post to its ``/start`` route.
    6. Unless ``poll`` is false, poll with ``SFTJobPoller`` and print the
       final status and payload.

    Args:
        cfg_path: Path to the SFT config file.
        backend_base: Backend API base URL.
        synth_key: API key used for uploads and job requests.
        dataset_override: Optional dataset path overriding the config.
        dry_run: When true, perform no upload, readiness wait or submission.
        poll: When false, return right after the job is started.
        poll_timeout: Timeout handed to ``SFTJobPoller``.
        poll_interval: Interval handed to ``SFTJobPoller``.
        examples_limit: Optional cap on the number of training examples.

    Raises:
        click.ClickException: If the training upload fails, the uploaded file
            never becomes ready, job creation fails, or the creation response
            carries no job id.
    """
    dataset_path = dataset_override

    while True:
        try:
            build = build_sft_payload(config_path=cfg_path, dataset_override=dataset_path)
            break
        except TrainError as exc:
            click.echo(str(exc))
            dataset_path = prompt_for_dataset(cfg_path)

    limited_path: Path | None = None

    try:
        if examples_limit is not None:
            limited_path = limit_jsonl_examples(build.train_file, examples_limit)
            click.echo(
                f"Using first {examples_limit} examples from {build.train_file} -> {limited_path}"
            )
            build.train_file = limited_path

        click.echo("Validating training dataset…")
        validate_sft_jsonl(build.train_file)
        if build.validation_file and build.validation_file.suffix == ".jsonl":
            click.echo("Validating validation dataset…")
            validate_sft_jsonl(build.validation_file)

        upload_url = f"{backend_base}/learning/files"
        click.echo(f"Uploading dataset {build.train_file}")
        if dry_run:
            click.echo("Dry run: skipping upload")
            train_file_id = "dry-run-train"
            val_file_id = None
        else:
            resp = post_multipart(upload_url, api_key=synth_key, file_field="file", file_path=build.train_file)
            js = _sft_json_object(resp)
            if resp.status_code >= 400 or "id" not in js:
                raise click.ClickException(f"Training file upload failed ({resp.status_code}): {js or resp.text[:200]}")
            train_file_id = js["id"]
            val_file_id = None
            if build.validation_file:
                click.echo(f"Uploading validation dataset {build.validation_file}")
                vresp = post_multipart(upload_url, api_key=synth_key, file_field="file", file_path=build.validation_file)
                vjs = _sft_json_object(vresp)
                if vresp.status_code < 400 and "id" in vjs:
                    val_file_id = vjs["id"]
                else:
                    # A failed validation upload is not fatal; the job simply
                    # runs without a validation file.
                    click.echo(f"[WARN] Validation upload failed: {vresp.status_code} {vjs or vresp.text[:200]}")

        # Copy so the builder's payload is not mutated by the ids added here.
        payload = dict(build.payload)
        payload["training_file_id"] = train_file_id
        if val_file_id:
            payload.setdefault("metadata", {}).setdefault("effective_config", {}).setdefault("data", {})["validation_files"] = [val_file_id]

        # On a dry run nothing was uploaded and the file id is a placeholder,
        # so waiting would only poll the backend until the timeout and fail.
        if not dry_run:
            try:
                _wait_for_training_file(backend_base, synth_key, train_file_id)
            except click.ClickException as exc:
                raise click.ClickException(f"Training file {train_file_id} not ready: {exc}") from exc

        click.echo("FFT job payload:\n" + preview_json(payload, limit=800))
        if dry_run:
            click.echo("Dry run: skipping job submission")
            return

        create_url = f"{backend_base}/learning/jobs"
        headers = {"Authorization": f"Bearer {synth_key}", "Content-Type": "application/json"}
        resp = http_post(create_url, headers=headers, json_body=payload)
        js = _sft_json_object(resp)
        click.echo(f"Response {resp.status_code}: {preview_json(js, limit=400)}")
        if resp.status_code not in (200, 201):
            raise click.ClickException("Failed to create learning job")
        job_id = js.get("job_id") or js.get("id")
        if not job_id:
            raise click.ClickException("Response missing job id")

        start_url = f"{backend_base}/learning/jobs/{job_id}/start"
        click.echo(f"POST {start_url} (start)")
        start_resp = http_post(start_url, headers=headers, json_body={})
        if start_resp.status_code >= 400:
            # Stay best-effort (no abort), but do not hide a rejected start.
            click.echo(f"[WARN] Start request returned {start_resp.status_code}; job {job_id} may not have started")

        if not poll:
            click.echo(f"Started job {job_id} (polling disabled)")
            return

        poller = SFTJobPoller(backend_base, synth_key, interval=poll_interval, timeout=poll_timeout)
        outcome = poller.poll_job(job_id)
        click.echo(f"Final status: {outcome.status}")
        click.echo(preview_json(outcome.payload, limit=600))
    finally:
        if limited_path is not None:
            # Best-effort removal of the truncated copy and its directory;
            # filesystem errors here must not mask the real outcome.
            try:
                limited_path.unlink(missing_ok=True)
                limited_path.parent.rmdir()
            except OSError:
                pass
|
|
426
|
+
|
|
427
|
+
|
|
428
|
+
def register(cli: click.Group) -> None:
    """Register ``train_command`` on the supplied click group."""
    command = train_command
    cli.add_command(command)
|