synth-ai 0.2.9.dev5__py3-none-any.whl → 0.2.10__py3-none-any.whl

This diff shows the contents of publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between package versions as they appear in their respective public registries.

Potentially problematic release.


This version of synth-ai might be problematic. Click here for more details.

Files changed (349)
  1. examples/__init__.py +16 -0
  2. examples/crafter_debug_render.py +23 -17
  3. examples/dev/qwen3_32b_qlora_4xh100.toml +40 -0
  4. examples/multi_step/crafter_rl_lora.md +29 -0
  5. examples/qwen_coder/README.md +102 -0
  6. examples/qwen_coder/_shared.py +113 -0
  7. examples/qwen_coder/configs/coder_lora_30b.toml +61 -0
  8. examples/qwen_coder/configs/coder_lora_4b.toml +57 -0
  9. examples/qwen_coder/configs/coder_lora_small.toml +58 -0
  10. examples/qwen_coder/generate_dataset.py +98 -0
  11. examples/qwen_coder/infer_ft_smoke.py +65 -0
  12. examples/qwen_coder/infer_prod_proxy.py +73 -0
  13. examples/qwen_coder/infer_via_synth.py +87 -0
  14. examples/qwen_coder/scripts/infer_coder.sh +19 -0
  15. examples/qwen_coder/scripts/train_coder_30b.sh +22 -0
  16. examples/qwen_coder/sft_full_17b.py +103 -0
  17. examples/qwen_coder/sft_lora_30b.py +110 -0
  18. examples/qwen_coder/subset_jsonl.py +39 -0
  19. examples/qwen_coder/todos.md +38 -0
  20. examples/qwen_coder/validate_jsonl.py +60 -0
  21. examples/rl/configs/eval_base_qwen.toml +1 -1
  22. examples/rl/configs/rl_from_base_qwen17.toml +1 -1
  23. examples/rl/download_dataset.py +26 -10
  24. examples/rl/run_eval.py +53 -52
  25. examples/rl/run_rl_and_save.py +29 -12
  26. examples/rl/task_app/math_single_step.py +180 -41
  27. examples/rl/task_app/math_task_app.py +14 -6
  28. examples/sft/README.md +139 -0
  29. examples/sft/configs/crafter_fft_qwen0p6b.toml +44 -0
  30. examples/sft/configs/crafter_lora_qwen0p6b.toml +45 -0
  31. examples/sft/evaluate.py +117 -0
  32. examples/sft/export_dataset.py +117 -0
  33. examples/sft/generate_traces.py +162 -0
  34. examples/swe/__init__.py +12 -0
  35. examples/swe/task_app/README.md +105 -0
  36. examples/swe/task_app/__init__.py +2 -0
  37. examples/swe/task_app/grpo_swe_mini.py +571 -0
  38. examples/swe/task_app/grpo_swe_mini_task_app.py +136 -0
  39. examples/swe/task_app/hosted/README.md +173 -0
  40. examples/swe/task_app/hosted/__init__.py +5 -0
  41. examples/swe/task_app/hosted/branching.py +143 -0
  42. examples/swe/task_app/hosted/environment_routes.py +1289 -0
  43. examples/swe/task_app/hosted/envs/__init__.py +1 -0
  44. examples/swe/task_app/hosted/envs/crafter/__init__.py +6 -0
  45. examples/swe/task_app/hosted/envs/crafter/app.py +1 -0
  46. examples/swe/task_app/hosted/envs/crafter/environment.py +522 -0
  47. examples/swe/task_app/hosted/envs/crafter/policy.py +478 -0
  48. examples/swe/task_app/hosted/envs/crafter/react_agent.py +108 -0
  49. examples/swe/task_app/hosted/envs/crafter/shared.py +305 -0
  50. examples/swe/task_app/hosted/envs/crafter/tools.py +47 -0
  51. examples/swe/task_app/hosted/envs/mini_swe/__init__.py +8 -0
  52. examples/swe/task_app/hosted/envs/mini_swe/environment.py +1164 -0
  53. examples/swe/task_app/hosted/envs/mini_swe/policy.py +355 -0
  54. examples/swe/task_app/hosted/envs/mini_swe/shared.py +83 -0
  55. examples/swe/task_app/hosted/envs/mini_swe/tools.py +96 -0
  56. examples/swe/task_app/hosted/hosted_app.py +204 -0
  57. examples/swe/task_app/hosted/inference/__init__.py +5 -0
  58. examples/swe/task_app/hosted/inference/openai_client.py +618 -0
  59. examples/swe/task_app/hosted/main.py +100 -0
  60. examples/swe/task_app/hosted/policy_routes.py +1079 -0
  61. examples/swe/task_app/hosted/registry.py +195 -0
  62. examples/swe/task_app/hosted/rollout.py +1869 -0
  63. examples/swe/task_app/hosted/storage/__init__.py +5 -0
  64. examples/swe/task_app/hosted/storage/volume.py +211 -0
  65. examples/swe/task_app/hosted/test_agents.py +161 -0
  66. examples/swe/task_app/hosted/test_service.py +137 -0
  67. examples/swe/task_app/hosted/utils.py +62 -0
  68. examples/vlm/PROPOSAL.md +53 -0
  69. examples/vlm/README.md +68 -0
  70. examples/vlm/configs/crafter_vlm_gpt4o.toml +44 -0
  71. examples/vlm/crafter_image_only_agent.py +207 -0
  72. examples/vlm/crafter_openai_vlm_agent.py +277 -0
  73. examples/vlm/filter_image_rows.py +63 -0
  74. examples/vlm/run_crafter_vlm_benchmark.py +316 -0
  75. examples/warming_up_to_rl/analyze_trace_db.py +12 -10
  76. examples/warming_up_to_rl/configs/rl_from_base_qwen4b.toml +11 -1
  77. examples/warming_up_to_rl/export_trace_sft.py +218 -36
  78. examples/warming_up_to_rl/groq_test.py +15 -8
  79. examples/warming_up_to_rl/manage_secrets.py +29 -25
  80. examples/warming_up_to_rl/readme.md +9 -2
  81. examples/warming_up_to_rl/run_eval.py +137 -61
  82. examples/warming_up_to_rl/run_fft_and_save.py +131 -60
  83. examples/warming_up_to_rl/run_local_rollout.py +88 -39
  84. examples/warming_up_to_rl/run_local_rollout_modal.py +114 -28
  85. examples/warming_up_to_rl/run_local_rollout_parallel.py +81 -20
  86. examples/warming_up_to_rl/run_local_rollout_traced.py +126 -23
  87. examples/warming_up_to_rl/run_rl_and_save.py +35 -12
  88. examples/warming_up_to_rl/run_rollout_remote.py +44 -19
  89. examples/warming_up_to_rl/task_app/README.md +6 -2
  90. examples/warming_up_to_rl/task_app/grpo_crafter.py +319 -57
  91. examples/warming_up_to_rl/task_app/grpo_crafter_task_app.py +11 -30
  92. examples/warming_up_to_rl/task_app/synth_envs_hosted/__init__.py +1 -1
  93. examples/warming_up_to_rl/task_app/synth_envs_hosted/branching.py +9 -11
  94. examples/warming_up_to_rl/task_app/synth_envs_hosted/environment_routes.py +137 -182
  95. examples/warming_up_to_rl/task_app/synth_envs_hosted/envs/__init__.py +1 -1
  96. examples/warming_up_to_rl/task_app/synth_envs_hosted/envs/crafter/__init__.py +1 -1
  97. examples/warming_up_to_rl/task_app/synth_envs_hosted/envs/crafter/app.py +1 -1
  98. examples/warming_up_to_rl/task_app/synth_envs_hosted/envs/crafter/environment.py +150 -57
  99. examples/warming_up_to_rl/task_app/synth_envs_hosted/envs/crafter/policy.py +105 -69
  100. examples/warming_up_to_rl/task_app/synth_envs_hosted/envs/crafter/react_agent.py +19 -7
  101. examples/warming_up_to_rl/task_app/synth_envs_hosted/envs/crafter/shared.py +45 -42
  102. examples/warming_up_to_rl/task_app/synth_envs_hosted/envs/crafter/tools.py +1 -1
  103. examples/warming_up_to_rl/task_app/synth_envs_hosted/hosted_app.py +47 -45
  104. examples/warming_up_to_rl/task_app/synth_envs_hosted/inference/__init__.py +1 -1
  105. examples/warming_up_to_rl/task_app/synth_envs_hosted/inference/openai_client.py +198 -92
  106. examples/warming_up_to_rl/task_app/synth_envs_hosted/main.py +0 -2
  107. examples/warming_up_to_rl/task_app/synth_envs_hosted/policy_routes.py +361 -263
  108. examples/warming_up_to_rl/task_app/synth_envs_hosted/registry.py +21 -23
  109. examples/warming_up_to_rl/task_app/synth_envs_hosted/rollout.py +394 -274
  110. examples/warming_up_to_rl/task_app/synth_envs_hosted/storage/__init__.py +1 -1
  111. examples/warming_up_to_rl/task_app/synth_envs_hosted/storage/volume.py +56 -62
  112. examples/warming_up_to_rl/task_app/synth_envs_hosted/test_agents.py +1 -0
  113. examples/warming_up_to_rl/task_app/synth_envs_hosted/test_service.py +6 -15
  114. examples/warming_up_to_rl/task_app/synth_envs_hosted/utils.py +4 -3
  115. synth_ai/__init__.py +1 -0
  116. synth_ai/api/models/supported.py +376 -0
  117. synth_ai/api/train/builders.py +157 -26
  118. synth_ai/api/train/cli.py +213 -57
  119. synth_ai/api/train/config_finder.py +65 -5
  120. synth_ai/api/train/env_resolver.py +33 -15
  121. synth_ai/api/train/pollers.py +13 -4
  122. synth_ai/api/train/supported_algos.py +139 -0
  123. synth_ai/api/train/task_app.py +5 -3
  124. synth_ai/api/train/utils.py +33 -48
  125. synth_ai/cli/__init__.py +19 -4
  126. synth_ai/cli/_modal_wrapper.py +28 -0
  127. synth_ai/cli/_typer_patch.py +49 -0
  128. synth_ai/cli/balance.py +2 -3
  129. synth_ai/cli/calc.py +1 -1
  130. synth_ai/cli/demo.py +21 -6
  131. synth_ai/cli/recent.py +2 -2
  132. synth_ai/cli/rl_demo.py +77 -17
  133. synth_ai/cli/root.py +116 -39
  134. synth_ai/cli/status.py +2 -2
  135. synth_ai/cli/task_apps.py +1699 -259
  136. synth_ai/cli/traces.py +7 -4
  137. synth_ai/cli/turso.py +73 -0
  138. synth_ai/cli/watch.py +12 -18
  139. synth_ai/core/experiment.py +0 -2
  140. synth_ai/demo_registry.py +68 -31
  141. synth_ai/demos/core/cli.py +516 -194
  142. synth_ai/demos/demo_task_apps/__init__.py +3 -3
  143. synth_ai/demos/demo_task_apps/core.py +64 -28
  144. synth_ai/demos/demo_task_apps/crafter/configs/crafter_fft_4b.toml +2 -3
  145. synth_ai/demos/demo_task_apps/crafter/grpo_crafter_task_app.py +37 -30
  146. synth_ai/demos/demo_task_apps/math/_common.py +1 -2
  147. synth_ai/demos/demo_task_apps/math/app.py +2 -1
  148. synth_ai/demos/demo_task_apps/math/deploy_modal.py +3 -6
  149. synth_ai/demos/demo_task_apps/math/modal_task_app.py +183 -82
  150. synth_ai/demos/demo_task_apps/math/task_app_entry.py +0 -2
  151. synth_ai/environments/examples/bandit/engine.py +12 -4
  152. synth_ai/environments/examples/bandit/taskset.py +4 -4
  153. synth_ai/environments/examples/crafter_classic/environment.py +76 -1
  154. synth_ai/environments/reproducibility/tree.py +5 -6
  155. synth_ai/environments/service/app.py +11 -12
  156. synth_ai/environments/service/core_routes.py +10 -9
  157. synth_ai/environments/stateful/engine.py +1 -1
  158. synth_ai/environments/tasks/core.py +1 -0
  159. synth_ai/environments/tasks/filters.py +5 -6
  160. synth_ai/environments/tasks/utils.py +4 -5
  161. synth_ai/evals/base.py +0 -2
  162. synth_ai/handshake.py +11 -9
  163. synth_ai/http.py +1 -1
  164. synth_ai/http_client.py +43 -11
  165. synth_ai/inference/__init__.py +0 -2
  166. synth_ai/inference/client.py +20 -6
  167. synth_ai/jobs/client.py +103 -78
  168. synth_ai/learning/__init__.py +41 -6
  169. synth_ai/learning/algorithms.py +14 -0
  170. synth_ai/learning/client.py +121 -29
  171. synth_ai/learning/config.py +2 -40
  172. synth_ai/learning/constants.py +0 -2
  173. synth_ai/learning/ft_client.py +4 -56
  174. synth_ai/learning/health.py +13 -7
  175. synth_ai/learning/jobs.py +43 -47
  176. synth_ai/{rl → learning/rl}/__init__.py +14 -5
  177. synth_ai/learning/rl/client.py +267 -0
  178. synth_ai/learning/rl/config.py +31 -0
  179. synth_ai/{rl → learning/rl}/contracts.py +5 -10
  180. synth_ai/{rl → learning/rl}/env_keys.py +45 -16
  181. synth_ai/learning/rl/secrets.py +13 -0
  182. synth_ai/learning/rl_client.py +2 -253
  183. synth_ai/learning/sft/__init__.py +29 -0
  184. synth_ai/learning/sft/client.py +68 -0
  185. synth_ai/learning/sft/config.py +270 -0
  186. synth_ai/learning/sft/data.py +295 -0
  187. synth_ai/learning/sse.py +25 -26
  188. synth_ai/learning/validators.py +25 -24
  189. synth_ai/lm/__init__.py +21 -47
  190. synth_ai/task/__init__.py +26 -27
  191. synth_ai/task/apps/__init__.py +18 -19
  192. synth_ai/task/auth.py +35 -23
  193. synth_ai/task/client.py +15 -13
  194. synth_ai/task/contracts.py +37 -35
  195. synth_ai/task/datasets.py +9 -6
  196. synth_ai/task/errors.py +11 -10
  197. synth_ai/task/health.py +17 -11
  198. synth_ai/task/json.py +58 -24
  199. synth_ai/task/proxy.py +15 -14
  200. synth_ai/task/rubrics.py +22 -15
  201. synth_ai/task/server.py +43 -17
  202. synth_ai/task/tracing_utils.py +12 -7
  203. synth_ai/task/validators.py +0 -1
  204. synth_ai/task/vendors.py +5 -7
  205. synth_ai/tracing_v3/__init__.py +2 -0
  206. synth_ai/tracing_v3/abstractions.py +21 -4
  207. synth_ai/tracing_v3/db_config.py +26 -1
  208. synth_ai/tracing_v3/decorators.py +18 -15
  209. synth_ai/tracing_v3/examples/basic_usage.py +3 -2
  210. synth_ai/tracing_v3/hooks.py +6 -4
  211. synth_ai/tracing_v3/llm_call_record_helpers.py +6 -6
  212. synth_ai/tracing_v3/replica_sync.py +1 -0
  213. synth_ai/tracing_v3/session_tracer.py +63 -16
  214. synth_ai/tracing_v3/storage/base.py +89 -1
  215. synth_ai/tracing_v3/storage/config.py +21 -8
  216. synth_ai/tracing_v3/storage/factory.py +10 -8
  217. synth_ai/tracing_v3/storage/utils.py +4 -2
  218. synth_ai/tracing_v3/turso/daemon.py +7 -2
  219. synth_ai/tracing_v3/turso/models.py +5 -2
  220. synth_ai/tracing_v3/turso/native_manager.py +1173 -0
  221. synth_ai/tracing_v3/utils.py +4 -3
  222. synth_ai/v0/api/__init__.py +8 -0
  223. synth_ai/v0/api/models/__init__.py +8 -0
  224. synth_ai/v0/api/models/supported.py +8 -0
  225. synth_ai/v0/config/__init__.py +15 -0
  226. synth_ai/v0/config/base_url.py +12 -0
  227. synth_ai/v0/lm/__init__.py +51 -0
  228. synth_ai/{lm → v0/lm}/caching/ephemeral.py +3 -5
  229. synth_ai/{lm → v0/lm}/caching/handler.py +4 -4
  230. synth_ai/{lm → v0/lm}/caching/initialize.py +1 -1
  231. synth_ai/{lm → v0/lm}/caching/persistent.py +1 -1
  232. synth_ai/{lm → v0/lm}/config.py +6 -1
  233. synth_ai/{lm → v0/lm}/core/all.py +9 -9
  234. synth_ai/{lm → v0/lm}/core/exceptions.py +0 -2
  235. synth_ai/{lm → v0/lm}/core/main.py +19 -7
  236. synth_ai/{lm → v0/lm}/core/main_v3.py +10 -10
  237. synth_ai/{lm → v0/lm}/core/synth_models.py +2 -15
  238. synth_ai/{lm → v0/lm}/core/vendor_clients.py +6 -4
  239. synth_ai/{lm → v0/lm}/overrides.py +4 -4
  240. synth_ai/{lm → v0/lm}/provider_support/anthropic.py +4 -4
  241. synth_ai/{lm → v0/lm}/provider_support/openai.py +5 -5
  242. synth_ai/{lm → v0/lm}/structured_outputs/handler.py +5 -5
  243. synth_ai/{lm → v0/lm}/structured_outputs/rehabilitate.py +1 -1
  244. synth_ai/{lm → v0/lm}/vendors/core/anthropic_api.py +16 -16
  245. synth_ai/{lm → v0/lm}/vendors/core/gemini_api.py +5 -5
  246. synth_ai/{lm → v0/lm}/vendors/core/mistral_api.py +5 -5
  247. synth_ai/{lm → v0/lm}/vendors/core/openai_api.py +12 -10
  248. synth_ai/{lm → v0/lm}/vendors/openai_standard.py +11 -9
  249. synth_ai/{lm → v0/lm}/vendors/openai_standard_responses.py +8 -5
  250. synth_ai/{lm → v0/lm}/vendors/supported/custom_endpoint.py +4 -6
  251. synth_ai/{lm → v0/lm}/vendors/supported/deepseek.py +2 -2
  252. synth_ai/{lm → v0/lm}/vendors/supported/grok.py +2 -2
  253. synth_ai/{lm → v0/lm}/vendors/supported/groq.py +1 -1
  254. synth_ai/{lm → v0/lm}/vendors/supported/ollama.py +1 -1
  255. synth_ai/{lm → v0/lm}/vendors/supported/openrouter.py +3 -3
  256. synth_ai/{lm → v0/lm}/vendors/supported/together.py +1 -1
  257. synth_ai/{lm → v0/lm}/vendors/synth_client.py +38 -11
  258. synth_ai/v0/tracing/upload.py +32 -135
  259. synth_ai/v0/tracing_v3/__init__.py +10 -0
  260. synth_ai/v0/tracing_v3/abstractions.py +3 -0
  261. synth_ai/v0/tracing_v3/decorators.py +3 -0
  262. synth_ai/v0/tracing_v3/llm_call_record_helpers.py +3 -0
  263. synth_ai/v0/tracing_v3/session_tracer.py +3 -0
  264. {synth_ai-0.2.9.dev5.dist-info → synth_ai-0.2.10.dist-info}/METADATA +10 -7
  265. {synth_ai-0.2.9.dev5.dist-info → synth_ai-0.2.10.dist-info}/RECORD +294 -258
  266. examples/common_old/backend.py +0 -21
  267. examples/evals_old/README.md +0 -98
  268. examples/evals_old/__init__.py +0 -6
  269. examples/evals_old/compare_models.py +0 -1037
  270. examples/evals_old/example_log.md +0 -145
  271. examples/evals_old/run_demo.sh +0 -126
  272. examples/evals_old/trace_analysis.py +0 -270
  273. examples/finetuning_old/_backup_synth_qwen/config.toml +0 -29
  274. examples/finetuning_old/_backup_synth_qwen/example_log.md +0 -324
  275. examples/finetuning_old/_backup_synth_qwen/filter_traces.py +0 -60
  276. examples/finetuning_old/_backup_synth_qwen/filter_traces_achievements.py +0 -239
  277. examples/finetuning_old/_backup_synth_qwen/purge_v3_traces.py +0 -109
  278. examples/finetuning_old/_backup_synth_qwen/react_agent_lm.py +0 -1924
  279. examples/finetuning_old/_backup_synth_qwen/readme.md +0 -49
  280. examples/finetuning_old/_backup_synth_qwen/run_crafter_qwen4b.py +0 -114
  281. examples/finetuning_old/_backup_synth_qwen/run_demo.sh +0 -195
  282. examples/finetuning_old/_backup_synth_qwen/sft_kickoff.py +0 -118
  283. examples/finetuning_old/synth_qwen_v1/README.md +0 -68
  284. examples/finetuning_old/synth_qwen_v1/filter_traces.py +0 -60
  285. examples/finetuning_old/synth_qwen_v1/filter_traces_achievements.py +0 -239
  286. examples/finetuning_old/synth_qwen_v1/finetune.py +0 -46
  287. examples/finetuning_old/synth_qwen_v1/hello_ft_model.py +0 -71
  288. examples/finetuning_old/synth_qwen_v1/infer.py +0 -37
  289. examples/finetuning_old/synth_qwen_v1/poll.py +0 -44
  290. examples/finetuning_old/synth_qwen_v1/prepare_data.py +0 -35
  291. examples/finetuning_old/synth_qwen_v1/purge_v3_traces.py +0 -109
  292. examples/finetuning_old/synth_qwen_v1/react_agent_lm.py +0 -1932
  293. examples/finetuning_old/synth_qwen_v1/run_crafter_sft_job.py +0 -207
  294. examples/finetuning_old/synth_qwen_v1/run_ft_job.py +0 -232
  295. examples/finetuning_old/synth_qwen_v1/upload_data.py +0 -34
  296. examples/finetuning_old/synth_qwen_v1/util.py +0 -147
  297. examples/rl_old/task_app.py +0 -962
  298. synth_ai/experimental/synth_oss.py +0 -446
  299. synth_ai/install_sqld.sh +0 -40
  300. synth_ai/learning/filtering.py +0 -0
  301. synth_ai/learning/offline/dpo.py +0 -0
  302. synth_ai/learning/offline/providers.py +0 -7
  303. synth_ai/learning/offline/sft.py +0 -0
  304. synth_ai/learning/offline/shared.py +0 -0
  305. synth_ai/learning/online/grpo.py +0 -0
  306. synth_ai/learning/online/irft.py +0 -0
  307. synth_ai/learning/prompts/banking77_injection_eval.py +0 -168
  308. synth_ai/learning/prompts/gepa.py +0 -0
  309. synth_ai/learning/prompts/hello_world_in_context_injection_ex.py +0 -213
  310. synth_ai/learning/prompts/mipro.py +0 -289
  311. synth_ai/learning/prompts/random_search.py +0 -246
  312. synth_ai/learning/prompts/run_mipro_banking77.py +0 -172
  313. synth_ai/learning/prompts/run_random_search_banking77.py +0 -324
  314. synth_ai/rl/secrets.py +0 -19
  315. synth_ai/scripts/verify_rewards.py +0 -100
  316. synth_ai/tracing/__init__.py +0 -30
  317. synth_ai/tracing_v1/__init__.py +0 -33
  318. synth_ai/tracing_v3/turso/__init__.py +0 -25
  319. synth_ai/tracing_v3/turso/manager.py +0 -774
  320. synth_ai/zyk/__init__.py +0 -30
  321. /synth_ai/{lm → v0/lm}/caching/__init__.py +0 -0
  322. /synth_ai/{lm → v0/lm}/caching/constants.py +0 -0
  323. /synth_ai/{lm → v0/lm}/caching/dbs.py +0 -0
  324. /synth_ai/{lm → v0/lm}/constants.py +0 -0
  325. /synth_ai/{lm → v0/lm}/core/__init__.py +0 -0
  326. /synth_ai/{lm → v0/lm}/cost/__init__.py +0 -0
  327. /synth_ai/{lm → v0/lm}/cost/monitor.py +0 -0
  328. /synth_ai/{lm → v0/lm}/cost/statefulness.py +0 -0
  329. /synth_ai/{lm → v0/lm}/injection.py +0 -0
  330. /synth_ai/{lm → v0/lm}/provider_support/__init__.py +0 -0
  331. /synth_ai/{lm → v0/lm}/provider_support/suppress_logging.py +0 -0
  332. /synth_ai/{lm → v0/lm}/structured_outputs/__init__.py +0 -0
  333. /synth_ai/{lm → v0/lm}/structured_outputs/inject.py +0 -0
  334. /synth_ai/{lm → v0/lm}/tools/__init__.py +0 -0
  335. /synth_ai/{lm → v0/lm}/tools/base.py +0 -0
  336. /synth_ai/{lm → v0/lm}/unified_interface.py +0 -0
  337. /synth_ai/{lm → v0/lm}/vendors/__init__.py +0 -0
  338. /synth_ai/{lm → v0/lm}/vendors/base.py +0 -0
  339. /synth_ai/{lm → v0/lm}/vendors/core/__init__.py +0 -0
  340. /synth_ai/{lm → v0/lm}/vendors/core/synth_dev_api.py +0 -0
  341. /synth_ai/{lm → v0/lm}/vendors/local/__init__.py +0 -0
  342. /synth_ai/{lm → v0/lm}/vendors/local/ollama.py +0 -0
  343. /synth_ai/{lm → v0/lm}/vendors/retries.py +0 -0
  344. /synth_ai/{lm → v0/lm}/vendors/supported/__init__.py +0 -0
  345. /synth_ai/{lm → v0/lm}/warmup.py +0 -0
  346. {synth_ai-0.2.9.dev5.dist-info → synth_ai-0.2.10.dist-info}/WHEEL +0 -0
  347. {synth_ai-0.2.9.dev5.dist-info → synth_ai-0.2.10.dist-info}/entry_points.txt +0 -0
  348. {synth_ai-0.2.9.dev5.dist-info → synth_ai-0.2.10.dist-info}/licenses/LICENSE +0 -0
  349. {synth_ai-0.2.9.dev5.dist-info → synth_ai-0.2.10.dist-info}/top_level.txt +0 -0
@@ -1,12 +1,12 @@
1
- from __future__ import annotations
2
-
3
1
  """Helpers for uploading RL environment credentials to the backend."""
4
2
 
3
+ from __future__ import annotations
4
+
5
5
  import base64
6
6
  import binascii
7
7
  import json
8
- from typing import Any, Dict
9
8
  import os
9
+ from typing import Any
10
10
 
11
11
  import requests
12
12
  from nacl.public import PublicKey, SealedBox
@@ -18,14 +18,12 @@ _ALGORITHM = "libsodium.sealedbox.v1"
18
18
 
19
19
 
20
20
  def encrypt_for_backend(pubkey_b64: str, secret: str | bytes) -> str:
21
- """Encrypt ``secret`` for storage by the backend using libsodium sealed boxes."""
22
-
23
21
  if not isinstance(pubkey_b64, str) or not pubkey_b64.strip():
24
22
  raise ValueError("public key must be a non-empty base64 string")
25
23
 
26
24
  try:
27
25
  key_bytes = base64.b64decode(pubkey_b64, validate=True)
28
- except binascii.Error as exc: # pragma: no cover - defensive guard
26
+ except binascii.Error as exc:
29
27
  raise ValueError("public key must be base64-encoded") from exc
30
28
 
31
29
  if len(key_bytes) != 32:
@@ -35,7 +33,7 @@ def encrypt_for_backend(pubkey_b64: str, secret: str | bytes) -> str:
35
33
  secret_bytes = secret.encode("utf-8")
36
34
  elif isinstance(secret, bytes):
37
35
  secret_bytes = secret
38
- else: # pragma: no cover - type guard
36
+ else:
39
37
  raise TypeError("secret must be str or bytes")
40
38
 
41
39
  if not secret_bytes:
@@ -52,20 +50,17 @@ def setup_environment_api_key(
52
50
  token: str | None = None,
53
51
  *,
54
52
  timeout: float = 15.0,
55
- ) -> Dict[str, Any]:
56
- """Upload an ENVIRONMENT_API_KEY to the backend."""
57
-
53
+ ) -> dict[str, Any]:
58
54
  backend = backend_base.rstrip("/")
59
55
  if not backend:
60
56
  raise ValueError("backend_base must be provided")
61
57
  if not synth_api_key:
62
58
  raise ValueError("synth_api_key must be provided")
63
59
 
64
- # Require caller-provided plaintext. If not provided, read from ENVIRONMENT_API_KEY.
65
60
  plaintext = token if token is not None else os.getenv("ENVIRONMENT_API_KEY", "").strip()
66
61
  if not plaintext:
67
62
  raise ValueError("ENVIRONMENT_API_KEY must be set (or pass token=...) to upload")
68
- if not isinstance(plaintext, str): # pragma: no cover - defensive guard
63
+ if not isinstance(plaintext, str):
69
64
  raise TypeError("token must be a string")
70
65
 
71
66
  token_bytes = plaintext.encode("utf-8")
@@ -81,7 +76,7 @@ def setup_environment_api_key(
81
76
 
82
77
  try:
83
78
  doc = response.json()
84
- except ValueError as exc: # pragma: no cover - backend invariant
79
+ except ValueError as exc:
85
80
  raise RuntimeError("backend returned invalid JSON for public key") from exc
86
81
 
87
82
  if not isinstance(doc, dict):
@@ -91,17 +86,51 @@ def setup_environment_api_key(
91
86
  if not isinstance(pubkey, str) or not pubkey:
92
87
  raise RuntimeError("backend response missing public_key")
93
88
 
94
- # The backend currently returns a single algorithm identifier; keep a guard in
95
- # case future versions change the value and we need to surface that to callers.
96
89
  alg = doc.get("alg")
97
90
  if alg is not None and alg != _ALGORITHM:
98
91
  raise RuntimeError(f"unsupported sealed box algorithm: {alg}")
99
92
 
93
+ # Diagnostics: safe previews and hashes to correlate with backend logs
94
+ try:
95
+ import hashlib as _hash
96
+
97
+ pk_bytes = base64.b64decode(pubkey, validate=True)
98
+ pk_sha256 = _hash.sha256(pk_bytes).hexdigest()
99
+ print(
100
+ f"[env-keys] public_key: b64_len={len(pubkey)} sha256={pk_sha256} head={pubkey[:16]} tail={pubkey[-16:]}"
101
+ )
102
+ _plen = len(plaintext)
103
+ _ppref = (plaintext[:6] + "…") if _plen > 10 else plaintext
104
+ _psuf = ("…" + plaintext[-4:]) if _plen > 10 else ""
105
+ _has_ws = any(ch.isspace() for ch in plaintext)
106
+ print(
107
+ f"[env-keys] plaintext: len={_plen} preview={_ppref}{_psuf} has_ws={bool(_has_ws)}"
108
+ )
109
+ except Exception:
110
+ pass
111
+
100
112
  ciphertext_b64 = encrypt_for_backend(pubkey, token_bytes)
101
113
 
102
114
  body = {"name": "ENVIRONMENT_API_KEY", "ciphertext_b64": ciphertext_b64}
103
115
  post_url = f"{backend}/api/v1/env-keys"
104
- response2 = requests.post(post_url, headers={**headers, "Content-Type": "application/json"}, json=body, timeout=timeout)
116
+ # Ciphertext diagnostics
117
+ try:
118
+ import hashlib as _hash
119
+
120
+ _ct_bytes = base64.b64decode(ciphertext_b64, validate=True)
121
+ _ct_sha = _hash.sha256(_ct_bytes).hexdigest()
122
+ print(
123
+ f"[env-keys] ciphertext: b64_len={len(ciphertext_b64)} sha256={_ct_sha} head={ciphertext_b64[:16]} tail={ciphertext_b64[-16:]}"
124
+ )
125
+ except Exception:
126
+ pass
127
+
128
+ response2 = requests.post(
129
+ post_url,
130
+ headers={**headers, "Content-Type": "application/json"},
131
+ json=body,
132
+ timeout=timeout,
133
+ )
105
134
  _raise_with_detail(response2)
106
135
 
107
136
  try:
@@ -0,0 +1,13 @@
1
+ """Helpers for generating RL environment credentials."""
2
+
3
+ from __future__ import annotations
4
+
5
+ import secrets
6
+
7
+ __all__ = ["mint_environment_api_key"]
8
+
9
+
10
+ def mint_environment_api_key() -> str:
11
+ """Mint a random ENVIRONMENT_API_KEY value."""
12
+
13
+ return secrets.token_hex(32)
@@ -1,256 +1,5 @@
1
1
  from __future__ import annotations
2
2
 
3
- from typing import Any, Dict, List, Optional, Callable
4
- import os
5
- import time
6
-
7
- from ..http import AsyncHttpClient, HTTPError, sleep
8
-
9
-
10
- def _api_base(b: str) -> str:
11
- b = (b or "").rstrip("/")
12
- return b if b.endswith("/api") else f"{b}/api"
13
-
14
-
15
- class RlClient:
16
- """Lightweight RL client for provider-agnostic job control.
17
-
18
- Notes:
19
- - Uses learning/* for status/events/metrics and rl/* for creation/start.
20
- - Trainer endpoints are resolved server-side via trainer_id.
21
- """
22
-
23
- def __init__(self, base_url: str, api_key: str, *, timeout: float = 600.0) -> None:
24
- self._base_url = base_url.rstrip("/")
25
- self._api_key = api_key
26
- self._timeout = timeout
27
-
28
- async def resolve_trainer_start_url(self, trainer_id: str) -> str:
29
- """GET /api/rl/services/{id} → { training_start_url }"""
30
- path = f"/api/rl/services/{trainer_id}"
31
- async with AsyncHttpClient(self._base_url, self._api_key, timeout=30.0) as http:
32
- js = await http.get(path)
33
- if not isinstance(js, dict):
34
- raise HTTPError(status=500, url=path, message="invalid_service_response", body_snippet=str(js)[:200])
35
- start_url = js.get("training_start_url")
36
- if not isinstance(start_url, str) or not start_url:
37
- raise HTTPError(status=500, url=path, message="missing_training_start_url", body_snippet=str(js)[:200])
38
- return start_url
39
-
40
- async def create_job(
41
- self,
42
- *,
43
- model: str,
44
- task_app_url: str,
45
- trainer: Dict[str, Any],
46
- trainer_id: Optional[str] = None,
47
- job_config_id: Optional[str] = None,
48
- inline_config: Optional[Dict[str, Any]] = None,
49
- ) -> Dict[str, Any]:
50
- body = {
51
- "job_type": "rl",
52
- "data": {
53
- "model": model,
54
- "endpoint_base_url": task_app_url,
55
- **({"job_config_id": job_config_id} if job_config_id else {}),
56
- **({"config": inline_config} if inline_config else {}),
57
- "trainer": {
58
- "batch_size": int(trainer.get("batch_size", 1)),
59
- "group_size": max(2, int(trainer.get("group_size", 2))),
60
- },
61
- },
62
- }
63
- async with AsyncHttpClient(self._base_url, self._api_key, timeout=self._timeout) as http:
64
- js = await http.post_json(f"{_api_base(self._base_url)}/rl/jobs", json=body)
65
- if not isinstance(js, dict):
66
- raise HTTPError(status=500, url="/api/rl/jobs", message="invalid_create_response", body_snippet=str(js)[:200])
67
- return js
68
-
69
- async def start_job_if_supported(self, job_id: str) -> Optional[Dict[str, Any]]:
70
- path = f"{_api_base(self._base_url)}/rl/jobs/{job_id}/start"
71
- try:
72
- async with AsyncHttpClient(self._base_url, self._api_key, timeout=30.0) as http:
73
- return await http.post_json(path, json={})
74
- except HTTPError as he: # noqa: PERF203
75
- if he.status == 404:
76
- return None
77
- raise
78
-
79
- async def get_job(self, job_id: str) -> Dict[str, Any]:
80
- async with AsyncHttpClient(self._base_url, self._api_key, timeout=30.0) as http:
81
- return await http.get(f"{_api_base(self._base_url)}/learning/jobs/{job_id}")
82
-
83
- async def get_events(self, job_id: str, *, since_seq: int = 0, limit: int = 200) -> List[Dict[str, Any]]:
84
- params = {"since_seq": since_seq, "limit": limit}
85
- async with AsyncHttpClient(self._base_url, self._api_key, timeout=30.0) as http:
86
- try:
87
- js = await http.get(f"{_api_base(self._base_url)}/learning/jobs/{job_id}/events", params=params)
88
- except HTTPError as he:
89
- try:
90
- print(
91
- f"[poll] events HTTPError status={he.status} url={he.url} since_seq={since_seq} body={(he.body_snippet or '')[:200]}"
92
- )
93
- except Exception:
94
- pass
95
- raise
96
- if isinstance(js, dict):
97
- evs = js.get("events") or js.get("data")
98
- if isinstance(evs, list):
99
- return evs
100
- return []
101
-
102
- async def get_metrics(self, job_id: str, *, after_step: int = -1, limit: int = 200) -> List[Dict[str, Any]]:
103
- params = {"after_step": after_step, "limit": limit}
104
- async with AsyncHttpClient(self._base_url, self._api_key, timeout=30.0) as http:
105
- js = await http.get(f"{_api_base(self._base_url)}/learning/jobs/{job_id}/metrics", params=params)
106
- if isinstance(js, dict) and isinstance(js.get("points"), list):
107
- return js["points"]
108
- return []
109
-
110
- async def poll_until_terminal(
111
- self,
112
- job_id: str,
113
- *,
114
- interval_seconds: float = 2.0,
115
- max_seconds: float | None = None,
116
- empty_polls_threshold: int = 5,
117
- startup_deadline_s: int = 45,
118
- on_event: Optional[Callable[[Dict[str, Any]], None]] = None,
119
- on_metric: Optional[Callable[[Dict[str, Any]], None]] = None,
120
- ) -> Dict[str, Any]:
121
- last_seq_by_stream: Dict[str, int] = {}
122
- events_job_id: Optional[str] = None
123
- last_status: Optional[str] = None
124
- last_step_by_name: Dict[str, int] = {}
125
- empty_polls = 0
126
- saw_any_event = False
127
- start_t = time.time()
128
- terminal = {"succeeded", "failed", "cancelled", "canceled", "error", "completed"}
129
-
130
- while True:
131
- status_data: Optional[Dict[str, Any]] = None
132
- try:
133
- status_data = await self.get_job(job_id)
134
- except Exception:
135
- status_data = None
136
- if status_data is None:
137
- try:
138
- print(f"[poll] get_job returned None base={self._base_url} job_id={job_id}")
139
- except Exception:
140
- pass
141
- status = str((status_data or {}).get("status") or "").lower()
142
- if status_data:
143
- linked = status_data.get("linked_job_id")
144
- if isinstance(linked, str) and linked and linked != events_job_id:
145
- events_job_id = linked
146
- try:
147
- print(f"[poll] discovered linked_job_id stream={events_job_id}")
148
- except Exception:
149
- pass
150
- if status and status != last_status:
151
- last_status = status
152
- # Status transitions only to avoid log spam
153
- if on_event:
154
- try:
155
- on_event({"type": "rl.status", "message": status})
156
- except Exception:
157
- pass
158
-
159
- # Events
160
- stream_ids = [job_id]
161
- if events_job_id and events_job_id not in stream_ids:
162
- stream_ids.append(events_job_id)
163
- try:
164
- print(f"[poll] streams={stream_ids} intervals={interval_seconds}s since_map={last_seq_by_stream} empty_polls={empty_polls}")
165
- except Exception:
166
- pass
167
- total_events_this_cycle = 0
168
- terminal_event_seen = False
169
- terminal_event_status: Optional[str] = None
170
- for ev_id in stream_ids:
171
- since = last_seq_by_stream.get(ev_id, 0)
172
- try:
173
- events = await self.get_events(ev_id, since_seq=since, limit=200)
174
- except HTTPError as he:
175
- try:
176
- print(f"[poll] get_events error status={he.status} url={he.url} since={since} body={(he.body_snippet or '')[:200]}")
177
- except Exception:
178
- pass
179
- events = []
180
- except Exception as e:
181
- try:
182
- print(f"[poll] get_events unexpected error ev_id={ev_id} since={since} err={type(e).__name__}: {e}")
183
- except Exception:
184
- pass
185
- events = []
186
- total_events_this_cycle += len(events)
187
- if events:
188
- saw_any_event = True
189
- for e in events:
190
- seq_val = int(e.get("seq") or 0)
191
- if seq_val <= last_seq_by_stream.get(ev_id, 0):
192
- continue
193
- last_seq_by_stream[ev_id] = seq_val
194
- if on_event:
195
- try:
196
- on_event(e)
197
- except Exception:
198
- pass
199
- et = str(e.get("type") or e.get("event_type") or "").lower()
200
- if et in ("rl.job.completed", "workflow.completed", "rl.train.completed"):
201
- terminal_event_seen = True
202
- terminal_event_status = "succeeded"
203
- elif et in ("rl.job.failed", "workflow.failed"):
204
- terminal_event_seen = True
205
- terminal_event_status = "failed"
206
-
207
- # Metrics
208
- try:
209
- after = max(last_step_by_name.values()) if last_step_by_name else -1
210
- points = await self.get_metrics(job_id, after_step=after, limit=200)
211
- for p in points:
212
- name = str(p.get("name") or "")
213
- step = int(p.get("step") or -1)
214
- if step <= last_step_by_name.get(name, -1):
215
- continue
216
- last_step_by_name[name] = step
217
- if on_metric:
218
- try:
219
- on_metric(p)
220
- except Exception:
221
- pass
222
- except Exception:
223
- pass
224
-
225
- if terminal_event_seen:
226
- return {"status": terminal_event_status or status or "completed", "job_id": job_id}
227
- if status and status in terminal:
228
- return {"status": status, "job_id": job_id}
229
-
230
- if total_events_this_cycle == 0:
231
- empty_polls += 1
232
- else:
233
- empty_polls = 0
234
- if empty_polls >= max(1, int(empty_polls_threshold)):
235
- try:
236
- print(
237
- f"[poll] threshold hit: empty_polls={empty_polls} >= {empty_polls_threshold} streams={stream_ids} last_seq_map={last_seq_by_stream}"
238
- )
239
- except Exception:
240
- pass
241
- raise AssertionError(f"No new events detected for {empty_polls_threshold} consecutive polls. Check event ingestion.")
242
-
243
- if not saw_any_event and (time.time() - start_t) > int(startup_deadline_s):
244
- try:
245
- print(
246
- f"[poll] startup window exceeded: {startup_deadline_s}s base={self._base_url} job={job_id} streams={stream_ids} last_seq_map={last_seq_by_stream}"
247
- )
248
- except Exception:
249
- pass
250
- raise AssertionError(f"No events observed within startup window ({startup_deadline_s}s). Investigate event streaming.")
251
-
252
- await sleep(interval_seconds)
253
- if max_seconds is not None and (time.time() - start_t) >= max_seconds:
254
- raise TimeoutError(f"Polling timed out after {max_seconds}s for job {job_id}")
255
-
3
+ from .rl.client import RlClient
256
4
 
5
+ __all__ = ["RlClient"]
@@ -0,0 +1,29 @@
1
+ from .client import FtClient
2
+ from .data import (
3
+ SFTDataError,
4
+ SFTExample,
5
+ SFTMessage,
6
+ SFTToolCall,
7
+ SFTToolDefinition,
8
+ coerce_example,
9
+ collect_sft_jsonl_errors,
10
+ iter_sft_examples,
11
+ load_jsonl,
12
+ parse_jsonl_line,
13
+ validate_jsonl_or_raise,
14
+ )
15
+
16
# Names exported by this package. Entries are kept in the same alphabetical
# order as the import list above so the two are easy to compare side by side.
__all__ = [
    "FtClient",
    "SFTDataError",
    "SFTExample",
    "SFTMessage",
    "SFTToolCall",
    "SFTToolDefinition",
    "coerce_example",
    "collect_sft_jsonl_errors",
    "iter_sft_examples",
    "load_jsonl",
    "parse_jsonl_line",
    "validate_jsonl_or_raise",
]
@@ -0,0 +1,68 @@
1
+ from __future__ import annotations
2
+
3
+ from pathlib import Path
4
+ from typing import Any
5
+
6
+ from ...http import AsyncHttpClient, HTTPError
7
+ from .config import prepare_sft_job_payload
8
+ from .data import validate_jsonl_or_raise
9
+
10
+
11
class FtClient:
    """Async client for the fine-tuning endpoints under ``/api/learning``.

    Every request opens its own ``AsyncHttpClient`` context, configured with
    the base URL, API key and timeout stored on the instance.
    """

    def __init__(self, base_url: str, api_key: str, *, timeout: float = 30.0) -> None:
        """Store the connection settings.

        Args:
            base_url: Service root; trailing ``/`` characters are stripped.
            api_key: Credential handed to ``AsyncHttpClient``.
            timeout: Timeout value handed to ``AsyncHttpClient``.
        """
        self._base_url = base_url.rstrip("/")
        self._api_key = api_key
        self._timeout = timeout

    async def upload_training_file(self, path: str | Path, *, purpose: str = "fine-tune") -> str:
        """Upload the file at *path* and return the id reported by the server.

        A ``.jsonl`` file (case-insensitive suffix) uploaded with purpose
        ``"fine-tune"`` is first passed to ``validate_jsonl_or_raise`` with
        ``min_messages=2``; other files are uploaded without that step.

        Args:
            path: Location of the file to upload.
            purpose: Value sent in the ``purpose`` form field.

        Returns:
            The ``id`` field of the JSON response, converted to ``str``.

        Raises:
            HTTPError: With ``status=500`` and message
                ``invalid_upload_response`` when the response is not a dict
                containing an ``"id"`` key.
        """
        source = Path(path)
        needs_validation = purpose == "fine-tune" and source.suffix.lower() == ".jsonl"
        if needs_validation:
            validate_jsonl_or_raise(source, min_messages=2)

        # The whole file is read into memory before the HTTP client is opened.
        raw_bytes = source.read_bytes()
        async with AsyncHttpClient(self._base_url, self._api_key, timeout=self._timeout) as http:
            form_fields = {"purpose": purpose}
            form_files = {"file": (source.name, raw_bytes, _infer_content_type(source.name))}
            response = await http.post_multipart(
                "/api/learning/files", data=form_fields, files=form_files
            )

        if isinstance(response, dict) and "id" in response:
            return str(response["id"])
        # Anything else is reported as a server-side error, with a short
        # excerpt of the unexpected payload for debugging.
        raise HTTPError(
            status=500,
            url="/api/learning/files",
            message="invalid_upload_response",
            body_snippet=str(response)[:200],
        )

    async def create_sft_job(
        self,
        *,
        model: str,
        training_file_id: str,
        hyperparameters: dict[str, Any],
        metadata: dict[str, Any] | None = None,
    ) -> dict[str, Any]:
        """Create an SFT job and return the server's JSON response.

        The request body is built by ``prepare_sft_job_payload`` with
        ``training_type="sft_offline"``; the training file is required and is
        sent under the ``training_file_id`` field.

        Args:
            model: Model identifier forwarded to the payload builder.
            training_file_id: Id of a previously uploaded training file.
            hyperparameters: Hyperparameter mapping forwarded unchanged.
            metadata: Optional metadata mapping forwarded unchanged.

        Returns:
            Whatever ``post_json`` returns for ``/api/learning/jobs``.
        """
        payload = prepare_sft_job_payload(
            model=model,
            training_file=training_file_id,
            hyperparameters=hyperparameters,
            metadata=metadata,
            training_type="sft_offline",
            training_file_field="training_file_id",
            require_training_file=True,
        )
        async with AsyncHttpClient(self._base_url, self._api_key, timeout=self._timeout) as http:
            created = await http.post_json("/api/learning/jobs", json=payload)
            return created

    async def start_job(self, job_id: str) -> dict[str, Any]:
        """POST an empty JSON body to the job's ``/start`` endpoint and return the response."""
        endpoint = f"/api/learning/jobs/{job_id}/start"
        async with AsyncHttpClient(self._base_url, self._api_key, timeout=self._timeout) as http:
            started = await http.post_json(endpoint, json={})
            return started
58
+
59
+
60
+ def _infer_content_type(filename: str) -> str:
61
+ name = filename.lower()
62
+ if name.endswith(".jsonl"):
63
+ return "application/jsonl"
64
+ if name.endswith(".json"):
65
+ return "application/json"
66
+ if name.endswith(".txt"):
67
+ return "text/plain"
68
+ return "application/octet-stream"