synth-ai 0.2.6.dev1__py3-none-any.whl → 0.4.3__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (738) hide show
  1. synth_ai/__init__.py +44 -24
  2. synth_ai/__main__.py +30 -3
  3. synth_ai/cli/__init__.py +103 -48
  4. synth_ai/cli/__main__.py +42 -0
  5. synth_ai/cli/_internal/__init__.py +5 -0
  6. synth_ai/cli/_internal/modal_wrapper.py +31 -0
  7. synth_ai/cli/_internal/storage.py +20 -0
  8. synth_ai/cli/_internal/typer_patch.py +47 -0
  9. synth_ai/cli/_internal/validate_task_app.py +29 -0
  10. synth_ai/cli/agents/__init__.py +17 -0
  11. synth_ai/cli/agents/claude.py +77 -0
  12. synth_ai/cli/agents/codex.py +265 -0
  13. synth_ai/cli/agents/opencode.py +253 -0
  14. synth_ai/cli/commands/__init__.py +18 -0
  15. synth_ai/cli/commands/artifacts/__init__.py +13 -0
  16. synth_ai/cli/commands/artifacts/client.py +119 -0
  17. synth_ai/cli/commands/artifacts/config.py +57 -0
  18. synth_ai/cli/commands/artifacts/core.py +24 -0
  19. synth_ai/cli/commands/artifacts/download.py +188 -0
  20. synth_ai/cli/commands/artifacts/export.py +186 -0
  21. synth_ai/cli/commands/artifacts/list.py +156 -0
  22. synth_ai/cli/commands/artifacts/parsing.py +250 -0
  23. synth_ai/cli/commands/artifacts/show.py +336 -0
  24. synth_ai/cli/commands/demo/__init__.py +3 -0
  25. synth_ai/cli/commands/demo/core.py +153 -0
  26. synth_ai/cli/commands/eval/__init__.py +10 -0
  27. synth_ai/cli/commands/eval/config.py +338 -0
  28. synth_ai/cli/commands/eval/core.py +256 -0
  29. synth_ai/cli/commands/eval/runner.py +704 -0
  30. synth_ai/cli/commands/eval/validation.py +60 -0
  31. synth_ai/cli/commands/filter/__init__.py +12 -0
  32. synth_ai/cli/commands/filter/core.py +424 -0
  33. synth_ai/cli/commands/filter/errors.py +55 -0
  34. synth_ai/cli/commands/filter/validation.py +77 -0
  35. synth_ai/cli/commands/help/__init__.py +185 -0
  36. synth_ai/cli/commands/help/core.py +72 -0
  37. synth_ai/cli/commands/scan/__init__.py +19 -0
  38. synth_ai/cli/commands/scan/cloudflare_scanner.py +403 -0
  39. synth_ai/cli/commands/scan/core.py +344 -0
  40. synth_ai/cli/commands/scan/health_checker.py +242 -0
  41. synth_ai/cli/commands/scan/local_scanner.py +278 -0
  42. synth_ai/cli/commands/scan/models.py +83 -0
  43. synth_ai/cli/commands/smoke/__init__.py +7 -0
  44. synth_ai/cli/commands/smoke/core.py +1428 -0
  45. synth_ai/cli/commands/status/__init__.py +3 -0
  46. synth_ai/cli/commands/status/client.py +91 -0
  47. synth_ai/cli/commands/status/config.py +12 -0
  48. synth_ai/cli/commands/status/errors.py +11 -0
  49. synth_ai/cli/commands/status/subcommands/__init__.py +3 -0
  50. synth_ai/cli/commands/status/subcommands/config.py +13 -0
  51. synth_ai/cli/commands/status/subcommands/files.py +34 -0
  52. synth_ai/cli/commands/status/subcommands/jobs.py +51 -0
  53. synth_ai/cli/commands/status/subcommands/models.py +35 -0
  54. synth_ai/cli/commands/status/subcommands/runs.py +34 -0
  55. synth_ai/cli/commands/status/subcommands/session.py +77 -0
  56. synth_ai/cli/commands/status/subcommands/summary.py +39 -0
  57. synth_ai/cli/commands/status/subcommands/utils.py +41 -0
  58. synth_ai/cli/commands/status/utils.py +23 -0
  59. synth_ai/cli/commands/train/__init__.py +53 -0
  60. synth_ai/cli/commands/train/core.py +22 -0
  61. synth_ai/cli/commands/train/errors.py +117 -0
  62. synth_ai/cli/commands/train/judge_schemas.py +201 -0
  63. synth_ai/cli/commands/train/judge_validation.py +305 -0
  64. synth_ai/cli/commands/train/prompt_learning_validation.py +633 -0
  65. synth_ai/cli/commands/train/validation.py +392 -0
  66. synth_ai/cli/demo_apps/__init__.py +10 -0
  67. synth_ai/cli/demo_apps/core/__init__.py +28 -0
  68. synth_ai/cli/demo_apps/core/cli.py +1735 -0
  69. synth_ai/cli/demo_apps/crafter/__init__.py +1 -0
  70. synth_ai/cli/demo_apps/crafter/crafter_fft_4b.toml +55 -0
  71. synth_ai/cli/demo_apps/crafter/grpo_crafter_task_app.py +186 -0
  72. synth_ai/cli/demo_apps/crafter/rl_from_base_qwen4b.toml +74 -0
  73. synth_ai/cli/demo_apps/demo_registry.py +176 -0
  74. synth_ai/cli/demo_apps/demo_task_apps/__init__.py +7 -0
  75. synth_ai/{demos → cli/demo_apps}/demo_task_apps/core.py +117 -51
  76. synth_ai/cli/demo_apps/demo_task_apps/crafter/__init__.py +1 -0
  77. synth_ai/cli/demo_apps/demo_task_apps/crafter/configs/crafter_fft_4b.toml +53 -0
  78. synth_ai/cli/demo_apps/demo_task_apps/crafter/configs/rl_from_base_qwen4b.toml +73 -0
  79. synth_ai/cli/demo_apps/demo_task_apps/crafter/grpo_crafter_task_app.py +185 -0
  80. synth_ai/cli/demo_apps/demo_task_apps/math/_common.py +16 -0
  81. synth_ai/{demos → cli/demo_apps}/demo_task_apps/math/app.py +2 -1
  82. synth_ai/cli/demo_apps/demo_task_apps/math/config.toml +73 -0
  83. synth_ai/{demos → cli/demo_apps}/demo_task_apps/math/deploy_modal.py +3 -6
  84. synth_ai/cli/demo_apps/demo_task_apps/math/modal_task_app.py +738 -0
  85. synth_ai/cli/demo_apps/demo_task_apps/math/task_app_entry.py +39 -0
  86. synth_ai/cli/demo_apps/math/__init__.py +1 -0
  87. synth_ai/cli/demo_apps/math/_common.py +16 -0
  88. synth_ai/cli/demo_apps/math/app.py +38 -0
  89. synth_ai/cli/demo_apps/math/config.toml +75 -0
  90. synth_ai/cli/demo_apps/math/deploy_modal.py +54 -0
  91. synth_ai/cli/demo_apps/math/modal_task_app.py +698 -0
  92. synth_ai/cli/demo_apps/math/task_app_entry.py +53 -0
  93. synth_ai/cli/demo_apps/mipro/main.py +271 -0
  94. synth_ai/cli/demo_apps/mipro/task_app.py +922 -0
  95. synth_ai/cli/demo_apps/mipro/train_cfg.toml +92 -0
  96. synth_ai/cli/demos/__init__.py +12 -0
  97. synth_ai/cli/demos/demo.py +32 -0
  98. synth_ai/cli/demos/rl_demo.py +254 -0
  99. synth_ai/cli/deploy.py +216 -0
  100. synth_ai/cli/infra/__init__.py +14 -0
  101. synth_ai/cli/{balance.py → infra/balance.py} +21 -3
  102. synth_ai/cli/infra/mcp.py +35 -0
  103. synth_ai/cli/infra/modal_app.py +36 -0
  104. synth_ai/cli/infra/setup.py +69 -0
  105. synth_ai/cli/infra/status.py +16 -0
  106. synth_ai/cli/infra/turso.py +77 -0
  107. synth_ai/cli/lib/__init__.py +10 -0
  108. synth_ai/cli/lib/agents.py +76 -0
  109. synth_ai/cli/lib/apps/modal_app.py +101 -0
  110. synth_ai/cli/lib/apps/task_app.py +642 -0
  111. synth_ai/cli/lib/bin.py +39 -0
  112. synth_ai/cli/lib/env.py +375 -0
  113. synth_ai/cli/lib/errors.py +85 -0
  114. synth_ai/cli/lib/modal.py +315 -0
  115. synth_ai/cli/lib/plotting.py +126 -0
  116. synth_ai/cli/lib/prompt_args.py +39 -0
  117. synth_ai/cli/lib/prompts.py +284 -0
  118. synth_ai/cli/lib/sqld.py +122 -0
  119. synth_ai/cli/lib/task_app_discovery.py +884 -0
  120. synth_ai/cli/lib/task_app_env.py +295 -0
  121. synth_ai/cli/lib/train_cfgs.py +300 -0
  122. synth_ai/cli/lib/tunnel_records.py +207 -0
  123. synth_ai/cli/local/__init__.py +14 -0
  124. synth_ai/cli/local/experiment_queue/__init__.py +72 -0
  125. synth_ai/cli/local/experiment_queue/api_schemas.py +221 -0
  126. synth_ai/cli/local/experiment_queue/celery_app.py +208 -0
  127. synth_ai/cli/local/experiment_queue/config.py +128 -0
  128. synth_ai/cli/local/experiment_queue/config_utils.py +272 -0
  129. synth_ai/cli/local/experiment_queue/database.py +175 -0
  130. synth_ai/cli/local/experiment_queue/dispatcher.py +119 -0
  131. synth_ai/cli/local/experiment_queue/models.py +231 -0
  132. synth_ai/cli/local/experiment_queue/progress_info.py +160 -0
  133. synth_ai/cli/local/experiment_queue/results.py +373 -0
  134. synth_ai/cli/local/experiment_queue/schemas.py +131 -0
  135. synth_ai/cli/local/experiment_queue/service.py +344 -0
  136. synth_ai/cli/local/experiment_queue/status.py +372 -0
  137. synth_ai/cli/local/experiment_queue/status_tracker.py +360 -0
  138. synth_ai/cli/local/experiment_queue/tasks.py +1984 -0
  139. synth_ai/cli/local/experiment_queue/trace_storage.py +65 -0
  140. synth_ai/cli/local/experiment_queue/validation.py +157 -0
  141. synth_ai/cli/local/session/__init__.py +92 -0
  142. synth_ai/cli/local/session/client.py +383 -0
  143. synth_ai/cli/local/session/constants.py +63 -0
  144. synth_ai/cli/local/session/exceptions.py +105 -0
  145. synth_ai/cli/local/session/manager.py +139 -0
  146. synth_ai/cli/local/session/models.py +89 -0
  147. synth_ai/cli/local/session/query.py +110 -0
  148. synth_ai/cli/root.py +150 -102
  149. synth_ai/cli/task_apps/__init__.py +37 -0
  150. synth_ai/cli/task_apps/commands.py +3145 -0
  151. synth_ai/cli/task_apps/deploy.py +7 -0
  152. synth_ai/cli/task_apps/list.py +26 -0
  153. synth_ai/cli/task_apps/main.py +36 -0
  154. synth_ai/cli/task_apps/modal_serve.py +11 -0
  155. synth_ai/cli/task_apps/serve.py +11 -0
  156. synth_ai/cli/training/__init__.py +8 -0
  157. synth_ai/cli/training/train.py +5 -0
  158. synth_ai/cli/training/train_cfg.py +34 -0
  159. synth_ai/cli/{watch.py → training/watch.py} +13 -18
  160. synth_ai/cli/turso.py +52 -0
  161. synth_ai/cli/utils/__init__.py +8 -0
  162. synth_ai/cli/utils/experiments.py +235 -0
  163. synth_ai/cli/utils/queue.py +504 -0
  164. synth_ai/cli/{recent.py → utils/recent.py} +13 -7
  165. synth_ai/cli/{traces.py → utils/traces.py} +9 -5
  166. synth_ai/contracts/__init__.py +67 -0
  167. synth_ai/core/__init__.py +100 -0
  168. synth_ai/core/_utils/__init__.py +54 -0
  169. synth_ai/core/_utils/base_url.py +10 -0
  170. synth_ai/core/_utils/http.py +10 -0
  171. synth_ai/core/_utils/prompts.py +14 -0
  172. synth_ai/core/_utils/task_app_state.py +12 -0
  173. synth_ai/core/_utils/user_config.py +10 -0
  174. synth_ai/core/apps/common.py +116 -0
  175. synth_ai/core/auth.py +95 -0
  176. synth_ai/core/cfgs.py +240 -0
  177. synth_ai/core/config/__init__.py +16 -0
  178. synth_ai/core/config/base.py +168 -0
  179. synth_ai/core/config/resolver.py +89 -0
  180. synth_ai/core/env.py +231 -0
  181. synth_ai/core/errors.py +126 -0
  182. synth_ai/core/http.py +230 -0
  183. synth_ai/core/integrations/__init__.py +11 -0
  184. synth_ai/core/integrations/cloudflare.py +1710 -0
  185. synth_ai/core/integrations/mcp/__init__.py +6 -0
  186. synth_ai/core/integrations/mcp/__main__.py +8 -0
  187. synth_ai/core/integrations/mcp/claude.py +36 -0
  188. synth_ai/core/integrations/mcp/main.py +254 -0
  189. synth_ai/core/integrations/mcp/setup.py +100 -0
  190. synth_ai/core/integrations/modal.py +277 -0
  191. synth_ai/core/json.py +72 -0
  192. synth_ai/core/log_filter.py +99 -0
  193. synth_ai/core/logging.py +82 -0
  194. synth_ai/core/paths.py +107 -0
  195. synth_ai/core/pricing.py +109 -0
  196. synth_ai/core/process.py +233 -0
  197. synth_ai/core/ssl.py +25 -0
  198. synth_ai/core/storage/__init__.py +71 -0
  199. synth_ai/core/task_app_state.py +318 -0
  200. synth_ai/core/telemetry.py +282 -0
  201. synth_ai/{tracing_v3 → core/tracing_v3}/__init__.py +5 -1
  202. synth_ai/{tracing_v3 → core/tracing_v3}/abstractions.py +21 -4
  203. synth_ai/core/tracing_v3/config.py +229 -0
  204. synth_ai/core/tracing_v3/constants.py +21 -0
  205. synth_ai/{tracing_v3 → core/tracing_v3}/db_config.py +42 -29
  206. synth_ai/{tracing_v3 → core/tracing_v3}/decorators.py +80 -45
  207. synth_ai/{tracing_v3 → core/tracing_v3}/examples/basic_usage.py +15 -9
  208. synth_ai/{tracing_v3 → core/tracing_v3}/hooks.py +6 -4
  209. synth_ai/{tracing_v3 → core/tracing_v3}/llm_call_record_helpers.py +161 -61
  210. synth_ai/{tracing_v3 → core/tracing_v3}/migration_helper.py +1 -2
  211. synth_ai/{tracing_v3 → core/tracing_v3}/replica_sync.py +12 -7
  212. synth_ai/core/tracing_v3/serialization.py +130 -0
  213. synth_ai/{tracing_v3 → core/tracing_v3}/session_tracer.py +88 -21
  214. synth_ai/{tracing_v3 → core/tracing_v3}/storage/base.py +99 -12
  215. synth_ai/core/tracing_v3/storage/config.py +109 -0
  216. synth_ai/{tracing_v3 → core/tracing_v3}/storage/factory.py +11 -9
  217. synth_ai/{tracing_v3 → core/tracing_v3}/storage/utils.py +15 -11
  218. synth_ai/core/tracing_v3/trace_utils.py +326 -0
  219. synth_ai/core/tracing_v3/turso/__init__.py +12 -0
  220. synth_ai/core/tracing_v3/turso/daemon.py +278 -0
  221. synth_ai/{tracing_v3 → core/tracing_v3}/turso/models.py +7 -3
  222. synth_ai/core/tracing_v3/turso/native_manager.py +1385 -0
  223. synth_ai/{tracing_v3 → core/tracing_v3}/utils.py +5 -4
  224. synth_ai/core/urls.py +18 -0
  225. synth_ai/core/user_config.py +137 -0
  226. synth_ai/core/uvicorn.py +222 -0
  227. synth_ai/data/__init__.py +83 -0
  228. synth_ai/data/enums.py +123 -0
  229. synth_ai/data/rewards.py +152 -0
  230. synth_ai/data/traces.py +35 -0
  231. synth_ai/products/__init__.py +6 -0
  232. synth_ai/products/graph_evolve/__init__.py +46 -0
  233. synth_ai/products/graph_evolve/client.py +226 -0
  234. synth_ai/products/graph_evolve/config.py +591 -0
  235. synth_ai/products/graph_evolve/converters/__init__.py +42 -0
  236. synth_ai/products/graph_evolve/converters/openai_sft.py +484 -0
  237. synth_ai/products/graph_evolve/examples/hotpotqa/config.toml +109 -0
  238. synth_ai/products/graph_evolve/run.py +222 -0
  239. synth_ai/products/graph_gepa/__init__.py +23 -0
  240. synth_ai/products/graph_gepa/converters/__init__.py +19 -0
  241. synth_ai/products/graph_gepa/converters/openai_sft.py +29 -0
  242. synth_ai/sdk/__init__.py +123 -0
  243. synth_ai/sdk/api/__init__.py +1 -0
  244. synth_ai/sdk/api/models/supported.py +514 -0
  245. synth_ai/sdk/api/research_agent/__init__.py +296 -0
  246. synth_ai/sdk/api/train/__init__.py +85 -0
  247. synth_ai/sdk/api/train/builders.py +895 -0
  248. synth_ai/sdk/api/train/cli.py +2199 -0
  249. synth_ai/sdk/api/train/config_finder.py +267 -0
  250. synth_ai/sdk/api/train/configs/__init__.py +65 -0
  251. synth_ai/sdk/api/train/configs/prompt_learning.py +1706 -0
  252. synth_ai/sdk/api/train/configs/rl.py +187 -0
  253. synth_ai/sdk/api/train/configs/sft.py +99 -0
  254. synth_ai/sdk/api/train/configs/shared.py +81 -0
  255. synth_ai/sdk/api/train/context_learning.py +312 -0
  256. synth_ai/sdk/api/train/env_resolver.py +418 -0
  257. synth_ai/sdk/api/train/graph_validators.py +216 -0
  258. synth_ai/sdk/api/train/graphgen.py +984 -0
  259. synth_ai/sdk/api/train/graphgen_models.py +823 -0
  260. synth_ai/sdk/api/train/graphgen_validators.py +109 -0
  261. synth_ai/sdk/api/train/local_api.py +10 -0
  262. synth_ai/sdk/api/train/pollers.py +124 -0
  263. synth_ai/sdk/api/train/progress/__init__.py +97 -0
  264. synth_ai/sdk/api/train/progress/dataclasses.py +569 -0
  265. synth_ai/sdk/api/train/progress/events.py +326 -0
  266. synth_ai/sdk/api/train/progress/results.py +428 -0
  267. synth_ai/sdk/api/train/progress/tracker.py +641 -0
  268. synth_ai/sdk/api/train/prompt_learning.py +469 -0
  269. synth_ai/sdk/api/train/rl.py +441 -0
  270. synth_ai/sdk/api/train/sft.py +396 -0
  271. synth_ai/sdk/api/train/summary.py +522 -0
  272. synth_ai/sdk/api/train/supported_algos.py +147 -0
  273. synth_ai/sdk/api/train/task_app.py +351 -0
  274. synth_ai/sdk/api/train/utils.py +279 -0
  275. synth_ai/sdk/api/train/validators.py +2424 -0
  276. synth_ai/sdk/graphs/__init__.py +15 -0
  277. synth_ai/sdk/graphs/completions.py +570 -0
  278. synth_ai/{inference → sdk/inference}/__init__.py +0 -1
  279. synth_ai/sdk/inference/client.py +128 -0
  280. synth_ai/sdk/jobs/__init__.py +16 -0
  281. synth_ai/sdk/jobs/client.py +371 -0
  282. synth_ai/sdk/judging/__init__.py +14 -0
  283. synth_ai/sdk/judging/base.py +24 -0
  284. synth_ai/sdk/judging/client.py +40 -0
  285. synth_ai/sdk/judging/schemas.py +222 -0
  286. synth_ai/sdk/judging/types.py +42 -0
  287. synth_ai/sdk/learning/__init__.py +99 -0
  288. synth_ai/sdk/learning/algorithms.py +14 -0
  289. synth_ai/{learning → sdk/learning}/client.py +121 -30
  290. synth_ai/sdk/learning/config.py +5 -0
  291. synth_ai/{learning → sdk/learning}/constants.py +0 -2
  292. synth_ai/sdk/learning/context_learning_client.py +531 -0
  293. synth_ai/sdk/learning/context_learning_types.py +292 -0
  294. synth_ai/sdk/learning/ft_client.py +7 -0
  295. synth_ai/{learning → sdk/learning}/health.py +15 -9
  296. synth_ai/{learning → sdk/learning}/jobs.py +44 -47
  297. synth_ai/sdk/learning/prompt_extraction.py +334 -0
  298. synth_ai/sdk/learning/prompt_learning_client.py +455 -0
  299. synth_ai/sdk/learning/prompt_learning_types.py +186 -0
  300. synth_ai/{rl → sdk/learning/rl}/__init__.py +13 -8
  301. synth_ai/{learning/rl_client.py → sdk/learning/rl/client.py} +89 -77
  302. synth_ai/sdk/learning/rl/config.py +31 -0
  303. synth_ai/{rl → sdk/learning/rl}/contracts.py +5 -14
  304. synth_ai/{rl → sdk/learning/rl}/env_keys.py +45 -16
  305. synth_ai/sdk/learning/rl/secrets.py +13 -0
  306. synth_ai/sdk/learning/rl_client.py +5 -0
  307. synth_ai/sdk/learning/sft/__init__.py +29 -0
  308. synth_ai/sdk/learning/sft/client.py +95 -0
  309. synth_ai/sdk/learning/sft/config.py +270 -0
  310. synth_ai/sdk/learning/sft/data.py +698 -0
  311. synth_ai/sdk/learning/sse.py +57 -0
  312. synth_ai/sdk/learning/validators.py +52 -0
  313. synth_ai/sdk/localapi/__init__.py +40 -0
  314. synth_ai/sdk/localapi/apps/__init__.py +28 -0
  315. synth_ai/sdk/localapi/client.py +10 -0
  316. synth_ai/sdk/localapi/contracts.py +10 -0
  317. synth_ai/sdk/localapi/helpers.py +519 -0
  318. synth_ai/sdk/localapi/rollouts.py +87 -0
  319. synth_ai/sdk/localapi/server.py +29 -0
  320. synth_ai/sdk/localapi/template.py +70 -0
  321. synth_ai/sdk/streaming/__init__.py +35 -0
  322. synth_ai/sdk/streaming/config.py +94 -0
  323. synth_ai/sdk/streaming/handlers.py +1997 -0
  324. synth_ai/sdk/streaming/streamer.py +713 -0
  325. synth_ai/sdk/streaming/types.py +112 -0
  326. synth_ai/sdk/task/__init__.py +164 -0
  327. synth_ai/sdk/task/apps/__init__.py +169 -0
  328. synth_ai/sdk/task/auth.py +165 -0
  329. synth_ai/sdk/task/client.py +175 -0
  330. synth_ai/sdk/task/config.py +257 -0
  331. synth_ai/sdk/task/contracts.py +219 -0
  332. synth_ai/sdk/task/datasets.py +108 -0
  333. synth_ai/sdk/task/errors.py +50 -0
  334. synth_ai/sdk/task/health.py +34 -0
  335. synth_ai/sdk/task/in_process.py +1190 -0
  336. synth_ai/sdk/task/in_process_runner.py +314 -0
  337. synth_ai/sdk/task/inference_api.py +299 -0
  338. synth_ai/sdk/task/json.py +111 -0
  339. synth_ai/sdk/task/proxy.py +287 -0
  340. synth_ai/sdk/task/rubrics/__init__.py +55 -0
  341. synth_ai/sdk/task/rubrics/loaders.py +156 -0
  342. synth_ai/sdk/task/rubrics/models.py +57 -0
  343. synth_ai/sdk/task/rubrics/scoring.py +116 -0
  344. synth_ai/sdk/task/rubrics/strict.py +149 -0
  345. synth_ai/sdk/task/rubrics.py +219 -0
  346. synth_ai/sdk/task/server.py +631 -0
  347. synth_ai/sdk/task/trace_correlation_helpers.py +539 -0
  348. synth_ai/sdk/task/tracing_utils.py +95 -0
  349. synth_ai/sdk/task/validators.py +441 -0
  350. synth_ai/sdk/task/vendors.py +59 -0
  351. synth_ai/sdk/training/__init__.py +102 -0
  352. synth_ai/sdk/tunnels/__init__.py +83 -0
  353. synth_ai/sdk/tunnels/cleanup.py +83 -0
  354. synth_ai/sdk/tunnels/ports.py +120 -0
  355. synth_ai/utils/__init__.py +213 -0
  356. synth_ai-0.4.3.dist-info/METADATA +262 -0
  357. synth_ai-0.4.3.dist-info/RECORD +370 -0
  358. {synth_ai-0.2.6.dev1.dist-info → synth_ai-0.4.3.dist-info}/entry_points.txt +0 -1
  359. synth_ai/cli/calc.py +0 -69
  360. synth_ai/cli/demo.py +0 -131
  361. synth_ai/cli/legacy_root_backup.py +0 -470
  362. synth_ai/cli/man.py +0 -106
  363. synth_ai/cli/rl_demo.py +0 -137
  364. synth_ai/cli/status.py +0 -133
  365. synth_ai/config/base_url.py +0 -98
  366. synth_ai/core/experiment.py +0 -15
  367. synth_ai/core/system.py +0 -15
  368. synth_ai/demos/core/__init__.py +0 -1
  369. synth_ai/demos/core/cli.py +0 -685
  370. synth_ai/demos/demo_task_apps/__init__.py +0 -1
  371. synth_ai/demos/demo_task_apps/math/config.toml +0 -44
  372. synth_ai/demos/demo_task_apps/math/deploy_task_app.sh +0 -22
  373. synth_ai/environments/__init__.py +0 -31
  374. synth_ai/environments/environment/__init__.py +0 -1
  375. synth_ai/environments/environment/artifacts/__init__.py +0 -1
  376. synth_ai/environments/environment/artifacts/base.py +0 -52
  377. synth_ai/environments/environment/core.py +0 -67
  378. synth_ai/environments/environment/db/__init__.py +0 -1
  379. synth_ai/environments/environment/db/sqlite.py +0 -45
  380. synth_ai/environments/environment/registry.py +0 -233
  381. synth_ai/environments/environment/resources/sqlite.py +0 -45
  382. synth_ai/environments/environment/results.py +0 -1
  383. synth_ai/environments/environment/rewards/__init__.py +0 -1
  384. synth_ai/environments/environment/rewards/core.py +0 -29
  385. synth_ai/environments/environment/shared_engine.py +0 -26
  386. synth_ai/environments/environment/tools/__init__.py +0 -200
  387. synth_ai/environments/examples/__init__.py +0 -1
  388. synth_ai/environments/examples/bandit/__init__.py +0 -33
  389. synth_ai/environments/examples/bandit/engine.py +0 -294
  390. synth_ai/environments/examples/bandit/environment.py +0 -194
  391. synth_ai/environments/examples/bandit/taskset.py +0 -200
  392. synth_ai/environments/examples/crafter_classic/__init__.py +0 -8
  393. synth_ai/environments/examples/crafter_classic/agent_demos/analyze_semantic_words_markdown.py +0 -250
  394. synth_ai/environments/examples/crafter_classic/agent_demos/crafter_comprehensive_evaluation.py +0 -59
  395. synth_ai/environments/examples/crafter_classic/agent_demos/crafter_evaluation_browser.py +0 -152
  396. synth_ai/environments/examples/crafter_classic/agent_demos/crafter_evaluation_config.toml +0 -24
  397. synth_ai/environments/examples/crafter_classic/agent_demos/crafter_evaluation_framework.py +0 -1194
  398. synth_ai/environments/examples/crafter_classic/agent_demos/crafter_modal_ft/crafter_synth_config.toml +0 -56
  399. synth_ai/environments/examples/crafter_classic/agent_demos/crafter_modal_ft/filter_config_modal.toml +0 -32
  400. synth_ai/environments/examples/crafter_classic/agent_demos/crafter_modal_ft/filter_traces_sft_turso.py +0 -724
  401. synth_ai/environments/examples/crafter_classic/agent_demos/crafter_modal_ft/kick_off_ft_modal.py +0 -384
  402. synth_ai/environments/examples/crafter_classic/agent_demos/crafter_modal_ft/old/analyze_action_results.py +0 -53
  403. synth_ai/environments/examples/crafter_classic/agent_demos/crafter_modal_ft/old/analyze_agent_actions.py +0 -178
  404. synth_ai/environments/examples/crafter_classic/agent_demos/crafter_modal_ft/old/analyze_latest_run.py +0 -222
  405. synth_ai/environments/examples/crafter_classic/agent_demos/crafter_modal_ft/old/analyze_lm_traces.py +0 -183
  406. synth_ai/environments/examples/crafter_classic/agent_demos/crafter_modal_ft/old/analyze_no_rewards.py +0 -210
  407. synth_ai/environments/examples/crafter_classic/agent_demos/crafter_modal_ft/old/analyze_trace_issue.py +0 -206
  408. synth_ai/environments/examples/crafter_classic/agent_demos/crafter_modal_ft/old/check_db_schema.py +0 -49
  409. synth_ai/environments/examples/crafter_classic/agent_demos/crafter_modal_ft/old/check_latest_results.py +0 -64
  410. synth_ai/environments/examples/crafter_classic/agent_demos/crafter_modal_ft/old/debug_agent_responses.py +0 -88
  411. synth_ai/environments/examples/crafter_classic/agent_demos/crafter_modal_ft/old/quick_trace_check.py +0 -77
  412. synth_ai/environments/examples/crafter_classic/agent_demos/crafter_openai_ft/compare_experiments.py +0 -324
  413. synth_ai/environments/examples/crafter_classic/agent_demos/crafter_openai_ft/filter_traces_sft_turso.py +0 -580
  414. synth_ai/environments/examples/crafter_classic/agent_demos/crafter_openai_ft/kick_off_ft_oai.py +0 -362
  415. synth_ai/environments/examples/crafter_classic/agent_demos/crafter_openai_ft/multi_model_config.toml +0 -49
  416. synth_ai/environments/examples/crafter_classic/agent_demos/crafter_openai_ft/old/analyze_enhanced_hooks.py +0 -332
  417. synth_ai/environments/examples/crafter_classic/agent_demos/crafter_openai_ft/old/analyze_hook_events.py +0 -97
  418. synth_ai/environments/examples/crafter_classic/agent_demos/crafter_openai_ft/old/analyze_hook_results.py +0 -217
  419. synth_ai/environments/examples/crafter_classic/agent_demos/crafter_openai_ft/old/check_hook_storage.py +0 -87
  420. synth_ai/environments/examples/crafter_classic/agent_demos/crafter_openai_ft/old/check_seeds.py +0 -88
  421. synth_ai/environments/examples/crafter_classic/agent_demos/crafter_openai_ft/old/compare_seed_performance.py +0 -195
  422. synth_ai/environments/examples/crafter_classic/agent_demos/crafter_openai_ft/old/custom_eval_pipelines.py +0 -400
  423. synth_ai/environments/examples/crafter_classic/agent_demos/crafter_openai_ft/old/plot_hook_frequency.py +0 -195
  424. synth_ai/environments/examples/crafter_classic/agent_demos/crafter_openai_ft/old/seed_analysis_summary.py +0 -56
  425. synth_ai/environments/examples/crafter_classic/agent_demos/crafter_openai_ft/run_rollouts_for_models_and_compare_v3.py +0 -858
  426. synth_ai/environments/examples/crafter_classic/agent_demos/crafter_quick_evaluation.py +0 -52
  427. synth_ai/environments/examples/crafter_classic/agent_demos/crafter_react_agent.py +0 -874
  428. synth_ai/environments/examples/crafter_classic/agent_demos/crafter_trace_evaluation.py +0 -1412
  429. synth_ai/environments/examples/crafter_classic/agent_demos/example_v3_usage.py +0 -216
  430. synth_ai/environments/examples/crafter_classic/agent_demos/old/compare_traces.py +0 -296
  431. synth_ai/environments/examples/crafter_classic/agent_demos/old/crafter_comprehensive_evaluation.py +0 -58
  432. synth_ai/environments/examples/crafter_classic/agent_demos/old/crafter_env_serialization.py +0 -464
  433. synth_ai/environments/examples/crafter_classic/agent_demos/old/crafter_evaluation_browser.py +0 -152
  434. synth_ai/environments/examples/crafter_classic/agent_demos/old/crafter_quick_evaluation.py +0 -51
  435. synth_ai/environments/examples/crafter_classic/agent_demos/old/crafter_trace_evaluation.py +0 -1412
  436. synth_ai/environments/examples/crafter_classic/agent_demos/old/debug_player_loss.py +0 -112
  437. synth_ai/environments/examples/crafter_classic/agent_demos/old/diagnose_service.py +0 -203
  438. synth_ai/environments/examples/crafter_classic/agent_demos/old/diagnose_slowness.py +0 -305
  439. synth_ai/environments/examples/crafter_classic/agent_demos/old/eval_by_difficulty.py +0 -126
  440. synth_ai/environments/examples/crafter_classic/agent_demos/old/eval_example.py +0 -94
  441. synth_ai/environments/examples/crafter_classic/agent_demos/old/explore_saved_states.py +0 -142
  442. synth_ai/environments/examples/crafter_classic/agent_demos/old/filter_traces_sft.py +0 -26
  443. synth_ai/environments/examples/crafter_classic/agent_demos/old/filter_traces_sft_OLD.py +0 -984
  444. synth_ai/environments/examples/crafter_classic/agent_demos/old/generate_ft_data_gemini.py +0 -724
  445. synth_ai/environments/examples/crafter_classic/agent_demos/old/generate_ft_data_modal.py +0 -386
  446. synth_ai/environments/examples/crafter_classic/agent_demos/old/generate_ft_metadata.py +0 -205
  447. synth_ai/environments/examples/crafter_classic/agent_demos/old/kick_off_ft_gemini.py +0 -150
  448. synth_ai/environments/examples/crafter_classic/agent_demos/old/kick_off_ft_modal.py +0 -283
  449. synth_ai/environments/examples/crafter_classic/agent_demos/old/prepare_vertex_ft.py +0 -280
  450. synth_ai/environments/examples/crafter_classic/agent_demos/old/profile_env_slowness.py +0 -456
  451. synth_ai/environments/examples/crafter_classic/agent_demos/old/replicate_issue.py +0 -166
  452. synth_ai/environments/examples/crafter_classic/agent_demos/old/run_and_eval.py +0 -102
  453. synth_ai/environments/examples/crafter_classic/agent_demos/old/run_comparison.py +0 -128
  454. synth_ai/environments/examples/crafter_classic/agent_demos/old/run_qwen_rollouts.py +0 -655
  455. synth_ai/environments/examples/crafter_classic/agent_demos/old/trace_eval_OLD.py +0 -202
  456. synth_ai/environments/examples/crafter_classic/agent_demos/old/validate_openai_format.py +0 -166
  457. synth_ai/environments/examples/crafter_classic/config_logging.py +0 -111
  458. synth_ai/environments/examples/crafter_classic/debug_translation.py +0 -0
  459. synth_ai/environments/examples/crafter_classic/engine.py +0 -579
  460. synth_ai/environments/examples/crafter_classic/engine_deterministic_patch.py +0 -64
  461. synth_ai/environments/examples/crafter_classic/engine_helpers/action_map.py +0 -6
  462. synth_ai/environments/examples/crafter_classic/engine_helpers/serialization.py +0 -75
  463. synth_ai/environments/examples/crafter_classic/engine_serialization_patch_v3.py +0 -267
  464. synth_ai/environments/examples/crafter_classic/environment.py +0 -404
  465. synth_ai/environments/examples/crafter_classic/taskset.py +0 -233
  466. synth_ai/environments/examples/crafter_classic/trace_hooks_v3.py +0 -228
  467. synth_ai/environments/examples/crafter_classic/world_config_patch_simple.py +0 -299
  468. synth_ai/environments/examples/crafter_custom/__init__.py +0 -4
  469. synth_ai/environments/examples/crafter_custom/agent_demos/__init__.py +0 -1
  470. synth_ai/environments/examples/crafter_custom/agent_demos/trace_eval.py +0 -202
  471. synth_ai/environments/examples/crafter_custom/crafter/__init__.py +0 -7
  472. synth_ai/environments/examples/crafter_custom/crafter/config.py +0 -182
  473. synth_ai/environments/examples/crafter_custom/crafter/constants.py +0 -8
  474. synth_ai/environments/examples/crafter_custom/crafter/engine.py +0 -269
  475. synth_ai/environments/examples/crafter_custom/crafter/env.py +0 -262
  476. synth_ai/environments/examples/crafter_custom/crafter/objects.py +0 -417
  477. synth_ai/environments/examples/crafter_custom/crafter/recorder.py +0 -187
  478. synth_ai/environments/examples/crafter_custom/crafter/worldgen.py +0 -118
  479. synth_ai/environments/examples/crafter_custom/dataset_builder.py +0 -373
  480. synth_ai/environments/examples/crafter_custom/environment.py +0 -312
  481. synth_ai/environments/examples/crafter_custom/old/analyze_diamond_issue.py +0 -159
  482. synth_ai/environments/examples/crafter_custom/old/analyze_diamond_spawning.py +0 -158
  483. synth_ai/environments/examples/crafter_custom/old/compare_worlds.py +0 -71
  484. synth_ai/environments/examples/crafter_custom/old/dataset_stats.py +0 -105
  485. synth_ai/environments/examples/crafter_custom/old/diamond_spawning_summary.py +0 -119
  486. synth_ai/environments/examples/crafter_custom/old/example_dataset_usage.py +0 -52
  487. synth_ai/environments/examples/crafter_custom/run_dataset.py +0 -305
  488. synth_ai/environments/examples/enron/art_helpers/email_search_tools.py +0 -156
  489. synth_ai/environments/examples/enron/art_helpers/local_email_db.py +0 -281
  490. synth_ai/environments/examples/enron/art_helpers/types_enron.py +0 -25
  491. synth_ai/environments/examples/enron/engine.py +0 -295
  492. synth_ai/environments/examples/enron/environment.py +0 -166
  493. synth_ai/environments/examples/enron/taskset.py +0 -112
  494. synth_ai/environments/examples/enron/units/keyword_stats.py +0 -112
  495. synth_ai/environments/examples/minigrid/__init__.py +0 -48
  496. synth_ai/environments/examples/minigrid/agent_demos/minigrid_evaluation_framework.py +0 -1188
  497. synth_ai/environments/examples/minigrid/agent_demos/minigrid_quick_evaluation.py +0 -48
  498. synth_ai/environments/examples/minigrid/agent_demos/minigrid_react_agent.py +0 -562
  499. synth_ai/environments/examples/minigrid/agent_demos/minigrid_trace_evaluation.py +0 -221
  500. synth_ai/environments/examples/minigrid/engine.py +0 -589
  501. synth_ai/environments/examples/minigrid/environment.py +0 -274
  502. synth_ai/environments/examples/minigrid/environment_mapping.py +0 -242
  503. synth_ai/environments/examples/minigrid/puzzle_loader.py +0 -417
  504. synth_ai/environments/examples/minigrid/taskset.py +0 -583
  505. synth_ai/environments/examples/nethack/__init__.py +0 -7
  506. synth_ai/environments/examples/nethack/achievements.py +0 -337
  507. synth_ai/environments/examples/nethack/agent_demos/nethack_evaluation_framework.py +0 -981
  508. synth_ai/environments/examples/nethack/agent_demos/nethack_quick_evaluation.py +0 -74
  509. synth_ai/environments/examples/nethack/agent_demos/nethack_react_agent.py +0 -831
  510. synth_ai/environments/examples/nethack/engine.py +0 -739
  511. synth_ai/environments/examples/nethack/environment.py +0 -256
  512. synth_ai/environments/examples/nethack/helpers/__init__.py +0 -41
  513. synth_ai/environments/examples/nethack/helpers/action_mapping.py +0 -301
  514. synth_ai/environments/examples/nethack/helpers/nle_wrapper.py +0 -402
  515. synth_ai/environments/examples/nethack/helpers/observation_utils.py +0 -433
  516. synth_ai/environments/examples/nethack/helpers/recording_wrapper.py +0 -200
  517. synth_ai/environments/examples/nethack/helpers/trajectory_recorder.py +0 -269
  518. synth_ai/environments/examples/nethack/helpers/visualization/replay_viewer.py +0 -308
  519. synth_ai/environments/examples/nethack/helpers/visualization/visualizer.py +0 -431
  520. synth_ai/environments/examples/nethack/taskset.py +0 -323
  521. synth_ai/environments/examples/red/__init__.py +0 -7
  522. synth_ai/environments/examples/red/agent_demos/__init__.py +0 -1
  523. synth_ai/environments/examples/red/config_logging.py +0 -110
  524. synth_ai/environments/examples/red/engine.py +0 -694
  525. synth_ai/environments/examples/red/engine_helpers/__init__.py +0 -1
  526. synth_ai/environments/examples/red/engine_helpers/memory_map.py +0 -28
  527. synth_ai/environments/examples/red/engine_helpers/reward_components.py +0 -276
  528. synth_ai/environments/examples/red/engine_helpers/reward_library/__init__.py +0 -142
  529. synth_ai/environments/examples/red/engine_helpers/reward_library/adaptive_rewards.py +0 -57
  530. synth_ai/environments/examples/red/engine_helpers/reward_library/battle_rewards.py +0 -284
  531. synth_ai/environments/examples/red/engine_helpers/reward_library/composite_rewards.py +0 -150
  532. synth_ai/environments/examples/red/engine_helpers/reward_library/economy_rewards.py +0 -138
  533. synth_ai/environments/examples/red/engine_helpers/reward_library/efficiency_rewards.py +0 -57
  534. synth_ai/environments/examples/red/engine_helpers/reward_library/exploration_rewards.py +0 -331
  535. synth_ai/environments/examples/red/engine_helpers/reward_library/novelty_rewards.py +0 -121
  536. synth_ai/environments/examples/red/engine_helpers/reward_library/pallet_town_rewards.py +0 -559
  537. synth_ai/environments/examples/red/engine_helpers/reward_library/pokemon_rewards.py +0 -313
  538. synth_ai/environments/examples/red/engine_helpers/reward_library/social_rewards.py +0 -148
  539. synth_ai/environments/examples/red/engine_helpers/reward_library/story_rewards.py +0 -247
  540. synth_ai/environments/examples/red/engine_helpers/screen_analysis.py +0 -368
  541. synth_ai/environments/examples/red/engine_helpers/state_extraction.py +0 -140
  542. synth_ai/environments/examples/red/environment.py +0 -238
  543. synth_ai/environments/examples/red/taskset.py +0 -79
  544. synth_ai/environments/examples/red/units/__init__.py +0 -1
  545. synth_ai/environments/examples/sokoban/__init__.py +0 -1
  546. synth_ai/environments/examples/sokoban/agent_demos/sokoban_full_eval.py +0 -899
  547. synth_ai/environments/examples/sokoban/engine.py +0 -678
  548. synth_ai/environments/examples/sokoban/engine_helpers/__init__.py +0 -1
  549. synth_ai/environments/examples/sokoban/engine_helpers/room_utils.py +0 -657
  550. synth_ai/environments/examples/sokoban/engine_helpers/vendored/__init__.py +0 -18
  551. synth_ai/environments/examples/sokoban/engine_helpers/vendored/envs/__init__.py +0 -3
  552. synth_ai/environments/examples/sokoban/engine_helpers/vendored/envs/boxoban_env.py +0 -131
  553. synth_ai/environments/examples/sokoban/engine_helpers/vendored/envs/render_utils.py +0 -370
  554. synth_ai/environments/examples/sokoban/engine_helpers/vendored/envs/room_utils.py +0 -332
  555. synth_ai/environments/examples/sokoban/engine_helpers/vendored/envs/sokoban_env.py +0 -306
  556. synth_ai/environments/examples/sokoban/engine_helpers/vendored/envs/sokoban_env_fixed_targets.py +0 -67
  557. synth_ai/environments/examples/sokoban/engine_helpers/vendored/envs/sokoban_env_pull.py +0 -115
  558. synth_ai/environments/examples/sokoban/engine_helpers/vendored/envs/sokoban_env_two_player.py +0 -123
  559. synth_ai/environments/examples/sokoban/engine_helpers/vendored/envs/sokoban_env_variations.py +0 -394
  560. synth_ai/environments/examples/sokoban/environment.py +0 -229
  561. synth_ai/environments/examples/sokoban/generate_verified_puzzles.py +0 -440
  562. synth_ai/environments/examples/sokoban/puzzle_loader.py +0 -312
  563. synth_ai/environments/examples/sokoban/taskset.py +0 -428
  564. synth_ai/environments/examples/sokoban/units/astar_common.py +0 -95
  565. synth_ai/environments/examples/tictactoe/__init__.py +0 -1
  566. synth_ai/environments/examples/tictactoe/engine.py +0 -368
  567. synth_ai/environments/examples/tictactoe/environment.py +0 -240
  568. synth_ai/environments/examples/tictactoe/taskset.py +0 -215
  569. synth_ai/environments/examples/verilog/__init__.py +0 -10
  570. synth_ai/environments/examples/verilog/engine.py +0 -329
  571. synth_ai/environments/examples/verilog/environment.py +0 -350
  572. synth_ai/environments/examples/verilog/taskset.py +0 -420
  573. synth_ai/environments/examples/wordle/__init__.py +0 -29
  574. synth_ai/environments/examples/wordle/engine.py +0 -398
  575. synth_ai/environments/examples/wordle/environment.py +0 -159
  576. synth_ai/environments/examples/wordle/helpers/generate_instances_wordfreq.py +0 -75
  577. synth_ai/environments/examples/wordle/taskset.py +0 -230
  578. synth_ai/environments/reproducibility/core.py +0 -42
  579. synth_ai/environments/reproducibility/helpers.py +0 -0
  580. synth_ai/environments/reproducibility/tree.py +0 -364
  581. synth_ai/environments/service/app.py +0 -91
  582. synth_ai/environments/service/core_routes.py +0 -1020
  583. synth_ai/environments/service/external_registry.py +0 -56
  584. synth_ai/environments/service/registry.py +0 -9
  585. synth_ai/environments/stateful/__init__.py +0 -1
  586. synth_ai/environments/stateful/core.py +0 -163
  587. synth_ai/environments/stateful/engine.py +0 -21
  588. synth_ai/environments/stateful/state.py +0 -7
  589. synth_ai/environments/tasks/api.py +0 -19
  590. synth_ai/environments/tasks/core.py +0 -80
  591. synth_ai/environments/tasks/filters.py +0 -41
  592. synth_ai/environments/tasks/utils.py +0 -91
  593. synth_ai/environments/v0_observability/history.py +0 -3
  594. synth_ai/environments/v0_observability/log.py +0 -2
  595. synth_ai/evals/base.py +0 -15
  596. synth_ai/experimental/synth_oss.py +0 -446
  597. synth_ai/http.py +0 -102
  598. synth_ai/inference/client.py +0 -20
  599. synth_ai/install_sqld.sh +0 -40
  600. synth_ai/jobs/client.py +0 -246
  601. synth_ai/learning/__init__.py +0 -24
  602. synth_ai/learning/config.py +0 -43
  603. synth_ai/learning/filtering.py +0 -0
  604. synth_ai/learning/ft_client.py +0 -59
  605. synth_ai/learning/offline/dpo.py +0 -0
  606. synth_ai/learning/offline/providers.py +0 -7
  607. synth_ai/learning/offline/sft.py +0 -0
  608. synth_ai/learning/offline/shared.py +0 -0
  609. synth_ai/learning/online/grpo.py +0 -0
  610. synth_ai/learning/online/irft.py +0 -0
  611. synth_ai/learning/prompts/banking77_injection_eval.py +0 -168
  612. synth_ai/learning/prompts/gepa.py +0 -0
  613. synth_ai/learning/prompts/hello_world_in_context_injection_ex.py +0 -213
  614. synth_ai/learning/prompts/mipro.py +0 -289
  615. synth_ai/learning/prompts/random_search.py +0 -246
  616. synth_ai/learning/prompts/run_mipro_banking77.py +0 -172
  617. synth_ai/learning/prompts/run_random_search_banking77.py +0 -324
  618. synth_ai/learning/sse.py +0 -58
  619. synth_ai/learning/validators.py +0 -48
  620. synth_ai/lm/__init__.py +0 -51
  621. synth_ai/lm/caching/constants.py +0 -6
  622. synth_ai/lm/caching/dbs.py +0 -0
  623. synth_ai/lm/caching/ephemeral.py +0 -102
  624. synth_ai/lm/caching/handler.py +0 -137
  625. synth_ai/lm/caching/initialize.py +0 -11
  626. synth_ai/lm/caching/persistent.py +0 -114
  627. synth_ai/lm/config.py +0 -110
  628. synth_ai/lm/constants.py +0 -32
  629. synth_ai/lm/core/__init__.py +0 -8
  630. synth_ai/lm/core/all.py +0 -73
  631. synth_ai/lm/core/exceptions.py +0 -7
  632. synth_ai/lm/core/main.py +0 -319
  633. synth_ai/lm/core/main_v3.py +0 -594
  634. synth_ai/lm/core/synth_models.py +0 -48
  635. synth_ai/lm/core/vendor_clients.py +0 -188
  636. synth_ai/lm/cost/__init__.py +0 -0
  637. synth_ai/lm/cost/monitor.py +0 -1
  638. synth_ai/lm/cost/statefulness.py +0 -1
  639. synth_ai/lm/injection.py +0 -80
  640. synth_ai/lm/overrides.py +0 -206
  641. synth_ai/lm/provider_support/__init__.py +0 -8
  642. synth_ai/lm/provider_support/anthropic.py +0 -972
  643. synth_ai/lm/provider_support/openai.py +0 -1139
  644. synth_ai/lm/provider_support/suppress_logging.py +0 -31
  645. synth_ai/lm/structured_outputs/__init__.py +0 -0
  646. synth_ai/lm/structured_outputs/handler.py +0 -440
  647. synth_ai/lm/structured_outputs/inject.py +0 -297
  648. synth_ai/lm/structured_outputs/rehabilitate.py +0 -185
  649. synth_ai/lm/tools/__init__.py +0 -3
  650. synth_ai/lm/tools/base.py +0 -172
  651. synth_ai/lm/unified_interface.py +0 -202
  652. synth_ai/lm/vendors/__init__.py +0 -0
  653. synth_ai/lm/vendors/base.py +0 -81
  654. synth_ai/lm/vendors/core/__init__.py +0 -0
  655. synth_ai/lm/vendors/core/anthropic_api.py +0 -387
  656. synth_ai/lm/vendors/core/gemini_api.py +0 -292
  657. synth_ai/lm/vendors/core/mistral_api.py +0 -322
  658. synth_ai/lm/vendors/core/openai_api.py +0 -220
  659. synth_ai/lm/vendors/core/synth_dev_api.py +0 -0
  660. synth_ai/lm/vendors/local/__init__.py +0 -0
  661. synth_ai/lm/vendors/local/ollama.py +0 -0
  662. synth_ai/lm/vendors/openai_standard.py +0 -780
  663. synth_ai/lm/vendors/openai_standard_responses.py +0 -256
  664. synth_ai/lm/vendors/retries.py +0 -22
  665. synth_ai/lm/vendors/supported/__init__.py +0 -0
  666. synth_ai/lm/vendors/supported/custom_endpoint.py +0 -417
  667. synth_ai/lm/vendors/supported/deepseek.py +0 -69
  668. synth_ai/lm/vendors/supported/grok.py +0 -75
  669. synth_ai/lm/vendors/supported/groq.py +0 -16
  670. synth_ai/lm/vendors/supported/ollama.py +0 -15
  671. synth_ai/lm/vendors/supported/openrouter.py +0 -74
  672. synth_ai/lm/vendors/supported/together.py +0 -11
  673. synth_ai/lm/vendors/synth_client.py +0 -808
  674. synth_ai/lm/warmup.py +0 -186
  675. synth_ai/rl/secrets.py +0 -19
  676. synth_ai/scripts/verify_rewards.py +0 -100
  677. synth_ai/task/__init__.py +0 -10
  678. synth_ai/task/contracts.py +0 -120
  679. synth_ai/task/health.py +0 -28
  680. synth_ai/task/validators.py +0 -12
  681. synth_ai/tracing/__init__.py +0 -30
  682. synth_ai/tracing_v1/__init__.py +0 -33
  683. synth_ai/tracing_v3/config.py +0 -84
  684. synth_ai/tracing_v3/storage/config.py +0 -62
  685. synth_ai/tracing_v3/turso/__init__.py +0 -25
  686. synth_ai/tracing_v3/turso/daemon.py +0 -144
  687. synth_ai/tracing_v3/turso/manager.py +0 -760
  688. synth_ai/v0/tracing/__init__.py +0 -0
  689. synth_ai/v0/tracing/abstractions.py +0 -224
  690. synth_ai/v0/tracing/base_client.py +0 -91
  691. synth_ai/v0/tracing/client_manager.py +0 -131
  692. synth_ai/v0/tracing/config.py +0 -140
  693. synth_ai/v0/tracing/context.py +0 -146
  694. synth_ai/v0/tracing/decorators.py +0 -680
  695. synth_ai/v0/tracing/events/__init__.py +0 -0
  696. synth_ai/v0/tracing/events/manage.py +0 -147
  697. synth_ai/v0/tracing/events/scope.py +0 -86
  698. synth_ai/v0/tracing/events/store.py +0 -228
  699. synth_ai/v0/tracing/immediate_client.py +0 -151
  700. synth_ai/v0/tracing/local.py +0 -18
  701. synth_ai/v0/tracing/log_client_base.py +0 -73
  702. synth_ai/v0/tracing/retry_queue.py +0 -186
  703. synth_ai/v0/tracing/trackers.py +0 -515
  704. synth_ai/v0/tracing/upload.py +0 -510
  705. synth_ai/v0/tracing/utils.py +0 -9
  706. synth_ai/v0/tracing_v1/__init__.py +0 -16
  707. synth_ai/v0/tracing_v1/abstractions.py +0 -224
  708. synth_ai/v0/tracing_v1/base_client.py +0 -91
  709. synth_ai/v0/tracing_v1/client_manager.py +0 -131
  710. synth_ai/v0/tracing_v1/config.py +0 -140
  711. synth_ai/v0/tracing_v1/context.py +0 -146
  712. synth_ai/v0/tracing_v1/decorators.py +0 -701
  713. synth_ai/v0/tracing_v1/events/__init__.py +0 -0
  714. synth_ai/v0/tracing_v1/events/manage.py +0 -147
  715. synth_ai/v0/tracing_v1/events/scope.py +0 -86
  716. synth_ai/v0/tracing_v1/events/store.py +0 -228
  717. synth_ai/v0/tracing_v1/immediate_client.py +0 -151
  718. synth_ai/v0/tracing_v1/local.py +0 -18
  719. synth_ai/v0/tracing_v1/log_client_base.py +0 -73
  720. synth_ai/v0/tracing_v1/retry_queue.py +0 -186
  721. synth_ai/v0/tracing_v1/trackers.py +0 -515
  722. synth_ai/v0/tracing_v1/upload.py +0 -525
  723. synth_ai/v0/tracing_v1/utils.py +0 -9
  724. synth_ai/zyk/__init__.py +0 -30
  725. synth_ai-0.2.6.dev1.dist-info/METADATA +0 -106
  726. synth_ai-0.2.6.dev1.dist-info/RECORD +0 -416
  727. /synth_ai/{demos → cli/demo_apps}/demo_task_apps/math/__init__.py +0 -0
  728. /synth_ai/{lm/caching → core/apps}/__init__.py +0 -0
  729. /synth_ai/{tracing_v3 → core/tracing_v3}/lm_call_record_abstractions.py +0 -0
  730. /synth_ai/{tracing_v3 → core/tracing_v3}/storage/__init__.py +0 -0
  731. /synth_ai/{tracing_v3 → core/tracing_v3}/storage/exceptions.py +0 -0
  732. /synth_ai/{tracing_v3 → core/tracing_v3}/storage/types.py +0 -0
  733. /synth_ai/{compound/cais.py → py.typed} +0 -0
  734. /synth_ai/{learning → sdk/learning}/core.py +0 -0
  735. /synth_ai/{learning → sdk/learning}/gateway.py +0 -0
  736. {synth_ai-0.2.6.dev1.dist-info → synth_ai-0.4.3.dist-info}/WHEEL +0 -0
  737. {synth_ai-0.2.6.dev1.dist-info → synth_ai-0.4.3.dist-info}/licenses/LICENSE +0 -0
  738. {synth_ai-0.2.6.dev1.dist-info → synth_ai-0.4.3.dist-info}/top_level.txt +0 -0
@@ -1,724 +0,0 @@
1
- #!/usr/bin/env python3
2
- """
3
- Generate Fine-tuning Data for Gemini Models
4
- ===========================================
5
- This script generates high-quality trajectories from Crafter using Gemini models
6
- and converts them to JSONL format suitable for Vertex AI fine-tuning.
7
- """
8
-
9
- import asyncio
10
- import json
11
- import uuid
12
- import argparse
13
- import toml
14
- import logging
15
- from datetime import datetime
16
- from typing import Dict, Any, Optional, List, Set, Tuple
17
- from pathlib import Path
18
- import sys
19
- import os
20
- import numpy as np
21
- from collections import defaultdict
22
- import time
23
- from tqdm.asyncio import tqdm_asyncio
24
- from httpx import AsyncClient
25
-
26
- # Add the src directory to the path
27
- sys.path.insert(0, os.path.join(os.path.dirname(__file__), "..", "..", "..", "..", "src"))
28
-
29
- from synth_ai.lm.core.main import LM
30
- from synth_ai.lm.tools.base import BaseTool
31
- from pydantic import BaseModel, Field
32
-
33
- # Import TaskInstance and related classes
34
- from synth_ai.environments.tasks.core import (
35
- Impetus,
36
- Intent,
37
- Task,
38
- TaskInstance,
39
- )
40
- from synth_ai.environments.examples.crafter_classic.taskset import CrafterTaskInstance, CrafterTaskInstanceMetadata
41
-
42
- # Import trace evaluation utilities
43
- sys.path.append(str(Path(__file__).parent))
44
- from trace_eval import evaluate_trace, WEIGHTS
45
- from filter_traces_sft import load_trace, extract_trajectory_score, extract_llm_calls
46
-
47
-
48
- # --- Helper Functions ---
49
- def parse_observation_text(obs_text: str) -> Dict[str, Any]:
50
- """Parse structured observation from text format."""
51
- obs_data = {
52
- "health": 10,
53
- "hunger": 10,
54
- "thirst": 10,
55
- "inventory": {},
56
- "achievements_dict": {},
57
- "player_position": [0, 0],
58
- "semantic_map": [],
59
- "done": False
60
- }
61
-
62
- if not obs_text:
63
- return obs_data
64
-
65
- lines = obs_text.strip().split('\n')
66
- current_section = None
67
-
68
- for line in lines:
69
- line = line.strip()
70
- if not line:
71
- continue
72
-
73
- # Parse stats
74
- if "Health:" in line:
75
- try:
76
- health = line.split(":")[1].strip().split("/")[0]
77
- obs_data["health"] = int(health)
78
- except:
79
- pass
80
- elif "Hunger:" in line:
81
- try:
82
- hunger = line.split(":")[1].strip().split("/")[0]
83
- obs_data["hunger"] = int(hunger)
84
- except:
85
- pass
86
- elif "Thirst:" in line:
87
- try:
88
- thirst = line.split(":")[1].strip().split("/")[0]
89
- obs_data["thirst"] = int(thirst)
90
- except:
91
- pass
92
- elif "Position:" in line:
93
- try:
94
- pos_str = line.split(":")[1].strip()
95
- x, y = pos_str.strip("()").split(",")
96
- obs_data["player_position"] = [int(x), int(y)]
97
- except:
98
- pass
99
- elif "Inventory:" in line:
100
- current_section = "inventory"
101
- elif "Achievements:" in line:
102
- current_section = "achievements"
103
- elif current_section == "inventory" and " - " in line:
104
- try:
105
- item, count = line.split(" - ")
106
- item = item.strip().strip("-").strip()
107
- count = int(count.split(":")[1].strip())
108
- obs_data["inventory"][item] = count
109
- except:
110
- pass
111
- elif current_section == "achievements" and line:
112
- # Parse achievements list
113
- achievements = line.split(", ")
114
- for ach in achievements:
115
- ach = ach.strip()
116
- if ach:
117
- obs_data["achievements_dict"][ach] = True
118
-
119
- return obs_data
120
-
121
-
122
- # --- Configuration ---
123
- class GenerationConfig:
124
- """Configuration for fine-tuning data generation."""
125
-
126
- def __init__(self, config_path: Optional[str] = None):
127
- # Default values
128
- self.model_name = "gemini-2.5-flash" # Best Gemini model for reasoning
129
- self.num_rollouts = 100
130
- self.max_turns = 30
131
- self.difficulty = "easy"
132
- self.service_base_url = "http://localhost:8901"
133
- self.service_timeout = 30.0
134
- self.seed = 42
135
- self.traces_dir = Path("traces_gemini")
136
- self.ft_data_dir = Path("ft_data_gemini")
137
-
138
- # Quality filtering
139
- self.min_score_threshold = 2.0 # Minimum trajectory score
140
- self.min_achievements = 3 # Minimum achievements required
141
- self.enable_thinking = True # Enable thinking/reasoning
142
- self.thinking_budget = 15000 # Token budget for thinking
143
-
144
- # Load from TOML if provided
145
- if config_path and os.path.exists(config_path):
146
- self.load_from_toml(config_path)
147
-
148
- def load_from_toml(self, config_path: str):
149
- """Load configuration from TOML file."""
150
- config = toml.load(config_path)
151
-
152
- # Extract generation settings
153
- gen_config = config.get("generation", {})
154
- self.model_name = gen_config.get("model_name", self.model_name)
155
- self.num_rollouts = gen_config.get("num_rollouts", self.num_rollouts)
156
- self.max_turns = gen_config.get("max_turns", self.max_turns)
157
- self.difficulty = gen_config.get("difficulty", self.difficulty)
158
- self.seed = gen_config.get("seed", self.seed)
159
-
160
- # Extract service settings
161
- service_config = config.get("service", {})
162
- self.service_base_url = service_config.get("base_url", self.service_base_url)
163
- self.service_timeout = service_config.get("timeout", self.service_timeout)
164
-
165
- # Extract quality settings
166
- quality_config = config.get("quality", {})
167
- self.min_score_threshold = quality_config.get("min_score_threshold", self.min_score_threshold)
168
- self.min_achievements = quality_config.get("min_achievements", self.min_achievements)
169
- self.enable_thinking = quality_config.get("enable_thinking", self.enable_thinking)
170
- self.thinking_budget = quality_config.get("thinking_budget", self.thinking_budget)
171
-
172
-
173
- # --- Crafter Action Tool ---
174
- class CrafterAction(BaseTool):
175
- """Tool for performing actions in Crafter environment."""
176
-
177
- name: str = "crafter_action"
178
- description: str = "Perform an action in the Crafter environment"
179
- params: List[tuple] = [
180
- ("action", "str", "The action to perform (e.g., 'move_north', 'collect', 'craft_wood_pickaxe')")
181
- ]
182
-
183
- def __init__(self, instance_id: str, client: AsyncClient):
184
- super().__init__()
185
- self.instance_id = instance_id
186
- self.client = client
187
- self.base_url = "http://localhost:8901"
188
-
189
- # Action mapping from string to integer
190
- self.action_map = {
191
- "noop": 0,
192
- "move_north": 1,
193
- "move_south": 2,
194
- "move_east": 3,
195
- "move_west": 4,
196
- "attack": 5,
197
- "collect": 6,
198
- "craft_wood_pickaxe": 7,
199
- "craft_stone_pickaxe": 8,
200
- "craft_iron_pickaxe": 9,
201
- "craft_wood_sword": 10,
202
- "craft_stone_sword": 11,
203
- "craft_iron_sword": 12,
204
- "eat": 13,
205
- "drink": 14,
206
- "sleep": 15,
207
- "place_stone": 16,
208
- "place_table": 17,
209
- "place_furnace": 18,
210
- "place_plant": 19,
211
- }
212
-
213
- def _action_to_int(self, action: str) -> int:
214
- """Convert action string to integer."""
215
- return self.action_map.get(action.lower(), 0)
216
-
217
- async def _run(self, action: str) -> Dict[str, Any]:
218
- """Execute action in environment."""
219
- response = await self.client.post(
220
- f"{self.base_url}/env/CrafterClassic/step",
221
- json={"env_id": self.instance_id, "tool_calls": [{
222
- "tool_name": "interact",
223
- "tool_call_id": str(uuid.uuid4()),
224
- "tool_args": {"action": self._action_to_int(action)}
225
- }]}
226
- )
227
- response.raise_for_status()
228
- result = response.json()
229
-
230
- # Return the full result for the agent to process
231
- return result
232
-
233
-
234
- # --- Gemini Agent ---
235
- class GeminiCrafterAgent:
236
- """Agent that plays Crafter using Gemini models via synth-ai LM."""
237
-
238
- def __init__(self, model_name: str, instance_id: str, client: AsyncClient):
239
- self.model_name = model_name
240
- self.instance_id = instance_id
241
- self.client = client
242
-
243
- # Initialize LM with Gemini model
244
- self.lm = LM(
245
- model_name=model_name,
246
- formatting_model_name=model_name,
247
- temperature=0.7 # Use some temperature for diversity
248
- )
249
-
250
- # Create action tool
251
- self.action_tool = CrafterAction(instance_id, client)
252
-
253
- # Initialize conversation history
254
- self.messages = []
255
-
256
- # System prompt
257
- self.system_prompt = """You are an expert Crafter player. Your goal is to achieve as many objectives as possible in the game.
258
-
259
- Key objectives (achievements) in order of importance:
260
- 1. Basic survival: collect resources, eat when hungry, drink when thirsty
261
- 2. Tool progression: craft pickaxe → stone pickaxe → iron pickaxe
262
- 3. Advanced goals: make iron sword, defeat enemies
263
-
264
- Action format: Use the crafter_action tool with one of these actions:
265
- - Movement: move_north, move_south, move_east, move_west
266
- - Resource gathering: collect (gathers wood/stone/etc), attack (mines harder materials)
267
- - Crafting: craft_wood_pickaxe, craft_stone_pickaxe, craft_iron_pickaxe, craft_wood_sword, craft_stone_sword, craft_iron_sword
268
- - Survival: eat, drink, sleep
269
- - Placing: place_stone, place_table, place_furnace, place_plant
270
-
271
- Tips:
272
- - Start by collecting wood (stand near trees and use 'collect')
273
- - Craft a wood pickaxe early to mine stone
274
- - Monitor your health, hunger, and thirst
275
- - Explore to find water, coal, and iron
276
- - Use the semantic map to navigate efficiently"""
277
-
278
- # Add system message
279
- self.messages.append({"role": "system", "content": self.system_prompt})
280
-
281
- def _format_observation(self, obs_data: Dict[str, Any]) -> str:
282
- """Format observation data into readable text."""
283
- lines = ["=== Current State ==="]
284
-
285
- # Stats
286
- lines.append(f"Position: ({obs_data.get('player_position', [0, 0])[0]}, {obs_data.get('player_position', [0, 0])[1]})")
287
- lines.append(f"Health: {obs_data.get('health', 0)}/10")
288
- lines.append(f"Hunger: {obs_data.get('hunger', 0)}/10")
289
- lines.append(f"Thirst: {obs_data.get('thirst', 0)}/10")
290
-
291
- # Inventory
292
- inventory = obs_data.get('inventory', {})
293
- if inventory:
294
- lines.append("\nInventory:")
295
- for item, count in inventory.items():
296
- if count > 0:
297
- lines.append(f" - {item}: {count}")
298
-
299
- # Achievements
300
- achievements = obs_data.get('achievements_dict', {})
301
- unlocked = [k for k, v in achievements.items() if v]
302
- if unlocked:
303
- lines.append(f"\nAchievements: {', '.join(unlocked)}")
304
-
305
- # Local view (simplified)
306
- lines.append("\nNearby (5x5 grid around you):")
307
- semantic_map = obs_data.get('semantic_map', [])
308
- if semantic_map:
309
- # Get center region of semantic map
310
- # Assuming semantic map is flattened, reconstruct as 2D
311
- map_size = int(np.sqrt(len(semantic_map)))
312
- if map_size * map_size == len(semantic_map):
313
- map_2d = np.array(semantic_map).reshape(map_size, map_size)
314
- center = map_size // 2
315
- view_radius = 2
316
-
317
- # Simple ID to symbol mapping
318
- id_to_symbol = {
319
- 0: '.', # void/empty
320
- 1: 'G', # grass
321
- 2: 'T', # tree
322
- 3: 'S', # stone
323
- 4: 'W', # water
324
- 5: 'C', # coal
325
- 6: 'I', # iron
326
- 7: '@', # player
327
- 8: 'E', # enemy
328
- 9: 'F', # furnace
329
- 10: 'P', # plant
330
- }
331
-
332
- for dy in range(-view_radius, view_radius + 1):
333
- row = []
334
- for dx in range(-view_radius, view_radius + 1):
335
- y, x = center + dy, center + dx
336
- if 0 <= y < map_size and 0 <= x < map_size:
337
- cell_id = int(map_2d[y, x])
338
- symbol = id_to_symbol.get(cell_id, '?')
339
- if dy == 0 and dx == 0:
340
- symbol = '@' # Player position
341
- row.append(symbol)
342
- else:
343
- row.append(' ')
344
- lines.append(' ' + ' '.join(row))
345
-
346
- return '\n'.join(lines)
347
-
348
- async def step(self, obs_data: Dict[str, Any]) -> Tuple[str, Dict[str, Any]]:
349
- """Take a step in the environment."""
350
- # Format observation
351
- obs_text = self._format_observation(obs_data)
352
-
353
- # Add observation to conversation
354
- self.messages.append({"role": "user", "content": obs_text})
355
-
356
- # Get action from LM with tool
357
- response = await self.lm.ainvoke(
358
- self.messages,
359
- tools=[self.action_tool],
360
- tool_choice="required"
361
- )
362
-
363
- # Extract action from response
364
- action = None
365
- thinking = None
366
-
367
- # Handle response based on type
368
- if hasattr(response, 'tool_calls') and response.tool_calls:
369
- # Tool was called
370
- tool_call = response.tool_calls[0]
371
- action = tool_call.function.arguments.get('action', 'noop')
372
-
373
- # Add assistant message
374
- self.messages.append({
375
- "role": "assistant",
376
- "content": response.content or f"Taking action: {action}",
377
- "tool_calls": response.tool_calls
378
- })
379
- else:
380
- # No tool call, extract action from text
381
- content = response.content if hasattr(response, 'content') else str(response)
382
- self.messages.append({"role": "assistant", "content": content})
383
- action = "noop"
384
-
385
- # Extract thinking if available
386
- if hasattr(response, '_raw_response'):
387
- raw = response._raw_response
388
- if isinstance(raw, dict) and 'thinking' in raw:
389
- thinking = raw['thinking']
390
-
391
- # Execute action
392
- result = await self.action_tool._run(action)
393
-
394
- # Add tool response
395
- if hasattr(response, 'tool_calls') and response.tool_calls:
396
- self.messages.append({
397
- "role": "tool",
398
- "content": json.dumps(result),
399
- "tool_call_id": response.tool_calls[0].id
400
- })
401
-
402
- return action, {"thinking": thinking} if thinking else {}
403
-
404
-
405
- # --- Main Generation Functions ---
406
- async def generate_trajectory(config: GenerationConfig, instance_num: int) -> Optional[Dict[str, Any]]:
407
- """Generate a single trajectory using Gemini model."""
408
- async with AsyncClient(timeout=config.service_timeout) as client:
409
- try:
410
- # Create task instance
411
- task_instance = CrafterTaskInstance(
412
- id=uuid.uuid4(),
413
- impetus=Impetus(
414
- instructions="Survive and unlock achievements. Focus on collecting resources, crafting tools, and progressing through the game."
415
- ),
416
- intent=Intent(
417
- rubric={"goal": "Unlock as many achievements as possible."},
418
- gold_trajectories=None,
419
- gold_state_diff={},
420
- deterministic_eval_functions=[]
421
- ),
422
- metadata=CrafterTaskInstanceMetadata(
423
- difficulty=config.difficulty,
424
- seed=config.seed + instance_num,
425
- num_trees_radius=4,
426
- num_cows_radius=2,
427
- num_hostiles_radius=0 if config.difficulty == "easy" else 2,
428
- world_config="normal"
429
- ),
430
- is_reproducible=True,
431
- initial_engine_snapshot=None # will be filled lazily when env starts
432
- )
433
-
434
- # Initialize environment
435
- create_response = await client.post(
436
- f"{config.service_base_url}/env/CrafterClassic/initialize",
437
- json={"task_instance": await task_instance.serialize()}
438
- )
439
- create_response.raise_for_status()
440
- env_data = create_response.json()
441
- instance_id = env_data["env_id"]
442
-
443
- print(f"🎮 Instance {instance_num}: Created {instance_id}")
444
-
445
- # Get initial observation
446
- obs_data = env_data.get("observations", [{}])[0]
447
-
448
- # Parse the observation to get structured data
449
- if "human_observation" in obs_data:
450
- obs_text = obs_data["human_observation"]
451
- # Parse structured data from observation text
452
- obs_data = parse_observation_text(obs_text)
453
- obs_data["raw_text"] = obs_text
454
-
455
- # Create agent
456
- agent = GeminiCrafterAgent(
457
- model_name=config.model_name,
458
- instance_id=instance_id,
459
- client=client
460
- )
461
-
462
- # Track trajectory data
463
- trajectory = {
464
- "instance_id": instance_id,
465
- "instance_num": instance_num,
466
- "model": config.model_name,
467
- "start_time": datetime.now().isoformat(),
468
- "actions": [],
469
- "observations": [],
470
- "llm_calls": [],
471
- "achievements": {},
472
- "final_score": 0.0
473
- }
474
-
475
- # Run episode
476
- for turn in range(config.max_turns):
477
- # Get action from agent
478
- action, metadata = await agent.step(obs_data)
479
-
480
- # Store LLM call data
481
- llm_call = {
482
- "turn": turn,
483
- "messages": agent.messages[-3:], # Last 3 messages (user, assistant, tool)
484
- "action": action,
485
- "metadata": metadata
486
- }
487
- trajectory["llm_calls"].append(llm_call)
488
-
489
- # Store action and observation
490
- trajectory["actions"].append(action)
491
- trajectory["observations"].append(obs_data)
492
-
493
- # Check if done
494
- if obs_data.get("done", False):
495
- print(f"✅ Instance {instance_num}: Episode done at turn {turn}")
496
- break
497
-
498
- # Step in environment and get next observation
499
- step_response = await client.post(
500
- f"{config.service_base_url}/env/CrafterClassic/step",
501
- json={"env_id": instance_id, "tool_calls": [{
502
- "tool_name": "interact",
503
- "tool_call_id": str(uuid.uuid4()),
504
- "tool_args": {"action": agent.action_tool._action_to_int(action)}
505
- }]}
506
- )
507
- step_response.raise_for_status()
508
- step_data = step_response.json()
509
-
510
- # Extract observation
511
- if "observations" in step_data and step_data["observations"]:
512
- obs = step_data["observations"][0]
513
- if "human_observation" in obs:
514
- obs_data = parse_observation_text(obs["human_observation"])
515
- obs_data["done"] = step_data.get("done", False)
516
- else:
517
- obs_data = {"done": step_data.get("done", False)}
518
- else:
519
- obs_data = {"done": True}
520
-
521
- # Get final achievements
522
- trajectory["achievements"] = obs_data.get("achievements_dict", {})
523
- trajectory["end_time"] = datetime.now().isoformat()
524
-
525
- # Also get achievements from last observation if available
526
- if trajectory["observations"] and "achievements_dict" in trajectory["observations"][-1]:
527
- trajectory["achievements"].update(trajectory["observations"][-1]["achievements_dict"])
528
-
529
- # Calculate score
530
- unlocked_achievements = sum(1 for v in trajectory["achievements"].values() if v)
531
- trajectory["final_score"] = float(unlocked_achievements)
532
-
533
- print(f"📊 Instance {instance_num}: Score={trajectory['final_score']:.1f}, Achievements={unlocked_achievements}")
534
-
535
- # Terminate instance
536
- await client.post(
537
- f"{config.service_base_url}/env/CrafterClassic/terminate",
538
- json={"env_id": instance_id}
539
- )
540
-
541
- return trajectory
542
-
543
- except Exception as e:
544
- print(f"❌ Instance {instance_num}: Error - {e}")
545
- return None
546
-
547
-
548
- async def generate_all_trajectories(config: GenerationConfig) -> List[Dict[str, Any]]:
549
- """Generate multiple trajectories concurrently."""
550
- print(f"\n🚀 Generating {config.num_rollouts} trajectories with {config.model_name}")
551
-
552
- # Create tasks
553
- tasks = [generate_trajectory(config, i) for i in range(config.num_rollouts)]
554
-
555
- # Run with progress bar
556
- trajectories = []
557
- with tqdm_asyncio(total=config.num_rollouts, desc="Generating") as pbar:
558
- for coro in asyncio.as_completed(tasks):
559
- trajectory = await coro
560
- if trajectory:
561
- trajectories.append(trajectory)
562
- pbar.update(1)
563
-
564
- return trajectories
565
-
566
-
567
- def filter_high_quality_trajectories(trajectories: List[Dict[str, Any]],
568
- min_score: float = 2.0,
569
- min_achievements: int = 3) -> List[Dict[str, Any]]:
570
- """Filter trajectories based on quality criteria."""
571
- filtered = []
572
-
573
- for traj in trajectories:
574
- # Count achievements
575
- achievements = traj.get("achievements", {})
576
- num_achievements = sum(1 for v in achievements.values() if v)
577
-
578
- # Calculate score (could be more sophisticated)
579
- score = traj.get("final_score", 0.0)
580
-
581
- # Apply filters
582
- if score >= min_score and num_achievements >= min_achievements:
583
- filtered.append(traj)
584
-
585
- print(f"\n📊 Filtering Results:")
586
- print(f" Total trajectories: {len(trajectories)}")
587
- if trajectories:
588
- print(f" High quality: {len(filtered)} ({len(filtered)/len(trajectories)*100:.1f}%)")
589
- else:
590
- print(f" High quality: 0 (no trajectories generated)")
591
-
592
- return filtered
593
-
594
-
595
- def convert_to_vertex_ai_format(trajectories: List[Dict[str, Any]], output_path: Path):
596
- """Convert trajectories to Vertex AI fine-tuning format."""
597
- output_path.parent.mkdir(parents=True, exist_ok=True)
598
-
599
- examples = []
600
-
601
- for traj in trajectories:
602
- # Extract LLM calls
603
- for llm_call in traj.get("llm_calls", []):
604
- messages = llm_call.get("messages", [])
605
-
606
- # Skip if not enough messages
607
- if len(messages) < 2:
608
- continue
609
-
610
- # Convert to Vertex AI format
611
- # Need user message and assistant response
612
- user_msg = None
613
- assistant_msg = None
614
-
615
- for msg in messages:
616
- if msg["role"] == "user":
617
- user_msg = msg["content"]
618
- elif msg["role"] == "assistant":
619
- assistant_msg = msg["content"]
620
-
621
- if user_msg and assistant_msg:
622
- example = {
623
- "messages": [
624
- {"role": "user", "content": user_msg},
625
- {"role": "assistant", "content": assistant_msg}
626
- ]
627
- }
628
- examples.append(example)
629
-
630
- # Write JSONL
631
- with open(output_path, 'w') as f:
632
- for example in examples:
633
- f.write(json.dumps(example) + '\n')
634
-
635
- print(f"\n✅ Wrote {len(examples)} examples to {output_path}")
636
- return len(examples)
637
-
638
-
639
- def save_trajectories(trajectories: List[Dict[str, Any]], traces_dir: Path):
640
- """Save trajectories to disk."""
641
- traces_dir.mkdir(parents=True, exist_ok=True)
642
-
643
- for i, traj in enumerate(trajectories):
644
- filename = f"trajectory_{i:04d}.json"
645
- with open(traces_dir / filename, 'w') as f:
646
- json.dump(traj, f, indent=2)
647
-
648
- print(f"💾 Saved {len(trajectories)} trajectories to {traces_dir}")
649
-
650
-
651
- # --- Main ---
652
- async def main():
653
- parser = argparse.ArgumentParser(description="Generate Gemini fine-tuning data for Crafter")
654
- parser.add_argument("--config", type=str, help="Path to TOML config file")
655
- parser.add_argument("--num-rollouts", type=int, help="Number of rollouts to generate")
656
- parser.add_argument("--model", type=str, help="Gemini model name")
657
- parser.add_argument("--filter-only", action="store_true", help="Only filter existing traces")
658
- parser.add_argument("--min-achievements", type=int, help="Minimum achievements for filtering")
659
-
660
- args = parser.parse_args()
661
-
662
- # Load config
663
- config = GenerationConfig(args.config)
664
-
665
- # Override with command line args
666
- if args.num_rollouts:
667
- config.num_rollouts = args.num_rollouts
668
- if args.model:
669
- config.model_name = args.model
670
- if args.min_achievements:
671
- config.min_achievements = args.min_achievements
672
-
673
- if args.filter_only:
674
- # Filter existing trajectories
675
- print("🔍 Filtering existing trajectories...")
676
-
677
- # Load trajectories
678
- trajectories = []
679
- for trace_file in sorted(config.traces_dir.glob("*.json")):
680
- with open(trace_file) as f:
681
- trajectories.append(json.load(f))
682
-
683
- # Filter
684
- filtered = filter_high_quality_trajectories(
685
- trajectories,
686
- min_score=config.min_score_threshold,
687
- min_achievements=config.min_achievements
688
- )
689
-
690
- # Convert to JSONL
691
- output_path = config.ft_data_dir / "crafter_gemini_ft.jsonl"
692
- num_examples = convert_to_vertex_ai_format(filtered, output_path)
693
-
694
- print(f"\n🎯 Summary:")
695
- print(f" Filtered trajectories: {len(filtered)}")
696
- print(f" Total training examples: {num_examples}")
697
-
698
- else:
699
- # Generate new trajectories
700
- trajectories = await generate_all_trajectories(config)
701
-
702
- # Save all trajectories
703
- save_trajectories(trajectories, config.traces_dir)
704
-
705
- # Filter high quality
706
- filtered = filter_high_quality_trajectories(
707
- trajectories,
708
- min_score=config.min_score_threshold,
709
- min_achievements=config.min_achievements
710
- )
711
-
712
- # Convert to JSONL
713
- output_path = config.ft_data_dir / "crafter_gemini_ft.jsonl"
714
- num_examples = convert_to_vertex_ai_format(filtered, output_path)
715
-
716
- print(f"\n🎯 Summary:")
717
- print(f" Generated trajectories: {len(trajectories)}")
718
- print(f" High quality trajectories: {len(filtered)}")
719
- print(f" Total training examples: {num_examples}")
720
- print(f" Output: {output_path}")
721
-
722
-
723
- if __name__ == "__main__":
724
- asyncio.run(main())