synth-ai 0.2.6.dev1__py3-none-any.whl → 0.4.3__py3-none-any.whl

This diff compares the contents of publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between package versions as they appear in their respective public registries.
Files changed (738)
  1. synth_ai/__init__.py +44 -24
  2. synth_ai/__main__.py +30 -3
  3. synth_ai/cli/__init__.py +103 -48
  4. synth_ai/cli/__main__.py +42 -0
  5. synth_ai/cli/_internal/__init__.py +5 -0
  6. synth_ai/cli/_internal/modal_wrapper.py +31 -0
  7. synth_ai/cli/_internal/storage.py +20 -0
  8. synth_ai/cli/_internal/typer_patch.py +47 -0
  9. synth_ai/cli/_internal/validate_task_app.py +29 -0
  10. synth_ai/cli/agents/__init__.py +17 -0
  11. synth_ai/cli/agents/claude.py +77 -0
  12. synth_ai/cli/agents/codex.py +265 -0
  13. synth_ai/cli/agents/opencode.py +253 -0
  14. synth_ai/cli/commands/__init__.py +18 -0
  15. synth_ai/cli/commands/artifacts/__init__.py +13 -0
  16. synth_ai/cli/commands/artifacts/client.py +119 -0
  17. synth_ai/cli/commands/artifacts/config.py +57 -0
  18. synth_ai/cli/commands/artifacts/core.py +24 -0
  19. synth_ai/cli/commands/artifacts/download.py +188 -0
  20. synth_ai/cli/commands/artifacts/export.py +186 -0
  21. synth_ai/cli/commands/artifacts/list.py +156 -0
  22. synth_ai/cli/commands/artifacts/parsing.py +250 -0
  23. synth_ai/cli/commands/artifacts/show.py +336 -0
  24. synth_ai/cli/commands/demo/__init__.py +3 -0
  25. synth_ai/cli/commands/demo/core.py +153 -0
  26. synth_ai/cli/commands/eval/__init__.py +10 -0
  27. synth_ai/cli/commands/eval/config.py +338 -0
  28. synth_ai/cli/commands/eval/core.py +256 -0
  29. synth_ai/cli/commands/eval/runner.py +704 -0
  30. synth_ai/cli/commands/eval/validation.py +60 -0
  31. synth_ai/cli/commands/filter/__init__.py +12 -0
  32. synth_ai/cli/commands/filter/core.py +424 -0
  33. synth_ai/cli/commands/filter/errors.py +55 -0
  34. synth_ai/cli/commands/filter/validation.py +77 -0
  35. synth_ai/cli/commands/help/__init__.py +185 -0
  36. synth_ai/cli/commands/help/core.py +72 -0
  37. synth_ai/cli/commands/scan/__init__.py +19 -0
  38. synth_ai/cli/commands/scan/cloudflare_scanner.py +403 -0
  39. synth_ai/cli/commands/scan/core.py +344 -0
  40. synth_ai/cli/commands/scan/health_checker.py +242 -0
  41. synth_ai/cli/commands/scan/local_scanner.py +278 -0
  42. synth_ai/cli/commands/scan/models.py +83 -0
  43. synth_ai/cli/commands/smoke/__init__.py +7 -0
  44. synth_ai/cli/commands/smoke/core.py +1428 -0
  45. synth_ai/cli/commands/status/__init__.py +3 -0
  46. synth_ai/cli/commands/status/client.py +91 -0
  47. synth_ai/cli/commands/status/config.py +12 -0
  48. synth_ai/cli/commands/status/errors.py +11 -0
  49. synth_ai/cli/commands/status/subcommands/__init__.py +3 -0
  50. synth_ai/cli/commands/status/subcommands/config.py +13 -0
  51. synth_ai/cli/commands/status/subcommands/files.py +34 -0
  52. synth_ai/cli/commands/status/subcommands/jobs.py +51 -0
  53. synth_ai/cli/commands/status/subcommands/models.py +35 -0
  54. synth_ai/cli/commands/status/subcommands/runs.py +34 -0
  55. synth_ai/cli/commands/status/subcommands/session.py +77 -0
  56. synth_ai/cli/commands/status/subcommands/summary.py +39 -0
  57. synth_ai/cli/commands/status/subcommands/utils.py +41 -0
  58. synth_ai/cli/commands/status/utils.py +23 -0
  59. synth_ai/cli/commands/train/__init__.py +53 -0
  60. synth_ai/cli/commands/train/core.py +22 -0
  61. synth_ai/cli/commands/train/errors.py +117 -0
  62. synth_ai/cli/commands/train/judge_schemas.py +201 -0
  63. synth_ai/cli/commands/train/judge_validation.py +305 -0
  64. synth_ai/cli/commands/train/prompt_learning_validation.py +633 -0
  65. synth_ai/cli/commands/train/validation.py +392 -0
  66. synth_ai/cli/demo_apps/__init__.py +10 -0
  67. synth_ai/cli/demo_apps/core/__init__.py +28 -0
  68. synth_ai/cli/demo_apps/core/cli.py +1735 -0
  69. synth_ai/cli/demo_apps/crafter/__init__.py +1 -0
  70. synth_ai/cli/demo_apps/crafter/crafter_fft_4b.toml +55 -0
  71. synth_ai/cli/demo_apps/crafter/grpo_crafter_task_app.py +186 -0
  72. synth_ai/cli/demo_apps/crafter/rl_from_base_qwen4b.toml +74 -0
  73. synth_ai/cli/demo_apps/demo_registry.py +176 -0
  74. synth_ai/cli/demo_apps/demo_task_apps/__init__.py +7 -0
  75. synth_ai/{demos → cli/demo_apps}/demo_task_apps/core.py +117 -51
  76. synth_ai/cli/demo_apps/demo_task_apps/crafter/__init__.py +1 -0
  77. synth_ai/cli/demo_apps/demo_task_apps/crafter/configs/crafter_fft_4b.toml +53 -0
  78. synth_ai/cli/demo_apps/demo_task_apps/crafter/configs/rl_from_base_qwen4b.toml +73 -0
  79. synth_ai/cli/demo_apps/demo_task_apps/crafter/grpo_crafter_task_app.py +185 -0
  80. synth_ai/cli/demo_apps/demo_task_apps/math/_common.py +16 -0
  81. synth_ai/{demos → cli/demo_apps}/demo_task_apps/math/app.py +2 -1
  82. synth_ai/cli/demo_apps/demo_task_apps/math/config.toml +73 -0
  83. synth_ai/{demos → cli/demo_apps}/demo_task_apps/math/deploy_modal.py +3 -6
  84. synth_ai/cli/demo_apps/demo_task_apps/math/modal_task_app.py +738 -0
  85. synth_ai/cli/demo_apps/demo_task_apps/math/task_app_entry.py +39 -0
  86. synth_ai/cli/demo_apps/math/__init__.py +1 -0
  87. synth_ai/cli/demo_apps/math/_common.py +16 -0
  88. synth_ai/cli/demo_apps/math/app.py +38 -0
  89. synth_ai/cli/demo_apps/math/config.toml +75 -0
  90. synth_ai/cli/demo_apps/math/deploy_modal.py +54 -0
  91. synth_ai/cli/demo_apps/math/modal_task_app.py +698 -0
  92. synth_ai/cli/demo_apps/math/task_app_entry.py +53 -0
  93. synth_ai/cli/demo_apps/mipro/main.py +271 -0
  94. synth_ai/cli/demo_apps/mipro/task_app.py +922 -0
  95. synth_ai/cli/demo_apps/mipro/train_cfg.toml +92 -0
  96. synth_ai/cli/demos/__init__.py +12 -0
  97. synth_ai/cli/demos/demo.py +32 -0
  98. synth_ai/cli/demos/rl_demo.py +254 -0
  99. synth_ai/cli/deploy.py +216 -0
  100. synth_ai/cli/infra/__init__.py +14 -0
  101. synth_ai/cli/{balance.py → infra/balance.py} +21 -3
  102. synth_ai/cli/infra/mcp.py +35 -0
  103. synth_ai/cli/infra/modal_app.py +36 -0
  104. synth_ai/cli/infra/setup.py +69 -0
  105. synth_ai/cli/infra/status.py +16 -0
  106. synth_ai/cli/infra/turso.py +77 -0
  107. synth_ai/cli/lib/__init__.py +10 -0
  108. synth_ai/cli/lib/agents.py +76 -0
  109. synth_ai/cli/lib/apps/modal_app.py +101 -0
  110. synth_ai/cli/lib/apps/task_app.py +642 -0
  111. synth_ai/cli/lib/bin.py +39 -0
  112. synth_ai/cli/lib/env.py +375 -0
  113. synth_ai/cli/lib/errors.py +85 -0
  114. synth_ai/cli/lib/modal.py +315 -0
  115. synth_ai/cli/lib/plotting.py +126 -0
  116. synth_ai/cli/lib/prompt_args.py +39 -0
  117. synth_ai/cli/lib/prompts.py +284 -0
  118. synth_ai/cli/lib/sqld.py +122 -0
  119. synth_ai/cli/lib/task_app_discovery.py +884 -0
  120. synth_ai/cli/lib/task_app_env.py +295 -0
  121. synth_ai/cli/lib/train_cfgs.py +300 -0
  122. synth_ai/cli/lib/tunnel_records.py +207 -0
  123. synth_ai/cli/local/__init__.py +14 -0
  124. synth_ai/cli/local/experiment_queue/__init__.py +72 -0
  125. synth_ai/cli/local/experiment_queue/api_schemas.py +221 -0
  126. synth_ai/cli/local/experiment_queue/celery_app.py +208 -0
  127. synth_ai/cli/local/experiment_queue/config.py +128 -0
  128. synth_ai/cli/local/experiment_queue/config_utils.py +272 -0
  129. synth_ai/cli/local/experiment_queue/database.py +175 -0
  130. synth_ai/cli/local/experiment_queue/dispatcher.py +119 -0
  131. synth_ai/cli/local/experiment_queue/models.py +231 -0
  132. synth_ai/cli/local/experiment_queue/progress_info.py +160 -0
  133. synth_ai/cli/local/experiment_queue/results.py +373 -0
  134. synth_ai/cli/local/experiment_queue/schemas.py +131 -0
  135. synth_ai/cli/local/experiment_queue/service.py +344 -0
  136. synth_ai/cli/local/experiment_queue/status.py +372 -0
  137. synth_ai/cli/local/experiment_queue/status_tracker.py +360 -0
  138. synth_ai/cli/local/experiment_queue/tasks.py +1984 -0
  139. synth_ai/cli/local/experiment_queue/trace_storage.py +65 -0
  140. synth_ai/cli/local/experiment_queue/validation.py +157 -0
  141. synth_ai/cli/local/session/__init__.py +92 -0
  142. synth_ai/cli/local/session/client.py +383 -0
  143. synth_ai/cli/local/session/constants.py +63 -0
  144. synth_ai/cli/local/session/exceptions.py +105 -0
  145. synth_ai/cli/local/session/manager.py +139 -0
  146. synth_ai/cli/local/session/models.py +89 -0
  147. synth_ai/cli/local/session/query.py +110 -0
  148. synth_ai/cli/root.py +150 -102
  149. synth_ai/cli/task_apps/__init__.py +37 -0
  150. synth_ai/cli/task_apps/commands.py +3145 -0
  151. synth_ai/cli/task_apps/deploy.py +7 -0
  152. synth_ai/cli/task_apps/list.py +26 -0
  153. synth_ai/cli/task_apps/main.py +36 -0
  154. synth_ai/cli/task_apps/modal_serve.py +11 -0
  155. synth_ai/cli/task_apps/serve.py +11 -0
  156. synth_ai/cli/training/__init__.py +8 -0
  157. synth_ai/cli/training/train.py +5 -0
  158. synth_ai/cli/training/train_cfg.py +34 -0
  159. synth_ai/cli/{watch.py → training/watch.py} +13 -18
  160. synth_ai/cli/turso.py +52 -0
  161. synth_ai/cli/utils/__init__.py +8 -0
  162. synth_ai/cli/utils/experiments.py +235 -0
  163. synth_ai/cli/utils/queue.py +504 -0
  164. synth_ai/cli/{recent.py → utils/recent.py} +13 -7
  165. synth_ai/cli/{traces.py → utils/traces.py} +9 -5
  166. synth_ai/contracts/__init__.py +67 -0
  167. synth_ai/core/__init__.py +100 -0
  168. synth_ai/core/_utils/__init__.py +54 -0
  169. synth_ai/core/_utils/base_url.py +10 -0
  170. synth_ai/core/_utils/http.py +10 -0
  171. synth_ai/core/_utils/prompts.py +14 -0
  172. synth_ai/core/_utils/task_app_state.py +12 -0
  173. synth_ai/core/_utils/user_config.py +10 -0
  174. synth_ai/core/apps/common.py +116 -0
  175. synth_ai/core/auth.py +95 -0
  176. synth_ai/core/cfgs.py +240 -0
  177. synth_ai/core/config/__init__.py +16 -0
  178. synth_ai/core/config/base.py +168 -0
  179. synth_ai/core/config/resolver.py +89 -0
  180. synth_ai/core/env.py +231 -0
  181. synth_ai/core/errors.py +126 -0
  182. synth_ai/core/http.py +230 -0
  183. synth_ai/core/integrations/__init__.py +11 -0
  184. synth_ai/core/integrations/cloudflare.py +1710 -0
  185. synth_ai/core/integrations/mcp/__init__.py +6 -0
  186. synth_ai/core/integrations/mcp/__main__.py +8 -0
  187. synth_ai/core/integrations/mcp/claude.py +36 -0
  188. synth_ai/core/integrations/mcp/main.py +254 -0
  189. synth_ai/core/integrations/mcp/setup.py +100 -0
  190. synth_ai/core/integrations/modal.py +277 -0
  191. synth_ai/core/json.py +72 -0
  192. synth_ai/core/log_filter.py +99 -0
  193. synth_ai/core/logging.py +82 -0
  194. synth_ai/core/paths.py +107 -0
  195. synth_ai/core/pricing.py +109 -0
  196. synth_ai/core/process.py +233 -0
  197. synth_ai/core/ssl.py +25 -0
  198. synth_ai/core/storage/__init__.py +71 -0
  199. synth_ai/core/task_app_state.py +318 -0
  200. synth_ai/core/telemetry.py +282 -0
  201. synth_ai/{tracing_v3 → core/tracing_v3}/__init__.py +5 -1
  202. synth_ai/{tracing_v3 → core/tracing_v3}/abstractions.py +21 -4
  203. synth_ai/core/tracing_v3/config.py +229 -0
  204. synth_ai/core/tracing_v3/constants.py +21 -0
  205. synth_ai/{tracing_v3 → core/tracing_v3}/db_config.py +42 -29
  206. synth_ai/{tracing_v3 → core/tracing_v3}/decorators.py +80 -45
  207. synth_ai/{tracing_v3 → core/tracing_v3}/examples/basic_usage.py +15 -9
  208. synth_ai/{tracing_v3 → core/tracing_v3}/hooks.py +6 -4
  209. synth_ai/{tracing_v3 → core/tracing_v3}/llm_call_record_helpers.py +161 -61
  210. synth_ai/{tracing_v3 → core/tracing_v3}/migration_helper.py +1 -2
  211. synth_ai/{tracing_v3 → core/tracing_v3}/replica_sync.py +12 -7
  212. synth_ai/core/tracing_v3/serialization.py +130 -0
  213. synth_ai/{tracing_v3 → core/tracing_v3}/session_tracer.py +88 -21
  214. synth_ai/{tracing_v3 → core/tracing_v3}/storage/base.py +99 -12
  215. synth_ai/core/tracing_v3/storage/config.py +109 -0
  216. synth_ai/{tracing_v3 → core/tracing_v3}/storage/factory.py +11 -9
  217. synth_ai/{tracing_v3 → core/tracing_v3}/storage/utils.py +15 -11
  218. synth_ai/core/tracing_v3/trace_utils.py +326 -0
  219. synth_ai/core/tracing_v3/turso/__init__.py +12 -0
  220. synth_ai/core/tracing_v3/turso/daemon.py +278 -0
  221. synth_ai/{tracing_v3 → core/tracing_v3}/turso/models.py +7 -3
  222. synth_ai/core/tracing_v3/turso/native_manager.py +1385 -0
  223. synth_ai/{tracing_v3 → core/tracing_v3}/utils.py +5 -4
  224. synth_ai/core/urls.py +18 -0
  225. synth_ai/core/user_config.py +137 -0
  226. synth_ai/core/uvicorn.py +222 -0
  227. synth_ai/data/__init__.py +83 -0
  228. synth_ai/data/enums.py +123 -0
  229. synth_ai/data/rewards.py +152 -0
  230. synth_ai/data/traces.py +35 -0
  231. synth_ai/products/__init__.py +6 -0
  232. synth_ai/products/graph_evolve/__init__.py +46 -0
  233. synth_ai/products/graph_evolve/client.py +226 -0
  234. synth_ai/products/graph_evolve/config.py +591 -0
  235. synth_ai/products/graph_evolve/converters/__init__.py +42 -0
  236. synth_ai/products/graph_evolve/converters/openai_sft.py +484 -0
  237. synth_ai/products/graph_evolve/examples/hotpotqa/config.toml +109 -0
  238. synth_ai/products/graph_evolve/run.py +222 -0
  239. synth_ai/products/graph_gepa/__init__.py +23 -0
  240. synth_ai/products/graph_gepa/converters/__init__.py +19 -0
  241. synth_ai/products/graph_gepa/converters/openai_sft.py +29 -0
  242. synth_ai/sdk/__init__.py +123 -0
  243. synth_ai/sdk/api/__init__.py +1 -0
  244. synth_ai/sdk/api/models/supported.py +514 -0
  245. synth_ai/sdk/api/research_agent/__init__.py +296 -0
  246. synth_ai/sdk/api/train/__init__.py +85 -0
  247. synth_ai/sdk/api/train/builders.py +895 -0
  248. synth_ai/sdk/api/train/cli.py +2199 -0
  249. synth_ai/sdk/api/train/config_finder.py +267 -0
  250. synth_ai/sdk/api/train/configs/__init__.py +65 -0
  251. synth_ai/sdk/api/train/configs/prompt_learning.py +1706 -0
  252. synth_ai/sdk/api/train/configs/rl.py +187 -0
  253. synth_ai/sdk/api/train/configs/sft.py +99 -0
  254. synth_ai/sdk/api/train/configs/shared.py +81 -0
  255. synth_ai/sdk/api/train/context_learning.py +312 -0
  256. synth_ai/sdk/api/train/env_resolver.py +418 -0
  257. synth_ai/sdk/api/train/graph_validators.py +216 -0
  258. synth_ai/sdk/api/train/graphgen.py +984 -0
  259. synth_ai/sdk/api/train/graphgen_models.py +823 -0
  260. synth_ai/sdk/api/train/graphgen_validators.py +109 -0
  261. synth_ai/sdk/api/train/local_api.py +10 -0
  262. synth_ai/sdk/api/train/pollers.py +124 -0
  263. synth_ai/sdk/api/train/progress/__init__.py +97 -0
  264. synth_ai/sdk/api/train/progress/dataclasses.py +569 -0
  265. synth_ai/sdk/api/train/progress/events.py +326 -0
  266. synth_ai/sdk/api/train/progress/results.py +428 -0
  267. synth_ai/sdk/api/train/progress/tracker.py +641 -0
  268. synth_ai/sdk/api/train/prompt_learning.py +469 -0
  269. synth_ai/sdk/api/train/rl.py +441 -0
  270. synth_ai/sdk/api/train/sft.py +396 -0
  271. synth_ai/sdk/api/train/summary.py +522 -0
  272. synth_ai/sdk/api/train/supported_algos.py +147 -0
  273. synth_ai/sdk/api/train/task_app.py +351 -0
  274. synth_ai/sdk/api/train/utils.py +279 -0
  275. synth_ai/sdk/api/train/validators.py +2424 -0
  276. synth_ai/sdk/graphs/__init__.py +15 -0
  277. synth_ai/sdk/graphs/completions.py +570 -0
  278. synth_ai/{inference → sdk/inference}/__init__.py +0 -1
  279. synth_ai/sdk/inference/client.py +128 -0
  280. synth_ai/sdk/jobs/__init__.py +16 -0
  281. synth_ai/sdk/jobs/client.py +371 -0
  282. synth_ai/sdk/judging/__init__.py +14 -0
  283. synth_ai/sdk/judging/base.py +24 -0
  284. synth_ai/sdk/judging/client.py +40 -0
  285. synth_ai/sdk/judging/schemas.py +222 -0
  286. synth_ai/sdk/judging/types.py +42 -0
  287. synth_ai/sdk/learning/__init__.py +99 -0
  288. synth_ai/sdk/learning/algorithms.py +14 -0
  289. synth_ai/{learning → sdk/learning}/client.py +121 -30
  290. synth_ai/sdk/learning/config.py +5 -0
  291. synth_ai/{learning → sdk/learning}/constants.py +0 -2
  292. synth_ai/sdk/learning/context_learning_client.py +531 -0
  293. synth_ai/sdk/learning/context_learning_types.py +292 -0
  294. synth_ai/sdk/learning/ft_client.py +7 -0
  295. synth_ai/{learning → sdk/learning}/health.py +15 -9
  296. synth_ai/{learning → sdk/learning}/jobs.py +44 -47
  297. synth_ai/sdk/learning/prompt_extraction.py +334 -0
  298. synth_ai/sdk/learning/prompt_learning_client.py +455 -0
  299. synth_ai/sdk/learning/prompt_learning_types.py +186 -0
  300. synth_ai/{rl → sdk/learning/rl}/__init__.py +13 -8
  301. synth_ai/{learning/rl_client.py → sdk/learning/rl/client.py} +89 -77
  302. synth_ai/sdk/learning/rl/config.py +31 -0
  303. synth_ai/{rl → sdk/learning/rl}/contracts.py +5 -14
  304. synth_ai/{rl → sdk/learning/rl}/env_keys.py +45 -16
  305. synth_ai/sdk/learning/rl/secrets.py +13 -0
  306. synth_ai/sdk/learning/rl_client.py +5 -0
  307. synth_ai/sdk/learning/sft/__init__.py +29 -0
  308. synth_ai/sdk/learning/sft/client.py +95 -0
  309. synth_ai/sdk/learning/sft/config.py +270 -0
  310. synth_ai/sdk/learning/sft/data.py +698 -0
  311. synth_ai/sdk/learning/sse.py +57 -0
  312. synth_ai/sdk/learning/validators.py +52 -0
  313. synth_ai/sdk/localapi/__init__.py +40 -0
  314. synth_ai/sdk/localapi/apps/__init__.py +28 -0
  315. synth_ai/sdk/localapi/client.py +10 -0
  316. synth_ai/sdk/localapi/contracts.py +10 -0
  317. synth_ai/sdk/localapi/helpers.py +519 -0
  318. synth_ai/sdk/localapi/rollouts.py +87 -0
  319. synth_ai/sdk/localapi/server.py +29 -0
  320. synth_ai/sdk/localapi/template.py +70 -0
  321. synth_ai/sdk/streaming/__init__.py +35 -0
  322. synth_ai/sdk/streaming/config.py +94 -0
  323. synth_ai/sdk/streaming/handlers.py +1997 -0
  324. synth_ai/sdk/streaming/streamer.py +713 -0
  325. synth_ai/sdk/streaming/types.py +112 -0
  326. synth_ai/sdk/task/__init__.py +164 -0
  327. synth_ai/sdk/task/apps/__init__.py +169 -0
  328. synth_ai/sdk/task/auth.py +165 -0
  329. synth_ai/sdk/task/client.py +175 -0
  330. synth_ai/sdk/task/config.py +257 -0
  331. synth_ai/sdk/task/contracts.py +219 -0
  332. synth_ai/sdk/task/datasets.py +108 -0
  333. synth_ai/sdk/task/errors.py +50 -0
  334. synth_ai/sdk/task/health.py +34 -0
  335. synth_ai/sdk/task/in_process.py +1190 -0
  336. synth_ai/sdk/task/in_process_runner.py +314 -0
  337. synth_ai/sdk/task/inference_api.py +299 -0
  338. synth_ai/sdk/task/json.py +111 -0
  339. synth_ai/sdk/task/proxy.py +287 -0
  340. synth_ai/sdk/task/rubrics/__init__.py +55 -0
  341. synth_ai/sdk/task/rubrics/loaders.py +156 -0
  342. synth_ai/sdk/task/rubrics/models.py +57 -0
  343. synth_ai/sdk/task/rubrics/scoring.py +116 -0
  344. synth_ai/sdk/task/rubrics/strict.py +149 -0
  345. synth_ai/sdk/task/rubrics.py +219 -0
  346. synth_ai/sdk/task/server.py +631 -0
  347. synth_ai/sdk/task/trace_correlation_helpers.py +539 -0
  348. synth_ai/sdk/task/tracing_utils.py +95 -0
  349. synth_ai/sdk/task/validators.py +441 -0
  350. synth_ai/sdk/task/vendors.py +59 -0
  351. synth_ai/sdk/training/__init__.py +102 -0
  352. synth_ai/sdk/tunnels/__init__.py +83 -0
  353. synth_ai/sdk/tunnels/cleanup.py +83 -0
  354. synth_ai/sdk/tunnels/ports.py +120 -0
  355. synth_ai/utils/__init__.py +213 -0
  356. synth_ai-0.4.3.dist-info/METADATA +262 -0
  357. synth_ai-0.4.3.dist-info/RECORD +370 -0
  358. {synth_ai-0.2.6.dev1.dist-info → synth_ai-0.4.3.dist-info}/entry_points.txt +0 -1
  359. synth_ai/cli/calc.py +0 -69
  360. synth_ai/cli/demo.py +0 -131
  361. synth_ai/cli/legacy_root_backup.py +0 -470
  362. synth_ai/cli/man.py +0 -106
  363. synth_ai/cli/rl_demo.py +0 -137
  364. synth_ai/cli/status.py +0 -133
  365. synth_ai/config/base_url.py +0 -98
  366. synth_ai/core/experiment.py +0 -15
  367. synth_ai/core/system.py +0 -15
  368. synth_ai/demos/core/__init__.py +0 -1
  369. synth_ai/demos/core/cli.py +0 -685
  370. synth_ai/demos/demo_task_apps/__init__.py +0 -1
  371. synth_ai/demos/demo_task_apps/math/config.toml +0 -44
  372. synth_ai/demos/demo_task_apps/math/deploy_task_app.sh +0 -22
  373. synth_ai/environments/__init__.py +0 -31
  374. synth_ai/environments/environment/__init__.py +0 -1
  375. synth_ai/environments/environment/artifacts/__init__.py +0 -1
  376. synth_ai/environments/environment/artifacts/base.py +0 -52
  377. synth_ai/environments/environment/core.py +0 -67
  378. synth_ai/environments/environment/db/__init__.py +0 -1
  379. synth_ai/environments/environment/db/sqlite.py +0 -45
  380. synth_ai/environments/environment/registry.py +0 -233
  381. synth_ai/environments/environment/resources/sqlite.py +0 -45
  382. synth_ai/environments/environment/results.py +0 -1
  383. synth_ai/environments/environment/rewards/__init__.py +0 -1
  384. synth_ai/environments/environment/rewards/core.py +0 -29
  385. synth_ai/environments/environment/shared_engine.py +0 -26
  386. synth_ai/environments/environment/tools/__init__.py +0 -200
  387. synth_ai/environments/examples/__init__.py +0 -1
  388. synth_ai/environments/examples/bandit/__init__.py +0 -33
  389. synth_ai/environments/examples/bandit/engine.py +0 -294
  390. synth_ai/environments/examples/bandit/environment.py +0 -194
  391. synth_ai/environments/examples/bandit/taskset.py +0 -200
  392. synth_ai/environments/examples/crafter_classic/__init__.py +0 -8
  393. synth_ai/environments/examples/crafter_classic/agent_demos/analyze_semantic_words_markdown.py +0 -250
  394. synth_ai/environments/examples/crafter_classic/agent_demos/crafter_comprehensive_evaluation.py +0 -59
  395. synth_ai/environments/examples/crafter_classic/agent_demos/crafter_evaluation_browser.py +0 -152
  396. synth_ai/environments/examples/crafter_classic/agent_demos/crafter_evaluation_config.toml +0 -24
  397. synth_ai/environments/examples/crafter_classic/agent_demos/crafter_evaluation_framework.py +0 -1194
  398. synth_ai/environments/examples/crafter_classic/agent_demos/crafter_modal_ft/crafter_synth_config.toml +0 -56
  399. synth_ai/environments/examples/crafter_classic/agent_demos/crafter_modal_ft/filter_config_modal.toml +0 -32
  400. synth_ai/environments/examples/crafter_classic/agent_demos/crafter_modal_ft/filter_traces_sft_turso.py +0 -724
  401. synth_ai/environments/examples/crafter_classic/agent_demos/crafter_modal_ft/kick_off_ft_modal.py +0 -384
  402. synth_ai/environments/examples/crafter_classic/agent_demos/crafter_modal_ft/old/analyze_action_results.py +0 -53
  403. synth_ai/environments/examples/crafter_classic/agent_demos/crafter_modal_ft/old/analyze_agent_actions.py +0 -178
  404. synth_ai/environments/examples/crafter_classic/agent_demos/crafter_modal_ft/old/analyze_latest_run.py +0 -222
  405. synth_ai/environments/examples/crafter_classic/agent_demos/crafter_modal_ft/old/analyze_lm_traces.py +0 -183
  406. synth_ai/environments/examples/crafter_classic/agent_demos/crafter_modal_ft/old/analyze_no_rewards.py +0 -210
  407. synth_ai/environments/examples/crafter_classic/agent_demos/crafter_modal_ft/old/analyze_trace_issue.py +0 -206
  408. synth_ai/environments/examples/crafter_classic/agent_demos/crafter_modal_ft/old/check_db_schema.py +0 -49
  409. synth_ai/environments/examples/crafter_classic/agent_demos/crafter_modal_ft/old/check_latest_results.py +0 -64
  410. synth_ai/environments/examples/crafter_classic/agent_demos/crafter_modal_ft/old/debug_agent_responses.py +0 -88
  411. synth_ai/environments/examples/crafter_classic/agent_demos/crafter_modal_ft/old/quick_trace_check.py +0 -77
  412. synth_ai/environments/examples/crafter_classic/agent_demos/crafter_openai_ft/compare_experiments.py +0 -324
  413. synth_ai/environments/examples/crafter_classic/agent_demos/crafter_openai_ft/filter_traces_sft_turso.py +0 -580
  414. synth_ai/environments/examples/crafter_classic/agent_demos/crafter_openai_ft/kick_off_ft_oai.py +0 -362
  415. synth_ai/environments/examples/crafter_classic/agent_demos/crafter_openai_ft/multi_model_config.toml +0 -49
  416. synth_ai/environments/examples/crafter_classic/agent_demos/crafter_openai_ft/old/analyze_enhanced_hooks.py +0 -332
  417. synth_ai/environments/examples/crafter_classic/agent_demos/crafter_openai_ft/old/analyze_hook_events.py +0 -97
  418. synth_ai/environments/examples/crafter_classic/agent_demos/crafter_openai_ft/old/analyze_hook_results.py +0 -217
  419. synth_ai/environments/examples/crafter_classic/agent_demos/crafter_openai_ft/old/check_hook_storage.py +0 -87
  420. synth_ai/environments/examples/crafter_classic/agent_demos/crafter_openai_ft/old/check_seeds.py +0 -88
  421. synth_ai/environments/examples/crafter_classic/agent_demos/crafter_openai_ft/old/compare_seed_performance.py +0 -195
  422. synth_ai/environments/examples/crafter_classic/agent_demos/crafter_openai_ft/old/custom_eval_pipelines.py +0 -400
  423. synth_ai/environments/examples/crafter_classic/agent_demos/crafter_openai_ft/old/plot_hook_frequency.py +0 -195
  424. synth_ai/environments/examples/crafter_classic/agent_demos/crafter_openai_ft/old/seed_analysis_summary.py +0 -56
  425. synth_ai/environments/examples/crafter_classic/agent_demos/crafter_openai_ft/run_rollouts_for_models_and_compare_v3.py +0 -858
  426. synth_ai/environments/examples/crafter_classic/agent_demos/crafter_quick_evaluation.py +0 -52
  427. synth_ai/environments/examples/crafter_classic/agent_demos/crafter_react_agent.py +0 -874
  428. synth_ai/environments/examples/crafter_classic/agent_demos/crafter_trace_evaluation.py +0 -1412
  429. synth_ai/environments/examples/crafter_classic/agent_demos/example_v3_usage.py +0 -216
  430. synth_ai/environments/examples/crafter_classic/agent_demos/old/compare_traces.py +0 -296
  431. synth_ai/environments/examples/crafter_classic/agent_demos/old/crafter_comprehensive_evaluation.py +0 -58
  432. synth_ai/environments/examples/crafter_classic/agent_demos/old/crafter_env_serialization.py +0 -464
  433. synth_ai/environments/examples/crafter_classic/agent_demos/old/crafter_evaluation_browser.py +0 -152
  434. synth_ai/environments/examples/crafter_classic/agent_demos/old/crafter_quick_evaluation.py +0 -51
  435. synth_ai/environments/examples/crafter_classic/agent_demos/old/crafter_trace_evaluation.py +0 -1412
  436. synth_ai/environments/examples/crafter_classic/agent_demos/old/debug_player_loss.py +0 -112
  437. synth_ai/environments/examples/crafter_classic/agent_demos/old/diagnose_service.py +0 -203
  438. synth_ai/environments/examples/crafter_classic/agent_demos/old/diagnose_slowness.py +0 -305
  439. synth_ai/environments/examples/crafter_classic/agent_demos/old/eval_by_difficulty.py +0 -126
  440. synth_ai/environments/examples/crafter_classic/agent_demos/old/eval_example.py +0 -94
  441. synth_ai/environments/examples/crafter_classic/agent_demos/old/explore_saved_states.py +0 -142
  442. synth_ai/environments/examples/crafter_classic/agent_demos/old/filter_traces_sft.py +0 -26
  443. synth_ai/environments/examples/crafter_classic/agent_demos/old/filter_traces_sft_OLD.py +0 -984
  444. synth_ai/environments/examples/crafter_classic/agent_demos/old/generate_ft_data_gemini.py +0 -724
  445. synth_ai/environments/examples/crafter_classic/agent_demos/old/generate_ft_data_modal.py +0 -386
  446. synth_ai/environments/examples/crafter_classic/agent_demos/old/generate_ft_metadata.py +0 -205
  447. synth_ai/environments/examples/crafter_classic/agent_demos/old/kick_off_ft_gemini.py +0 -150
  448. synth_ai/environments/examples/crafter_classic/agent_demos/old/kick_off_ft_modal.py +0 -283
  449. synth_ai/environments/examples/crafter_classic/agent_demos/old/prepare_vertex_ft.py +0 -280
  450. synth_ai/environments/examples/crafter_classic/agent_demos/old/profile_env_slowness.py +0 -456
  451. synth_ai/environments/examples/crafter_classic/agent_demos/old/replicate_issue.py +0 -166
  452. synth_ai/environments/examples/crafter_classic/agent_demos/old/run_and_eval.py +0 -102
  453. synth_ai/environments/examples/crafter_classic/agent_demos/old/run_comparison.py +0 -128
  454. synth_ai/environments/examples/crafter_classic/agent_demos/old/run_qwen_rollouts.py +0 -655
  455. synth_ai/environments/examples/crafter_classic/agent_demos/old/trace_eval_OLD.py +0 -202
  456. synth_ai/environments/examples/crafter_classic/agent_demos/old/validate_openai_format.py +0 -166
  457. synth_ai/environments/examples/crafter_classic/config_logging.py +0 -111
  458. synth_ai/environments/examples/crafter_classic/debug_translation.py +0 -0
  459. synth_ai/environments/examples/crafter_classic/engine.py +0 -579
  460. synth_ai/environments/examples/crafter_classic/engine_deterministic_patch.py +0 -64
  461. synth_ai/environments/examples/crafter_classic/engine_helpers/action_map.py +0 -6
  462. synth_ai/environments/examples/crafter_classic/engine_helpers/serialization.py +0 -75
  463. synth_ai/environments/examples/crafter_classic/engine_serialization_patch_v3.py +0 -267
  464. synth_ai/environments/examples/crafter_classic/environment.py +0 -404
  465. synth_ai/environments/examples/crafter_classic/taskset.py +0 -233
  466. synth_ai/environments/examples/crafter_classic/trace_hooks_v3.py +0 -228
  467. synth_ai/environments/examples/crafter_classic/world_config_patch_simple.py +0 -299
  468. synth_ai/environments/examples/crafter_custom/__init__.py +0 -4
  469. synth_ai/environments/examples/crafter_custom/agent_demos/__init__.py +0 -1
  470. synth_ai/environments/examples/crafter_custom/agent_demos/trace_eval.py +0 -202
  471. synth_ai/environments/examples/crafter_custom/crafter/__init__.py +0 -7
  472. synth_ai/environments/examples/crafter_custom/crafter/config.py +0 -182
  473. synth_ai/environments/examples/crafter_custom/crafter/constants.py +0 -8
  474. synth_ai/environments/examples/crafter_custom/crafter/engine.py +0 -269
  475. synth_ai/environments/examples/crafter_custom/crafter/env.py +0 -262
  476. synth_ai/environments/examples/crafter_custom/crafter/objects.py +0 -417
  477. synth_ai/environments/examples/crafter_custom/crafter/recorder.py +0 -187
  478. synth_ai/environments/examples/crafter_custom/crafter/worldgen.py +0 -118
  479. synth_ai/environments/examples/crafter_custom/dataset_builder.py +0 -373
  480. synth_ai/environments/examples/crafter_custom/environment.py +0 -312
  481. synth_ai/environments/examples/crafter_custom/old/analyze_diamond_issue.py +0 -159
  482. synth_ai/environments/examples/crafter_custom/old/analyze_diamond_spawning.py +0 -158
  483. synth_ai/environments/examples/crafter_custom/old/compare_worlds.py +0 -71
  484. synth_ai/environments/examples/crafter_custom/old/dataset_stats.py +0 -105
  485. synth_ai/environments/examples/crafter_custom/old/diamond_spawning_summary.py +0 -119
  486. synth_ai/environments/examples/crafter_custom/old/example_dataset_usage.py +0 -52
  487. synth_ai/environments/examples/crafter_custom/run_dataset.py +0 -305
  488. synth_ai/environments/examples/enron/art_helpers/email_search_tools.py +0 -156
  489. synth_ai/environments/examples/enron/art_helpers/local_email_db.py +0 -281
  490. synth_ai/environments/examples/enron/art_helpers/types_enron.py +0 -25
  491. synth_ai/environments/examples/enron/engine.py +0 -295
  492. synth_ai/environments/examples/enron/environment.py +0 -166
  493. synth_ai/environments/examples/enron/taskset.py +0 -112
  494. synth_ai/environments/examples/enron/units/keyword_stats.py +0 -112
  495. synth_ai/environments/examples/minigrid/__init__.py +0 -48
  496. synth_ai/environments/examples/minigrid/agent_demos/minigrid_evaluation_framework.py +0 -1188
  497. synth_ai/environments/examples/minigrid/agent_demos/minigrid_quick_evaluation.py +0 -48
  498. synth_ai/environments/examples/minigrid/agent_demos/minigrid_react_agent.py +0 -562
  499. synth_ai/environments/examples/minigrid/agent_demos/minigrid_trace_evaluation.py +0 -221
  500. synth_ai/environments/examples/minigrid/engine.py +0 -589
  501. synth_ai/environments/examples/minigrid/environment.py +0 -274
  502. synth_ai/environments/examples/minigrid/environment_mapping.py +0 -242
  503. synth_ai/environments/examples/minigrid/puzzle_loader.py +0 -417
  504. synth_ai/environments/examples/minigrid/taskset.py +0 -583
  505. synth_ai/environments/examples/nethack/__init__.py +0 -7
  506. synth_ai/environments/examples/nethack/achievements.py +0 -337
  507. synth_ai/environments/examples/nethack/agent_demos/nethack_evaluation_framework.py +0 -981
  508. synth_ai/environments/examples/nethack/agent_demos/nethack_quick_evaluation.py +0 -74
  509. synth_ai/environments/examples/nethack/agent_demos/nethack_react_agent.py +0 -831
  510. synth_ai/environments/examples/nethack/engine.py +0 -739
  511. synth_ai/environments/examples/nethack/environment.py +0 -256
  512. synth_ai/environments/examples/nethack/helpers/__init__.py +0 -41
  513. synth_ai/environments/examples/nethack/helpers/action_mapping.py +0 -301
  514. synth_ai/environments/examples/nethack/helpers/nle_wrapper.py +0 -402
  515. synth_ai/environments/examples/nethack/helpers/observation_utils.py +0 -433
  516. synth_ai/environments/examples/nethack/helpers/recording_wrapper.py +0 -200
  517. synth_ai/environments/examples/nethack/helpers/trajectory_recorder.py +0 -269
  518. synth_ai/environments/examples/nethack/helpers/visualization/replay_viewer.py +0 -308
  519. synth_ai/environments/examples/nethack/helpers/visualization/visualizer.py +0 -431
  520. synth_ai/environments/examples/nethack/taskset.py +0 -323
  521. synth_ai/environments/examples/red/__init__.py +0 -7
  522. synth_ai/environments/examples/red/agent_demos/__init__.py +0 -1
  523. synth_ai/environments/examples/red/config_logging.py +0 -110
  524. synth_ai/environments/examples/red/engine.py +0 -694
  525. synth_ai/environments/examples/red/engine_helpers/__init__.py +0 -1
  526. synth_ai/environments/examples/red/engine_helpers/memory_map.py +0 -28
  527. synth_ai/environments/examples/red/engine_helpers/reward_components.py +0 -276
  528. synth_ai/environments/examples/red/engine_helpers/reward_library/__init__.py +0 -142
  529. synth_ai/environments/examples/red/engine_helpers/reward_library/adaptive_rewards.py +0 -57
  530. synth_ai/environments/examples/red/engine_helpers/reward_library/battle_rewards.py +0 -284
  531. synth_ai/environments/examples/red/engine_helpers/reward_library/composite_rewards.py +0 -150
  532. synth_ai/environments/examples/red/engine_helpers/reward_library/economy_rewards.py +0 -138
  533. synth_ai/environments/examples/red/engine_helpers/reward_library/efficiency_rewards.py +0 -57
  534. synth_ai/environments/examples/red/engine_helpers/reward_library/exploration_rewards.py +0 -331
  535. synth_ai/environments/examples/red/engine_helpers/reward_library/novelty_rewards.py +0 -121
  536. synth_ai/environments/examples/red/engine_helpers/reward_library/pallet_town_rewards.py +0 -559
  537. synth_ai/environments/examples/red/engine_helpers/reward_library/pokemon_rewards.py +0 -313
  538. synth_ai/environments/examples/red/engine_helpers/reward_library/social_rewards.py +0 -148
  539. synth_ai/environments/examples/red/engine_helpers/reward_library/story_rewards.py +0 -247
  540. synth_ai/environments/examples/red/engine_helpers/screen_analysis.py +0 -368
  541. synth_ai/environments/examples/red/engine_helpers/state_extraction.py +0 -140
  542. synth_ai/environments/examples/red/environment.py +0 -238
  543. synth_ai/environments/examples/red/taskset.py +0 -79
  544. synth_ai/environments/examples/red/units/__init__.py +0 -1
  545. synth_ai/environments/examples/sokoban/__init__.py +0 -1
  546. synth_ai/environments/examples/sokoban/agent_demos/sokoban_full_eval.py +0 -899
  547. synth_ai/environments/examples/sokoban/engine.py +0 -678
  548. synth_ai/environments/examples/sokoban/engine_helpers/__init__.py +0 -1
  549. synth_ai/environments/examples/sokoban/engine_helpers/room_utils.py +0 -657
  550. synth_ai/environments/examples/sokoban/engine_helpers/vendored/__init__.py +0 -18
  551. synth_ai/environments/examples/sokoban/engine_helpers/vendored/envs/__init__.py +0 -3
  552. synth_ai/environments/examples/sokoban/engine_helpers/vendored/envs/boxoban_env.py +0 -131
  553. synth_ai/environments/examples/sokoban/engine_helpers/vendored/envs/render_utils.py +0 -370
  554. synth_ai/environments/examples/sokoban/engine_helpers/vendored/envs/room_utils.py +0 -332
  555. synth_ai/environments/examples/sokoban/engine_helpers/vendored/envs/sokoban_env.py +0 -306
  556. synth_ai/environments/examples/sokoban/engine_helpers/vendored/envs/sokoban_env_fixed_targets.py +0 -67
  557. synth_ai/environments/examples/sokoban/engine_helpers/vendored/envs/sokoban_env_pull.py +0 -115
  558. synth_ai/environments/examples/sokoban/engine_helpers/vendored/envs/sokoban_env_two_player.py +0 -123
  559. synth_ai/environments/examples/sokoban/engine_helpers/vendored/envs/sokoban_env_variations.py +0 -394
  560. synth_ai/environments/examples/sokoban/environment.py +0 -229
  561. synth_ai/environments/examples/sokoban/generate_verified_puzzles.py +0 -440
  562. synth_ai/environments/examples/sokoban/puzzle_loader.py +0 -312
  563. synth_ai/environments/examples/sokoban/taskset.py +0 -428
  564. synth_ai/environments/examples/sokoban/units/astar_common.py +0 -95
  565. synth_ai/environments/examples/tictactoe/__init__.py +0 -1
  566. synth_ai/environments/examples/tictactoe/engine.py +0 -368
  567. synth_ai/environments/examples/tictactoe/environment.py +0 -240
  568. synth_ai/environments/examples/tictactoe/taskset.py +0 -215
  569. synth_ai/environments/examples/verilog/__init__.py +0 -10
  570. synth_ai/environments/examples/verilog/engine.py +0 -329
  571. synth_ai/environments/examples/verilog/environment.py +0 -350
  572. synth_ai/environments/examples/verilog/taskset.py +0 -420
  573. synth_ai/environments/examples/wordle/__init__.py +0 -29
  574. synth_ai/environments/examples/wordle/engine.py +0 -398
  575. synth_ai/environments/examples/wordle/environment.py +0 -159
  576. synth_ai/environments/examples/wordle/helpers/generate_instances_wordfreq.py +0 -75
  577. synth_ai/environments/examples/wordle/taskset.py +0 -230
  578. synth_ai/environments/reproducibility/core.py +0 -42
  579. synth_ai/environments/reproducibility/helpers.py +0 -0
  580. synth_ai/environments/reproducibility/tree.py +0 -364
  581. synth_ai/environments/service/app.py +0 -91
  582. synth_ai/environments/service/core_routes.py +0 -1020
  583. synth_ai/environments/service/external_registry.py +0 -56
  584. synth_ai/environments/service/registry.py +0 -9
  585. synth_ai/environments/stateful/__init__.py +0 -1
  586. synth_ai/environments/stateful/core.py +0 -163
  587. synth_ai/environments/stateful/engine.py +0 -21
  588. synth_ai/environments/stateful/state.py +0 -7
  589. synth_ai/environments/tasks/api.py +0 -19
  590. synth_ai/environments/tasks/core.py +0 -80
  591. synth_ai/environments/tasks/filters.py +0 -41
  592. synth_ai/environments/tasks/utils.py +0 -91
  593. synth_ai/environments/v0_observability/history.py +0 -3
  594. synth_ai/environments/v0_observability/log.py +0 -2
  595. synth_ai/evals/base.py +0 -15
  596. synth_ai/experimental/synth_oss.py +0 -446
  597. synth_ai/http.py +0 -102
  598. synth_ai/inference/client.py +0 -20
  599. synth_ai/install_sqld.sh +0 -40
  600. synth_ai/jobs/client.py +0 -246
  601. synth_ai/learning/__init__.py +0 -24
  602. synth_ai/learning/config.py +0 -43
  603. synth_ai/learning/filtering.py +0 -0
  604. synth_ai/learning/ft_client.py +0 -59
  605. synth_ai/learning/offline/dpo.py +0 -0
  606. synth_ai/learning/offline/providers.py +0 -7
  607. synth_ai/learning/offline/sft.py +0 -0
  608. synth_ai/learning/offline/shared.py +0 -0
  609. synth_ai/learning/online/grpo.py +0 -0
  610. synth_ai/learning/online/irft.py +0 -0
  611. synth_ai/learning/prompts/banking77_injection_eval.py +0 -168
  612. synth_ai/learning/prompts/gepa.py +0 -0
  613. synth_ai/learning/prompts/hello_world_in_context_injection_ex.py +0 -213
  614. synth_ai/learning/prompts/mipro.py +0 -289
  615. synth_ai/learning/prompts/random_search.py +0 -246
  616. synth_ai/learning/prompts/run_mipro_banking77.py +0 -172
  617. synth_ai/learning/prompts/run_random_search_banking77.py +0 -324
  618. synth_ai/learning/sse.py +0 -58
  619. synth_ai/learning/validators.py +0 -48
  620. synth_ai/lm/__init__.py +0 -51
  621. synth_ai/lm/caching/constants.py +0 -6
  622. synth_ai/lm/caching/dbs.py +0 -0
  623. synth_ai/lm/caching/ephemeral.py +0 -102
  624. synth_ai/lm/caching/handler.py +0 -137
  625. synth_ai/lm/caching/initialize.py +0 -11
  626. synth_ai/lm/caching/persistent.py +0 -114
  627. synth_ai/lm/config.py +0 -110
  628. synth_ai/lm/constants.py +0 -32
  629. synth_ai/lm/core/__init__.py +0 -8
  630. synth_ai/lm/core/all.py +0 -73
  631. synth_ai/lm/core/exceptions.py +0 -7
  632. synth_ai/lm/core/main.py +0 -319
  633. synth_ai/lm/core/main_v3.py +0 -594
  634. synth_ai/lm/core/synth_models.py +0 -48
  635. synth_ai/lm/core/vendor_clients.py +0 -188
  636. synth_ai/lm/cost/__init__.py +0 -0
  637. synth_ai/lm/cost/monitor.py +0 -1
  638. synth_ai/lm/cost/statefulness.py +0 -1
  639. synth_ai/lm/injection.py +0 -80
  640. synth_ai/lm/overrides.py +0 -206
  641. synth_ai/lm/provider_support/__init__.py +0 -8
  642. synth_ai/lm/provider_support/anthropic.py +0 -972
  643. synth_ai/lm/provider_support/openai.py +0 -1139
  644. synth_ai/lm/provider_support/suppress_logging.py +0 -31
  645. synth_ai/lm/structured_outputs/__init__.py +0 -0
  646. synth_ai/lm/structured_outputs/handler.py +0 -440
  647. synth_ai/lm/structured_outputs/inject.py +0 -297
  648. synth_ai/lm/structured_outputs/rehabilitate.py +0 -185
  649. synth_ai/lm/tools/__init__.py +0 -3
  650. synth_ai/lm/tools/base.py +0 -172
  651. synth_ai/lm/unified_interface.py +0 -202
  652. synth_ai/lm/vendors/__init__.py +0 -0
  653. synth_ai/lm/vendors/base.py +0 -81
  654. synth_ai/lm/vendors/core/__init__.py +0 -0
  655. synth_ai/lm/vendors/core/anthropic_api.py +0 -387
  656. synth_ai/lm/vendors/core/gemini_api.py +0 -292
  657. synth_ai/lm/vendors/core/mistral_api.py +0 -322
  658. synth_ai/lm/vendors/core/openai_api.py +0 -220
  659. synth_ai/lm/vendors/core/synth_dev_api.py +0 -0
  660. synth_ai/lm/vendors/local/__init__.py +0 -0
  661. synth_ai/lm/vendors/local/ollama.py +0 -0
  662. synth_ai/lm/vendors/openai_standard.py +0 -780
  663. synth_ai/lm/vendors/openai_standard_responses.py +0 -256
  664. synth_ai/lm/vendors/retries.py +0 -22
  665. synth_ai/lm/vendors/supported/__init__.py +0 -0
  666. synth_ai/lm/vendors/supported/custom_endpoint.py +0 -417
  667. synth_ai/lm/vendors/supported/deepseek.py +0 -69
  668. synth_ai/lm/vendors/supported/grok.py +0 -75
  669. synth_ai/lm/vendors/supported/groq.py +0 -16
  670. synth_ai/lm/vendors/supported/ollama.py +0 -15
  671. synth_ai/lm/vendors/supported/openrouter.py +0 -74
  672. synth_ai/lm/vendors/supported/together.py +0 -11
  673. synth_ai/lm/vendors/synth_client.py +0 -808
  674. synth_ai/lm/warmup.py +0 -186
  675. synth_ai/rl/secrets.py +0 -19
  676. synth_ai/scripts/verify_rewards.py +0 -100
  677. synth_ai/task/__init__.py +0 -10
  678. synth_ai/task/contracts.py +0 -120
  679. synth_ai/task/health.py +0 -28
  680. synth_ai/task/validators.py +0 -12
  681. synth_ai/tracing/__init__.py +0 -30
  682. synth_ai/tracing_v1/__init__.py +0 -33
  683. synth_ai/tracing_v3/config.py +0 -84
  684. synth_ai/tracing_v3/storage/config.py +0 -62
  685. synth_ai/tracing_v3/turso/__init__.py +0 -25
  686. synth_ai/tracing_v3/turso/daemon.py +0 -144
  687. synth_ai/tracing_v3/turso/manager.py +0 -760
  688. synth_ai/v0/tracing/__init__.py +0 -0
  689. synth_ai/v0/tracing/abstractions.py +0 -224
  690. synth_ai/v0/tracing/base_client.py +0 -91
  691. synth_ai/v0/tracing/client_manager.py +0 -131
  692. synth_ai/v0/tracing/config.py +0 -140
  693. synth_ai/v0/tracing/context.py +0 -146
  694. synth_ai/v0/tracing/decorators.py +0 -680
  695. synth_ai/v0/tracing/events/__init__.py +0 -0
  696. synth_ai/v0/tracing/events/manage.py +0 -147
  697. synth_ai/v0/tracing/events/scope.py +0 -86
  698. synth_ai/v0/tracing/events/store.py +0 -228
  699. synth_ai/v0/tracing/immediate_client.py +0 -151
  700. synth_ai/v0/tracing/local.py +0 -18
  701. synth_ai/v0/tracing/log_client_base.py +0 -73
  702. synth_ai/v0/tracing/retry_queue.py +0 -186
  703. synth_ai/v0/tracing/trackers.py +0 -515
  704. synth_ai/v0/tracing/upload.py +0 -510
  705. synth_ai/v0/tracing/utils.py +0 -9
  706. synth_ai/v0/tracing_v1/__init__.py +0 -16
  707. synth_ai/v0/tracing_v1/abstractions.py +0 -224
  708. synth_ai/v0/tracing_v1/base_client.py +0 -91
  709. synth_ai/v0/tracing_v1/client_manager.py +0 -131
  710. synth_ai/v0/tracing_v1/config.py +0 -140
  711. synth_ai/v0/tracing_v1/context.py +0 -146
  712. synth_ai/v0/tracing_v1/decorators.py +0 -701
  713. synth_ai/v0/tracing_v1/events/__init__.py +0 -0
  714. synth_ai/v0/tracing_v1/events/manage.py +0 -147
  715. synth_ai/v0/tracing_v1/events/scope.py +0 -86
  716. synth_ai/v0/tracing_v1/events/store.py +0 -228
  717. synth_ai/v0/tracing_v1/immediate_client.py +0 -151
  718. synth_ai/v0/tracing_v1/local.py +0 -18
  719. synth_ai/v0/tracing_v1/log_client_base.py +0 -73
  720. synth_ai/v0/tracing_v1/retry_queue.py +0 -186
  721. synth_ai/v0/tracing_v1/trackers.py +0 -515
  722. synth_ai/v0/tracing_v1/upload.py +0 -525
  723. synth_ai/v0/tracing_v1/utils.py +0 -9
  724. synth_ai/zyk/__init__.py +0 -30
  725. synth_ai-0.2.6.dev1.dist-info/METADATA +0 -106
  726. synth_ai-0.2.6.dev1.dist-info/RECORD +0 -416
  727. /synth_ai/{demos → cli/demo_apps}/demo_task_apps/math/__init__.py +0 -0
  728. /synth_ai/{lm/caching → core/apps}/__init__.py +0 -0
  729. /synth_ai/{tracing_v3 → core/tracing_v3}/lm_call_record_abstractions.py +0 -0
  730. /synth_ai/{tracing_v3 → core/tracing_v3}/storage/__init__.py +0 -0
  731. /synth_ai/{tracing_v3 → core/tracing_v3}/storage/exceptions.py +0 -0
  732. /synth_ai/{tracing_v3 → core/tracing_v3}/storage/types.py +0 -0
  733. /synth_ai/{compound/cais.py → py.typed} +0 -0
  734. /synth_ai/{learning → sdk/learning}/core.py +0 -0
  735. /synth_ai/{learning → sdk/learning}/gateway.py +0 -0
  736. {synth_ai-0.2.6.dev1.dist-info → synth_ai-0.4.3.dist-info}/WHEEL +0 -0
  737. {synth_ai-0.2.6.dev1.dist-info → synth_ai-0.4.3.dist-info}/licenses/LICENSE +0 -0
  738. {synth_ai-0.2.6.dev1.dist-info → synth_ai-0.4.3.dist-info}/top_level.txt +0 -0
@@ -1,678 +0,0 @@
1
- from __future__ import annotations
2
-
3
- import logging
4
- from dataclasses import dataclass
5
- from typing import Any, Dict, Optional, Tuple
6
-
7
- import numpy as np
8
-
9
- from synth_ai.environments.environment.rewards.core import RewardComponent, RewardStack
10
- from synth_ai.environments.environment.shared_engine import (
11
- GetObservationCallable,
12
- InternalObservation,
13
- )
14
- from synth_ai.environments.examples.sokoban.engine_helpers.vendored.envs.sokoban_env import (
15
- ACTION_LOOKUP,
16
- )
17
- from synth_ai.environments.examples.sokoban.engine_helpers.vendored.envs.sokoban_env import (
18
- SokobanEnv as GymSokobanEnv,
19
- )
20
- from synth_ai.environments.examples.sokoban.taskset import (
21
- SokobanTaskInstance,
22
- ) # Assuming this is where SokobanTaskInstance is defined
23
- from synth_ai.environments.reproducibility.core import IReproducibleEngine # Added import
24
- from synth_ai.environments.stateful.engine import StatefulEngine, StatefulEngineSnapshot
25
- from synth_ai.environments.tasks.core import TaskInstance
26
-
27
- # No monkey-patch needed - we fixed the vendored code directly
28
-
29
# Module-level logger used by the Sokoban engine for warnings and errors.
logger = logging.getLogger(__name__)
# NOTE(review): basicConfig() runs at import time and, when the root logger has
# no handlers yet, configures it at DEBUG level for the whole process.
logging.basicConfig(level=logging.DEBUG)
# Keep PIL's verbose debug records out of the output.
logging.getLogger("PIL").setLevel(logging.WARNING)

# --- Action Mapping ---
# Action names are listed in id order, so each name's position is its integer id.
ACTION_STRING_TO_INT: Dict[str, int] = {
    action_name: action_id
    for action_id, action_name in enumerate(
        (
            "no operation",
            "push up",
            "push down",
            "push left",
            "push right",
            "move up",
            "move down",
            "move left",
            "move right",
        )
    )
}
# Reverse lookup: integer id -> action name.
INT_TO_ACTION_STRING: Dict[int, str] = dict(
    zip(ACTION_STRING_TO_INT.values(), ACTION_STRING_TO_INT.keys())
)
48
-
49
-
50
@dataclass
class SokobanEngineSnapshot(StatefulEngineSnapshot):
    """Serialized SokobanEngine: the task instance plus the wrapped env's state."""

    # Result of ``task_instance.serialize()`` for the engine's task instance.
    task_instance_dict: Dict
    # Plain-data dump of the wrapped Sokoban env (grids, box mapping, counters).
    engine_snapshot: Dict
54
-
55
-
56
@dataclass
class SokobanPublicState:
    """Agent-visible view of the board and the episode counters."""

    dim_room: Tuple[int, int]
    room_fixed: np.ndarray  # copy of the wrapped env's ``room_fixed`` grid
    room_state: np.ndarray  # copy of the wrapped env's ``room_state`` grid
    player_position: Tuple[int, int]
    boxes_on_target: int
    num_steps: int
    max_steps: int
    last_action_name: str
    num_boxes: int
    error_info: Optional[str] = None

    def diff(self, prev_state: "SokobanPublicState") -> Dict[str, Any]:
        """Report the fields that differ from ``prev_state``.

        A changed array field maps to ``True``; any other changed field maps
        to ``(old_value, new_value)``. Unchanged fields are left out.
        """
        delta: Dict[str, Any] = {}
        for name in self.__dataclass_fields__:  # type: ignore[attr-defined]
            current = getattr(self, name)
            previous = getattr(prev_state, name)
            if isinstance(current, np.ndarray):
                # Arrays are only flagged as changed; the contents are not stored.
                if not np.array_equal(current, previous):
                    delta[name] = True
                continue
            if current != previous:
                delta[name] = (previous, current)
        return delta

    @property
    def room_text(self) -> str:
        """Text rendering of ``room_state`` as produced by ``_grid_to_text``."""
        return _grid_to_text(self.room_state)

    def to_dict(self) -> Dict[str, Any]:
        """Return the fields as a dict, with both grids converted to nested lists."""
        return dict(
            dim_room=self.dim_room,
            room_fixed=self.room_fixed.tolist(),
            room_state=self.room_state.tolist(),
            player_position=self.player_position,
            boxes_on_target=self.boxes_on_target,
            num_steps=self.num_steps,
            max_steps=self.max_steps,
            last_action_name=self.last_action_name,
            num_boxes=self.num_boxes,
            error_info=self.error_info,
        )

    def __repr__(self) -> str:
        """Short summary that deliberately leaves the array fields out."""
        return (
            f"SokobanPublicState(dim_room={self.dim_room}, "
            f"num_steps={self.num_steps}, "
            f"boxes_on_target={self.boxes_on_target})"
        )

    def __str__(self) -> str:
        """Same text as ``__repr__``."""
        return repr(self)
107
-
108
-
109
@dataclass
class SokobanPrivateState:
    """Engine-side bookkeeping: rewards, episode-end flags and optional RNG state."""

    reward_last: float
    total_reward: float
    terminated: bool
    truncated: bool
    rng_state: dict | None = None

    @staticmethod
    def _values_differ(new_v: Any, old_v: Any) -> bool:
        """Return True when two field values differ, tolerating numpy arrays.

        ``rng_state`` may be a (nested) dict holding numpy arrays; comparing
        such dicts with ``!=`` raises ``ValueError`` because the truth value
        of an element-wise array comparison is ambiguous.
        """
        if isinstance(new_v, dict) and isinstance(old_v, dict):
            if new_v.keys() != old_v.keys():
                return True
            # Identical objects count as equal, mirroring dict equality.
            return any(
                new_v[key] is not old_v[key]
                and SokobanPrivateState._values_differ(new_v[key], old_v[key])
                for key in new_v
            )
        if isinstance(new_v, np.ndarray) or isinstance(old_v, np.ndarray):
            return not np.array_equal(new_v, old_v)
        return bool(new_v != old_v)

    def diff(self, prev_state: "SokobanPrivateState") -> Dict[str, Any]:
        """Return ``{field: (old_value, new_value)}`` for every field that changed."""
        changes: Dict[str, Any] = {}
        for field in self.__dataclass_fields__:  # type: ignore[attr-defined]
            new_v, old_v = getattr(self, field), getattr(prev_state, field)
            if self._values_differ(new_v, old_v):
                changes[field] = (old_v, new_v)
        return changes

    def to_dict(self) -> Dict[str, Any]:
        """Return the fields as a plain dict; ``rng_state`` is passed through as-is."""
        return {
            "reward_last": self.reward_last,
            "total_reward": self.total_reward,
            "terminated": self.terminated,
            "truncated": self.truncated,
            "rng_state": self.rng_state,
        }

    def __repr__(self) -> str:
        """Short summary that leaves ``truncated`` and ``rng_state`` out."""
        return f"SokobanPrivateState(reward_last={self.reward_last}, total_reward={self.total_reward}, terminated={self.terminated})"

    def __str__(self) -> str:
        """Same text as ``__repr__``."""
        return self.__repr__()
142
-
143
-
144
- # Note - just how we roll! Show your agent whatever state you want
145
- # Close to original
146
def _grid_to_text(grid: np.ndarray) -> str:
    """Render a room grid as text: one line per row, one glyph per cell.

    Each cell is converted to ``int`` and looked up in ``GRID_LOOKUP``; codes
    missing from the table are rendered as ``"?"``.
    """
    rendered_rows = []
    for row in grid:
        glyphs = [GRID_LOOKUP.get(int(cell), "?") for cell in row]  # type: ignore[arg-type]
        rendered_rows.append("".join(glyphs))
    return "\n".join(rendered_rows)
152
-
153
-
154
class SynthSokobanObservationCallable(GetObservationCallable):
    """Per-step observation: rendered board plus counters, rewards and end flags."""

    def __init__(self):
        pass

    async def get_observation(
        self, pub: SokobanPublicState, priv: SokobanPrivateState
    ) -> InternalObservation:  # type: ignore[override]
        """Build the observation dict from the public and private state.

        Values are coerced to built-in ``int``/``float``/``bool``/``tuple``.
        """
        return dict(
            room_text=_grid_to_text(pub.room_state),
            player_position=tuple(int(coord) for coord in pub.player_position),
            boxes_on_target=int(pub.boxes_on_target),
            steps_taken=int(pub.num_steps),
            max_steps=int(pub.max_steps),
            last_action=pub.last_action_name,
            reward_last=float(priv.reward_last),
            total_reward=float(priv.total_reward),
            terminated=bool(priv.terminated),
            truncated=bool(priv.truncated),
            num_boxes=int(pub.num_boxes),
        )
175
-
176
-
177
- # Close to original
178
class SynthSokobanCheckpointObservationCallable(GetObservationCallable):
    """
    End-of-episode observation.
    Mirrors the legacy 'final_observation' concept: the full board text plus
    the final tallies, reported under ``*_final`` keys.
    """

    def __init__(self):
        pass

    async def get_observation(
        self, pub: SokobanPublicState, priv: SokobanPrivateState
    ) -> InternalObservation:  # type: ignore[override]
        """Build the final-observation dict from the public and private state."""
        return dict(
            room_text_final=_grid_to_text(pub.room_state),
            boxes_on_target_final=int(pub.boxes_on_target),
            steps_taken_final=int(pub.num_steps),
            total_reward=float(priv.total_reward),
            terminated=bool(priv.terminated),
            truncated=bool(priv.truncated),
            num_boxes=int(pub.num_boxes),
        )
200
-
201
-
202
- # Think of engine as the actual logic, then with hooks to update the public and private state
203
- # Note - I don't really want to split up the transformation/engine logic from the instance information. There's already quite a bit of abstraction, so let's make the hard call here. I observe that this class does combine the responsibility of tracking engine state AND containing dynamics, but I think it's fine.
204
-
205
-
206
# Cell code -> 3-character glyph used when rendering a room grid as text.
# This module relies on code 3 (a box on a target) and code 5 (the player).
# NOTE(review): the meaning of the other codes comes from the vendored env — confirm there.
GRID_LOOKUP = {
    0: " # ",
    1: " _ ",
    2: " O ",
    3: " √ ",
    4: " X ",
    5: " P ",
    6: " S ",
}
207
-
208
-
209
- def _count_boxes_on_target(room_state: np.ndarray) -> int:
210
- """Return number of boxes currently sitting on target tiles."""
211
- return int(np.sum(room_state == 3))
212
-
213
-
214
def package_sokoban_env_from_engine_snapshot(
    engine_snapshot: Dict[str, Any],
) -> GymSokobanEnv:
    """Rebuild a Sokoban env from a saved-state dict.

    Required keys: ``dim_room``, ``room_fixed``, ``room_state``. Optional keys
    and their defaults: ``max_steps`` (120), ``num_boxes`` (1), ``box_mapping``
    (empty), ``num_env_steps`` (0), ``boxes_on_target`` (counted from the
    grid), ``reward_last`` (0) and ``np_random_state`` (RNG left untouched).

    Raises:
        KeyError: if a required key is missing.
        IndexError: if ``room_state`` has no cell with code 5 (the player).
    """
    # Build the env with reset=False; every field is filled in from the snapshot.
    env = GymSokobanEnv(
        dim_room=tuple(engine_snapshot["dim_room"]),
        max_steps=engine_snapshot.get("max_steps", 120),
        num_boxes=engine_snapshot.get("num_boxes", 1),
        reset=False,
    )

    # Core grids.
    env.room_fixed = np.asarray(engine_snapshot["room_fixed"], dtype=int)
    env.room_state = np.asarray(engine_snapshot["room_state"], dtype=int)

    # Box mapping is accepted in two serialized shapes.
    stored_mapping = engine_snapshot.get("box_mapping", {})
    box_mapping = {}
    if isinstance(stored_mapping, list):
        # [{"original": [r, c], "current": [r, c]}, ...]
        for entry in stored_mapping:
            box_mapping[tuple(entry["original"])] = tuple(entry["current"])
    else:
        # {"[r,c]": [r, c], ...} -- keys are bracketed, comma-separated ints.
        for key_text, current in stored_mapping.items():
            original = tuple(int(part) for part in key_text.strip("[]").split(","))
            box_mapping[original] = tuple(current)
    env.box_mapping = box_mapping

    # Auxiliary fields; the player is located from the grid, not the snapshot.
    env.player_position = np.argwhere(env.room_state == 5)[0]
    env.num_env_steps = engine_snapshot.get("num_env_steps", 0)
    counted_on_target = int(np.sum(env.room_state == 3))
    env.boxes_on_target = engine_snapshot.get("boxes_on_target", counted_on_target)
    env.reward_last = engine_snapshot.get("reward_last", 0)

    # RNG is only restored when the snapshot carries a non-empty state.
    saved_rng = engine_snapshot.get("np_random_state")
    if not saved_rng:
        return env

    env.seed()  # init env.np_random
    # NOTE(review): the 5-tuple follows the legacy RandomState.set_state layout
    # and reads snapshot keys "key", "state" and "pos" -- confirm against
    # whatever produces "np_random_state".
    env.np_random.set_state(
        (
            saved_rng["key"],
            np.array(saved_rng["state"], dtype=np.uint32),
            saved_rng["pos"],
            0,  # has_gauss
            0.0,  # cached_gaussian
        )
    )
    return env
259
-
260
-
261
- # --- Reward Components ---
262
class SokobanGoalAchievedComponent(RewardComponent):
    """Reward component worth 1.0 whenever every box sits on a target."""

    async def score(self, state: "SokobanPublicState", action: Any) -> float:
        """Return 1.0 if ``boxes_on_target`` equals ``num_boxes``, else 0.0.

        ``action`` is not used.
        """
        all_boxes_placed = state.boxes_on_target == state.num_boxes
        return 1.0 if all_boxes_placed else 0.0
267
-
268
-
269
class SokobanStepPenaltyComponent(RewardComponent):
    """Reward component that returns the same fixed penalty on every step."""

    def __init__(self, penalty: float = -0.01):
        """Store the per-step ``penalty`` and set this component's weight to 1.0."""
        super().__init__()
        self.penalty, self.weight = penalty, 1.0

    async def score(self, state: Any, action: Any) -> float:
        """Return the configured penalty; ``state`` and ``action`` are not used."""
        return self.penalty
277
-
278
-
279
- class SokobanEngine(StatefulEngine, IReproducibleEngine):
280
- task_instance: TaskInstance
281
- package_sokoban_env: GymSokobanEnv
282
-
283
- # sokoban stuff
284
-
285
def __init__(self, task_instance: TaskInstance):
    """Create the engine and its wrapped env for ``task_instance``.

    When the task instance carries a non-empty ``initial_engine_snapshot`` the
    env is rebuilt from it; otherwise a warning is logged and a 5x5, 1-box,
    50-step env is created without being reset.
    """
    self.task_instance = task_instance
    self._total_reward = 0.0  # cumulative reward for the current episode
    self._current_action_for_reward: Optional[int] = None
    self.reward_stack = RewardStack(
        components=[
            SokobanGoalAchievedComponent(),
            SokobanStepPenaltyComponent(penalty=-0.01),
        ]
    )

    init_snap: dict | None = getattr(self.task_instance, "initial_engine_snapshot", None)

    if not init_snap:
        # No initial snapshot - this should not happen with the new pre-generated
        # puzzle system, so fall back to a minimal default environment.
        logger.warning(
            "No initial_engine_snapshot provided - this should not happen with verified puzzles"
        )
        self.package_sokoban_env = GymSokobanEnv(
            dim_room=(5, 5),
            max_steps=50,
            num_boxes=1,
            reset=False,  # Don't reset during creation to avoid generation
        )
        return

    self.package_sokoban_env = package_sokoban_env_from_engine_snapshot(init_snap)
    restored_env = self.package_sokoban_env
    # Recount from the grid so the counter agrees with the restored board.
    restored_env.boxes_on_target = _count_boxes_on_target(restored_env.room_state)
317
-
318
- # gives the observation!
319
- # also final rewards when those are passed in
320
- async def _render(
321
- self,
322
- private_state: SokobanPrivateState,
323
- public_state: SokobanPublicState,
324
- get_observation: Optional[GetObservationCallable] = None,
325
- ) -> str:
326
- """
327
- 1. choose the observation callable (default = SynthSokobanObservationCallable)
328
- 2. fetch obs via callable(pub, priv)
329
- 3. if callable returned a dict -> pretty-print board + footer
330
- if str -> forward unchanged
331
- """
332
- # 1 – pick callable
333
- obs_cb = get_observation or SynthSokobanObservationCallable()
334
-
335
- # 2 – pull observation
336
- obs = await obs_cb.get_observation(public_state, private_state)
337
-
338
- # 3 – stringify
339
- if isinstance(obs, str):
340
- return obs
341
-
342
- if isinstance(obs, dict):
343
- board_txt = (
344
- obs.get("room_text")
345
- or obs.get("room_text_final")
346
- or _grid_to_text(public_state.room_state)
347
- )
348
- footer = (
349
- f"steps: {public_state.num_steps}/{public_state.max_steps} | "
350
- f"boxes✓: {public_state.boxes_on_target} | "
351
- f"last_r: {private_state.reward_last:.2f} | "
352
- f"total_r: {private_state.total_reward:.2f}"
353
- )
354
- return f"{board_txt}\n{footer}"
355
-
356
- # unknown payload type -> fallback
357
- return str(obs)
358
-
359
- # yields private state, public state
360
async def _step_engine(self, action: int) -> Tuple[SokobanPrivateState, SokobanPublicState]:
    """Apply ``action`` to the wrapped env and return ``(private, public)`` state.

    The reward returned by the wrapped env is discarded; the step reward comes
    from ``self.reward_stack`` and is added to the running total.
    """
    self._current_action_for_reward = action  # context for the reward stack

    env = self.package_sokoban_env
    # Only the termination flag of the wrapped env's step result is used.
    _obs_raw, _gym_reward, terminated_gym, _info = env.step(action)

    # Recount from the grid instead of trusting the env's own counter.
    env.boxes_on_target = _count_boxes_on_target(env.room_state)
    current_pub_state = SokobanPublicState(
        dim_room=env.dim_room,
        room_fixed=env.room_fixed.copy(),
        room_state=env.room_state.copy(),
        player_position=tuple(env.player_position),
        boxes_on_target=env.boxes_on_target,
        num_steps=env.num_env_steps,
        max_steps=env.max_steps,
        last_action_name=ACTION_LOOKUP.get(action, "Unknown"),
        num_boxes=env.num_boxes,
    )

    # Reward components see the fresh public state and the raw agent action.
    reward_from_stack = await self.reward_stack.step_reward(
        state=current_pub_state, action=self._current_action_for_reward
    )
    self._current_action_for_reward = None  # clear the context

    self._total_reward += reward_from_stack
    # Mirror the reward onto the env for inspection; the stack stays authoritative.
    env.reward_last = reward_from_stack

    solved = env.boxes_on_target == env.num_boxes
    if solved:
        # A solved puzzle always terminates and is never reported as truncated.
        terminated, truncated = True, False
    else:
        terminated = terminated_gym or solved
        # Running out of steps without solving counts as truncation.
        truncated = (env.num_env_steps >= env.max_steps) and not solved

    priv = SokobanPrivateState(
        reward_last=reward_from_stack,
        total_reward=self._total_reward,
        terminated=terminated,
        truncated=truncated,
    )
    return priv, current_pub_state
415
-
416
async def _reset_engine(
    self, *, seed: int | None = None
) -> Tuple[SokobanPrivateState, SokobanPublicState]:
    """
    (Re)build the wrapped Sokoban env in a fresh state.

    1. Look for an initial snapshot on the TaskInstance.
    2. If present → hydrate the env from it (``seed`` is not used on this
       path); otherwise log a warning and call ``env.reset(seed=seed)`` on the
       existing env.
    3. Zero the cumulative reward and emit fresh state objects.

    Raises:
        RuntimeError: if the fallback ``env.reset`` fails.
    """
    self._total_reward = 0.0
    self._current_action_for_reward = None

    # Default to None, as __init__ does, so a task instance without the
    # attribute reaches the fallback branch instead of raising AttributeError.
    init_snap: dict | None = getattr(self.task_instance, "initial_engine_snapshot", None)

    if init_snap:
        self.package_sokoban_env = package_sokoban_env_from_engine_snapshot(init_snap)
        # ensure counter correct even if snapshot was stale
        self.package_sokoban_env.boxes_on_target = _count_boxes_on_target(
            self.package_sokoban_env.room_state
        )
    else:
        # No initial snapshot - this should not happen with the new pre-generated puzzle system
        logger.warning(
            "No initial_engine_snapshot provided during reset - this should not happen with verified puzzles"
        )
        # Simple fallback: try to reset the existing environment
        try:
            _ = self.package_sokoban_env.reset(seed=seed)
            # Update the boxes_on_target counter
            self.package_sokoban_env.boxes_on_target = _count_boxes_on_target(
                self.package_sokoban_env.room_state
            )
        except Exception as e:
            logger.error("Failed to reset environment: %s", e)
            raise RuntimeError(
                "Environment reset failed. This should not happen with verified puzzles. "
                "Ensure task instances have initial_engine_snapshot."
            ) from e

    # build first public/private views
    priv = SokobanPrivateState(
        reward_last=0.0,
        total_reward=0.0,
        terminated=False,
        truncated=False,
        # NOTE(review): assumes the env already has an np_random exposing
        # bit_generator on both paths — confirm for snapshot-hydrated envs.
        rng_state=self.package_sokoban_env.np_random.bit_generator.state,
    )
    pub = SokobanPublicState(
        dim_room=self.package_sokoban_env.dim_room,
        room_fixed=self.package_sokoban_env.room_fixed.copy(),
        room_state=self.package_sokoban_env.room_state.copy(),
        player_position=tuple(self.package_sokoban_env.player_position),
        boxes_on_target=self.package_sokoban_env.boxes_on_target,
        num_steps=self.package_sokoban_env.num_env_steps,
        max_steps=self.package_sokoban_env.max_steps,
        last_action_name="Initial",
        num_boxes=self.package_sokoban_env.num_boxes,
    )
    return priv, pub
476
-
477
async def _serialize_engine(self) -> SokobanEngineSnapshot:
    """Dump wrapped env + task_instance into a JSON-ready snapshot.

    Array-valued env fields are converted with ``.tolist()`` / ``list(...)``
    and ``box_mapping`` is flattened into a list of
    ``{"original": [...], "current": [...]}`` entries.

    Returns:
        A ``SokobanEngineSnapshot`` holding the serialized TaskInstance
        (via its own ``serialize()``) and the env snapshot dict.
    """
    env = self.package_sokoban_env

    snap: Dict[str, Any] = {
        "dim_room": list(env.dim_room),
        "max_steps": env.max_steps,
        "num_boxes": env.num_boxes,
        "room_fixed": env.room_fixed.tolist(),
        "room_state": env.room_state.tolist(),
        "box_mapping": [
            {"original": list(k), "current": list(v)} for k, v in env.box_mapping.items()
        ],
        "player_position": env.player_position.tolist(),
        "num_env_steps": env.num_env_steps,
        "boxes_on_target": env.boxes_on_target,
        "reward_last": env.reward_last,
        # Falls back to 0.0 if the engine never initialised its running total.
        "total_reward": getattr(self, "_total_reward", 0.0),
        # NOTE: the env's RNG state ("np_random_state") is not serialized here.
    }

    # Serialize the TaskInstance using its own serialize method
    task_instance_dict = await self.task_instance.serialize()

    return SokobanEngineSnapshot(
        task_instance_dict=task_instance_dict,  # Store serialized TaskInstance
        engine_snapshot=snap,
    )
511
-
512
@classmethod
async def _deserialize_engine(
    cls, sokoban_engine_snapshot: "SokobanEngineSnapshot"
) -> "SokobanEngine":
    """
    Rebuild a SokobanEngine from a snapshot blob.

    The TaskInstance is restored through ``SokobanTaskInstance.deserialize``,
    the engine object is created without running ``__init__``, and the
    wrapped env is hydrated from ``engine_snapshot``. ``total_reward`` is
    read from the snapshot and defaults to 0.0 when the key is absent.
    """
    # Step 1: restore the TaskInstance with the concrete deserializer.
    restored_task = await SokobanTaskInstance.deserialize(
        sokoban_engine_snapshot.task_instance_dict
    )

    # Step 2: allocate the engine without calling its __init__, then run only
    # the StatefulEngine initialiser before attaching the restored task.
    restored_engine = cls.__new__(cls)
    StatefulEngine.__init__(restored_engine)
    restored_engine.task_instance = restored_task

    # Step 3: recreate the attributes that __init__ would normally set.
    restored_engine._current_action_for_reward = None
    reward_components = [
        SokobanGoalAchievedComponent(),
        SokobanStepPenaltyComponent(penalty=-0.01),
    ]
    restored_engine.reward_stack = RewardStack(components=reward_components)

    # Step 4: hydrate the wrapped env and the running reward total.
    env_payload = sokoban_engine_snapshot.engine_snapshot
    restored_engine.package_sokoban_env = package_sokoban_env_from_engine_snapshot(env_payload)
    restored_engine._total_reward = sokoban_engine_snapshot.engine_snapshot.get(
        "total_reward", 0.0
    )
    return restored_engine
543
-
544
def get_current_states_for_observation(
    self,
) -> Tuple[SokobanPrivateState, SokobanPublicState]:
    """Return the current (private, public) states without stepping the env.

    Intended for callers that need an observation after an error in
    Environment.step. ``terminated`` is true when every box is on a target;
    ``truncated`` is true once the step count reaches ``max_steps``.
    """
    env = self.package_sokoban_env

    all_boxes_placed = bool(env.boxes_on_target == env.num_boxes)
    step_budget_spent = bool(env.num_env_steps >= env.max_steps)

    private_state = SokobanPrivateState(
        reward_last=env.reward_last,  # last reward recorded on the env
        total_reward=self._total_reward,
        terminated=all_boxes_placed,
        truncated=step_budget_spent,
    )
    public_state = SokobanPublicState(
        dim_room=env.dim_room,
        room_fixed=env.room_fixed.copy(),
        room_state=env.room_state.copy(),
        player_position=tuple(env.player_position),
        boxes_on_target=env.boxes_on_target,
        num_steps=env.num_env_steps,
        max_steps=env.max_steps,
        # "Initial" is reported when the env has no last_action attribute
        # or the recorded action id is not in ACTION_LOOKUP.
        last_action_name=ACTION_LOOKUP.get(getattr(env, "last_action", -1), "Initial"),
        num_boxes=env.num_boxes,
    )
    return private_state, public_state
574
-
575
-
576
if __name__ == "__main__":
    import asyncio
    import random

    # Tile codes used in the grids below:
    #   0=wall, 1=floor, 2=target, 4=box-not-on-target, 5=player
    # NOTE(review): task_instance_dict is not referenced by sanity(), which
    # builds a bare TaskInstance() instead - confirm whether it should be wired in.
    task_instance_dict = {
        "initial_engine_snapshot": {
            "dim_room": [5, 5],
            "max_steps": 120,
            "num_boxes": 1,
            "room_fixed": [
                [0, 0, 0, 0, 0],
                [0, 1, 1, 2, 0],
                [0, 1, 0, 1, 0],
                [0, 1, 1, 1, 0],
                [0, 0, 0, 0, 0],
            ],
            "room_state": [
                [0, 0, 0, 0, 0],
                [0, 1, 4, 1, 0],
                [0, 1, 0, 1, 0],
                [0, 1, 5, 1, 0],
                [0, 0, 0, 0, 0],
            ],
            "box_mapping": [{"original": [1, 2], "current": [3, 2]}],
            "boxes_on_target": 0,
            "np_random_state": {
                "key": "MT19937",
                "state": [1804289383, 846930886, 1681692777, 1714636915],
                "pos": 0,
            },
            "reward_last": 0,
            "num_env_steps": 0,
        }
    }

    async def sanity():
        """Reset an engine, then play up to 10 random moves, printing each state."""
        task_instance = TaskInstance()
        engine = SokobanEngine(task_instance=task_instance)
        priv, pub = await engine._reset_engine()
        print(await engine._render(priv, pub))  # initial board

        for _ in range(10):
            action_id = random.randint(0, 8)  # inclusive action range 0-8
            priv, pub = await engine._step_engine(action_id)
            print(f"\n### step {pub.num_steps} — {ACTION_LOOKUP[action_id]} ###")
            print("public:", pub)
            print("private:", priv)
            print(await engine._render(priv, pub))
            # stop as soon as the episode is solved or out of steps
            if priv.terminated or priv.truncated:
                break

    asyncio.run(sanity())
649
- # sokoban_engine = SokobanEngine.deserialize(
650
- # engine_snapshot=SokobanEngineSnapshot(
651
- # instance=instance_information,
652
- # snapshot_dict=instance_information["initial_engine_snapshot"],
653
- # )
654
- # )
655
-
656
-
657
- # {
658
- # "dim_room": [5, 5],
659
- # "max_steps": 120,
660
- # "num_boxes": 1,
661
-
662
- # "room_fixed": [...], // as above
663
- # "room_state": [...], // current grid (3 = box-on-target)
664
-
665
- # "box_mapping": {
666
- # "[1,3]": [3,2] // origin-target → current-pos pairs
667
- # },
668
- # "player_position": [3, 2], // row, col
669
-
670
- # "num_env_steps": 15, // steps already taken
671
- # "boxes_on_target": 0, // live counter
672
-
673
- # "np_random_state": { // optional but makes replay bit-exact
674
- # "key": "MT19937",
675
- # "state": [1804289383, 846930886, ...],
676
- # "pos": 123
677
- # }
678
- # }
@@ -1 +0,0 @@
1
- # Engine helpers for Sokoban