synth-ai 0.2.9.dev3__py3-none-any.whl → 0.2.9.dev5__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.


This version of synth-ai might be problematic. Click here for more details.

Files changed (107) hide show
  1. examples/analyze_semantic_words.sh +17 -0
  2. examples/common_old/backend.py +21 -0
  3. examples/crafter_debug_render.py +180 -0
  4. examples/evals_old/README.md +98 -0
  5. examples/evals_old/__init__.py +6 -0
  6. examples/evals_old/compare_models.py +1037 -0
  7. examples/evals_old/example_log.md +145 -0
  8. examples/evals_old/run_demo.sh +126 -0
  9. examples/evals_old/trace_analysis.py +270 -0
  10. examples/finetuning_old/_backup_synth_qwen/config.toml +29 -0
  11. examples/finetuning_old/_backup_synth_qwen/example_log.md +324 -0
  12. examples/finetuning_old/_backup_synth_qwen/filter_traces.py +60 -0
  13. examples/finetuning_old/_backup_synth_qwen/filter_traces_achievements.py +239 -0
  14. examples/finetuning_old/_backup_synth_qwen/purge_v3_traces.py +109 -0
  15. examples/finetuning_old/_backup_synth_qwen/react_agent_lm.py +1924 -0
  16. examples/finetuning_old/_backup_synth_qwen/readme.md +49 -0
  17. examples/finetuning_old/_backup_synth_qwen/run_crafter_qwen4b.py +114 -0
  18. examples/finetuning_old/_backup_synth_qwen/run_demo.sh +195 -0
  19. examples/finetuning_old/_backup_synth_qwen/sft_kickoff.py +118 -0
  20. examples/finetuning_old/synth_qwen_v1/README.md +68 -0
  21. examples/finetuning_old/synth_qwen_v1/filter_traces.py +60 -0
  22. examples/finetuning_old/synth_qwen_v1/filter_traces_achievements.py +239 -0
  23. examples/finetuning_old/synth_qwen_v1/finetune.py +46 -0
  24. examples/finetuning_old/synth_qwen_v1/hello_ft_model.py +71 -0
  25. examples/finetuning_old/synth_qwen_v1/infer.py +37 -0
  26. examples/finetuning_old/synth_qwen_v1/poll.py +44 -0
  27. examples/finetuning_old/synth_qwen_v1/prepare_data.py +35 -0
  28. examples/finetuning_old/synth_qwen_v1/purge_v3_traces.py +109 -0
  29. examples/finetuning_old/synth_qwen_v1/react_agent_lm.py +1932 -0
  30. examples/finetuning_old/synth_qwen_v1/run_crafter_sft_job.py +207 -0
  31. examples/finetuning_old/synth_qwen_v1/run_ft_job.py +232 -0
  32. examples/finetuning_old/synth_qwen_v1/upload_data.py +34 -0
  33. examples/finetuning_old/synth_qwen_v1/util.py +147 -0
  34. examples/rl/README.md +169 -0
  35. examples/rl/configs/eval_base_qwen.toml +15 -0
  36. examples/rl/configs/eval_rl_qwen.toml +11 -0
  37. examples/rl/configs/rl_from_base_qwen.toml +35 -0
  38. examples/rl/configs/rl_from_base_qwen17.toml +74 -0
  39. examples/rl/configs/rl_from_ft_qwen.toml +35 -0
  40. examples/rl/download_dataset.py +64 -0
  41. examples/rl/run_eval.py +435 -0
  42. examples/rl/run_rl_and_save.py +94 -0
  43. examples/rl/task_app/README.md +22 -0
  44. {synth_ai/task/apps → examples/rl/task_app}/math_single_step.py +8 -8
  45. examples/rl/task_app/math_task_app.py +107 -0
  46. examples/rl_old/task_app.py +962 -0
  47. examples/run_crafter_demo.sh +10 -0
  48. examples/warming_up_to_rl/analyze_trace_db.py +420 -0
  49. examples/warming_up_to_rl/configs/crafter_fft.toml +48 -0
  50. examples/warming_up_to_rl/configs/crafter_fft_4b.toml +54 -0
  51. examples/warming_up_to_rl/configs/eval_fft_qwen4b.toml +20 -0
  52. examples/warming_up_to_rl/configs/eval_groq_qwen32b.toml +13 -0
  53. examples/warming_up_to_rl/configs/eval_modal_qwen4b.toml +23 -0
  54. examples/warming_up_to_rl/configs/rl_from_base_qwen4b.toml +73 -0
  55. examples/warming_up_to_rl/configs/rl_from_ft.toml +56 -0
  56. examples/warming_up_to_rl/export_trace_sft.py +541 -0
  57. examples/warming_up_to_rl/groq_test.py +88 -0
  58. examples/warming_up_to_rl/manage_secrets.py +127 -0
  59. examples/warming_up_to_rl/old/event_rewards.md +234 -0
  60. examples/warming_up_to_rl/old/notes.md +73 -0
  61. examples/warming_up_to_rl/readme.md +172 -0
  62. examples/warming_up_to_rl/run_eval.py +434 -0
  63. examples/warming_up_to_rl/run_fft_and_save.py +309 -0
  64. examples/warming_up_to_rl/run_local_rollout.py +188 -0
  65. examples/warming_up_to_rl/run_local_rollout_modal.py +160 -0
  66. examples/warming_up_to_rl/run_local_rollout_parallel.py +342 -0
  67. examples/warming_up_to_rl/run_local_rollout_traced.py +372 -0
  68. examples/warming_up_to_rl/run_rl_and_save.py +101 -0
  69. examples/warming_up_to_rl/run_rollout_remote.py +129 -0
  70. examples/warming_up_to_rl/task_app/README.md +38 -0
  71. {synth_ai/task/apps → examples/warming_up_to_rl/task_app}/grpo_crafter.py +7 -7
  72. examples/warming_up_to_rl/task_app/grpo_crafter_task_app.py +165 -0
  73. examples/warming_up_to_rl/task_app/synth_envs_hosted/README.md +173 -0
  74. examples/warming_up_to_rl/task_app/synth_envs_hosted/__init__.py +5 -0
  75. examples/warming_up_to_rl/task_app/synth_envs_hosted/branching.py +145 -0
  76. examples/warming_up_to_rl/task_app/synth_envs_hosted/environment_routes.py +1271 -0
  77. examples/warming_up_to_rl/task_app/synth_envs_hosted/envs/__init__.py +1 -0
  78. examples/warming_up_to_rl/task_app/synth_envs_hosted/envs/crafter/__init__.py +6 -0
  79. examples/warming_up_to_rl/task_app/synth_envs_hosted/envs/crafter/app.py +1 -0
  80. examples/warming_up_to_rl/task_app/synth_envs_hosted/envs/crafter/environment.py +429 -0
  81. examples/warming_up_to_rl/task_app/synth_envs_hosted/envs/crafter/policy.py +442 -0
  82. examples/warming_up_to_rl/task_app/synth_envs_hosted/envs/crafter/react_agent.py +96 -0
  83. examples/warming_up_to_rl/task_app/synth_envs_hosted/envs/crafter/shared.py +302 -0
  84. examples/warming_up_to_rl/task_app/synth_envs_hosted/envs/crafter/tools.py +47 -0
  85. examples/warming_up_to_rl/task_app/synth_envs_hosted/hosted_app.py +202 -0
  86. examples/warming_up_to_rl/task_app/synth_envs_hosted/inference/__init__.py +5 -0
  87. examples/warming_up_to_rl/task_app/synth_envs_hosted/inference/openai_client.py +512 -0
  88. examples/warming_up_to_rl/task_app/synth_envs_hosted/main.py +102 -0
  89. examples/warming_up_to_rl/task_app/synth_envs_hosted/policy_routes.py +985 -0
  90. examples/warming_up_to_rl/task_app/synth_envs_hosted/registry.py +197 -0
  91. examples/warming_up_to_rl/task_app/synth_envs_hosted/rollout.py +1749 -0
  92. examples/warming_up_to_rl/task_app/synth_envs_hosted/storage/__init__.py +5 -0
  93. examples/warming_up_to_rl/task_app/synth_envs_hosted/storage/volume.py +217 -0
  94. examples/warming_up_to_rl/task_app/synth_envs_hosted/test_agents.py +160 -0
  95. examples/warming_up_to_rl/task_app/synth_envs_hosted/test_service.py +146 -0
  96. examples/warming_up_to_rl/task_app/synth_envs_hosted/utils.py +61 -0
  97. synth_ai/api/train/config_finder.py +18 -18
  98. synth_ai/api/train/env_resolver.py +28 -1
  99. synth_ai/cli/task_apps.py +291 -56
  100. synth_ai/task/apps/__init__.py +54 -13
  101. {synth_ai-0.2.9.dev3.dist-info → synth_ai-0.2.9.dev5.dist-info}/METADATA +1 -1
  102. {synth_ai-0.2.9.dev3.dist-info → synth_ai-0.2.9.dev5.dist-info}/RECORD +106 -13
  103. {synth_ai-0.2.9.dev3.dist-info → synth_ai-0.2.9.dev5.dist-info}/top_level.txt +1 -0
  104. synth_ai/environments/examples/sokoban/units/astar_common.py +0 -95
  105. {synth_ai-0.2.9.dev3.dist-info → synth_ai-0.2.9.dev5.dist-info}/WHEEL +0 -0
  106. {synth_ai-0.2.9.dev3.dist-info → synth_ai-0.2.9.dev5.dist-info}/entry_points.txt +0 -0
  107. {synth_ai-0.2.9.dev3.dist-info → synth_ai-0.2.9.dev5.dist-info}/licenses/LICENSE +0 -0
@@ -1,3 +1,99 @@
1
+ examples/analyze_semantic_words.sh,sha256=z-3qJBAlQuMrfRzoszofle_2b3Fy79rymvEAcoBQGXU,652
2
+ examples/crafter_debug_render.py,sha256=6Zak0RQZPXYy88v5dcon-XEdt01_NI027o1v2Fx4nhk,6178
3
+ examples/run_crafter_demo.sh,sha256=7FNvooSgq-ezccGy5j_h_uRXObiQtcnybPcTwaVGDpo,392
4
+ examples/common_old/backend.py,sha256=ygPtZREi9W2JQI7xI0J1jz3VaWBgILTfgpgFLVGMEPY,538
5
+ examples/evals_old/README.md,sha256=Te1TsgcOyDBf-ICdHkA12XBd4ClQXGFj8uytbggto1s,3503
6
+ examples/evals_old/__init__.py,sha256=6E7OuWJsBiG7USgsR5uFGeU1JYZ6TFreUFMwgBxrJ6A,189
7
+ examples/evals_old/compare_models.py,sha256=bCqtIKkR06u5pJHY65496ImokYlIEOMrtWFT_T_b3dM,43883
8
+ examples/evals_old/example_log.md,sha256=DgdmUkU0N_g2WhobwCqkpw1Itjq8E7wS2CCcLsLSLJw,9470
9
+ examples/evals_old/run_demo.sh,sha256=UwygYAn-LDdq-XSjygrDSs30UykQX5EO9Q5atqspc0Q,4625
10
+ examples/evals_old/trace_analysis.py,sha256=uIImBarDqo81zJOcFxjCusZg9YHsARs09q0Y5l6-iXs,10686
11
+ examples/finetuning_old/_backup_synth_qwen/config.toml,sha256=7bs3-AS23Cu9nbTYYurlk1fMJPF5LuYPD1Vumyt3XK4,734
12
+ examples/finetuning_old/_backup_synth_qwen/example_log.md,sha256=1CG-1dZsIzdWDVLrTYBO3vld_b8o9sqG_-rDEpTcA_I,12246
13
+ examples/finetuning_old/_backup_synth_qwen/filter_traces.py,sha256=aFGy0-KoPQyIbk4cJBh4wnqzuqgCEVsrFbEor454ktY,2045
14
+ examples/finetuning_old/_backup_synth_qwen/filter_traces_achievements.py,sha256=bploSuwCeLelHytJcVoDKkRyldvrFfZMpTVfWrwEzcg,9359
15
+ examples/finetuning_old/_backup_synth_qwen/purge_v3_traces.py,sha256=qGHwWA0DKBCNs8rB39NHwpTFe8izNNYQjtyHVrzWYTk,3406
16
+ examples/finetuning_old/_backup_synth_qwen/react_agent_lm.py,sha256=sYTauRlPdsZeA17YNffjdWyHUZeojRUFHgQ4bu27TvQ,80387
17
+ examples/finetuning_old/_backup_synth_qwen/readme.md,sha256=2M7m1VqHNCEDOPmEWC0NsyXMFn0rB3bjMX4uNA5GOp0,1763
18
+ examples/finetuning_old/_backup_synth_qwen/run_crafter_qwen4b.py,sha256=gUrjpMtLRJCuM4UMY9k-8gKqDoY4nyK4aY5G4rC9exw,4353
19
+ examples/finetuning_old/_backup_synth_qwen/run_demo.sh,sha256=bN3TdD2Bowdu2yFrcKkN1rDqeSjivSNS63fO5tAjB6o,7239
20
+ examples/finetuning_old/_backup_synth_qwen/sft_kickoff.py,sha256=oFyK6LQDQ5SbsTJXJUzyUTPklWOZwdw_VyO3SR7IXSw,4223
21
+ examples/finetuning_old/synth_qwen_v1/README.md,sha256=ZWYfjax9iyrljAwUqiZwNHqtJAajz1G75rSiBNTveHo,4322
22
+ examples/finetuning_old/synth_qwen_v1/filter_traces.py,sha256=aFGy0-KoPQyIbk4cJBh4wnqzuqgCEVsrFbEor454ktY,2045
23
+ examples/finetuning_old/synth_qwen_v1/filter_traces_achievements.py,sha256=bploSuwCeLelHytJcVoDKkRyldvrFfZMpTVfWrwEzcg,9359
24
+ examples/finetuning_old/synth_qwen_v1/finetune.py,sha256=6dLJjR3T-QOCgyOwz9jiucKuCz-So_eN88Z8ZwChJiU,1204
25
+ examples/finetuning_old/synth_qwen_v1/hello_ft_model.py,sha256=G4JLMmqGYBsV2rEfguOU-ZZlryE2bVO7vGxoxFBi3Jg,2286
26
+ examples/finetuning_old/synth_qwen_v1/infer.py,sha256=q9ykYhlP7Rrtb8RSK0qn6y8Tm63hax6rBpsFwtTMocY,918
27
+ examples/finetuning_old/synth_qwen_v1/poll.py,sha256=AJx2StdxkZBLnZPNupBSoIc4BHCifEmybPt5pb57QqA,1228
28
+ examples/finetuning_old/synth_qwen_v1/prepare_data.py,sha256=1UMP23z-TkJOGYCEEJqC9980_k2l7x5cpPSpEUWykx0,832
29
+ examples/finetuning_old/synth_qwen_v1/purge_v3_traces.py,sha256=qGHwWA0DKBCNs8rB39NHwpTFe8izNNYQjtyHVrzWYTk,3406
30
+ examples/finetuning_old/synth_qwen_v1/react_agent_lm.py,sha256=NYjf5Vqyi2Ri_oC6etDYmCE4Am9kK4aF3d1wqDut6j8,80577
31
+ examples/finetuning_old/synth_qwen_v1/run_crafter_sft_job.py,sha256=-bpXjFPp00JCEE5T7TCeRARZjQzCTmcpd0nH4y-sDho,7878
32
+ examples/finetuning_old/synth_qwen_v1/run_ft_job.py,sha256=-OOt2dJNw5dwYq5lF7XXZkuY5Qsj1Qnl5dKulZvDoSA,8561
33
+ examples/finetuning_old/synth_qwen_v1/upload_data.py,sha256=bYEFbsaKGt6nZ6kQKNnx7AklFmE3Hxp9d6r6xsh8PeE,882
34
+ examples/finetuning_old/synth_qwen_v1/util.py,sha256=v_4c2JQNRG7oIHIKOkXLZXg42CMqs4-yav2MuId7MpY,5801
35
+ examples/rl/README.md,sha256=qzv-URBhEr3r4ipEyh-mP9CiCIz_KbckZWlfXdWbafA,6560
36
+ examples/rl/download_dataset.py,sha256=XZwRbASLN4rjvfwqvet-sdhOojcEjCAvXWFNOSUZhWc,2515
37
+ examples/rl/run_eval.py,sha256=TlUlTHJ9dNOxZuyTF4A6F6JpSghvQ6rqC3yk4271BKw,14973
38
+ examples/rl/run_rl_and_save.py,sha256=Pe-zQzLrdO6CbRTt3vMslRlACMmLXQSUTr5Ow_DVh6k,3160
39
+ examples/rl/configs/eval_base_qwen.toml,sha256=EntLk6oScfan4-CiK0MeqO9vu-ZFBTo97tjlNSQOhd8,323
40
+ examples/rl/configs/eval_rl_qwen.toml,sha256=o07ZvAxjj_ejj3zbjESmtpIOh6QqkwpTD2ZUL9Lzx5A,247
41
+ examples/rl/configs/rl_from_base_qwen.toml,sha256=KDDtpvVikHZCcyUKYtgWq9XAfAEY5vRADPpcxpkdVsg,605
42
+ examples/rl/configs/rl_from_base_qwen17.toml,sha256=CLfuzZaTvpqezPrpOy03ZKvR6D3tZ0vExOsyvdn4ETo,1346
43
+ examples/rl/configs/rl_from_ft_qwen.toml,sha256=7s5HK_YM7zVnvjJavvfai8Nc_eUx_70cgHeWN19vXXM,638
44
+ examples/rl/task_app/README.md,sha256=oHfcMF9V_CPLnGbrarTRRIQpQ1wqV1zL74KWUZtcKwI,802
45
+ examples/rl/task_app/math_single_step.py,sha256=DIucCB5MC_1doIxfJxH6qXVsSijqh78cz-vQaKjFDEk,30379
46
+ examples/rl/task_app/math_task_app.py,sha256=e8inAZsLJxcAMtjwDVzvgb9-x9DYds4OKugthtm_riw,4180
47
+ examples/rl_old/task_app.py,sha256=ctVxuMKPaEKuf46fmSi2tb2bXe55bvhpxA5xTAYxwh4,47078
48
+ examples/warming_up_to_rl/analyze_trace_db.py,sha256=ywtQj-p2vsGQ8ikr4zXQY18YDKsbEnCRcz1MkJZot68,14424
49
+ examples/warming_up_to_rl/export_trace_sft.py,sha256=dreS63IyvpEjm2wVOGfPKIsE67bX0sui4WVS8aq46yA,20278
50
+ examples/warming_up_to_rl/groq_test.py,sha256=McqwDlKc2YZXmJQ9sI27dpdUl5wqn8xEDNi7V58ltl4,3089
51
+ examples/warming_up_to_rl/manage_secrets.py,sha256=ySZ6V_AXOWpFzjVSpxA-TaBWkhpWeIiC5jM6K3FOrmQ,4372
52
+ examples/warming_up_to_rl/readme.md,sha256=viacw40ZG-u-duqBd2RN5mG63__h2x1w37DPnKqpYV8,6169
53
+ examples/warming_up_to_rl/run_eval.py,sha256=llgsyx7E8pi7egn0qcDONzldDXShP6_Ntp-qTjQuNQQ,19078
54
+ examples/warming_up_to_rl/run_fft_and_save.py,sha256=DPeFnGJ2U2lB0azJ9CcN1c5pn0lSOfb6qYgtSGi0cEw,13426
55
+ examples/warming_up_to_rl/run_local_rollout.py,sha256=V6uMFZkfnh6ndndNq-rPnTkzWr3gNVWLVNmQlWb6Oik,8164
56
+ examples/warming_up_to_rl/run_local_rollout_modal.py,sha256=XxKZv_zE9zWFrt99N1tP6X8TfB883pKWsvDUUsHW1oc,6798
57
+ examples/warming_up_to_rl/run_local_rollout_parallel.py,sha256=_p11RDzH6DVVzanML9VKQahDxuKRH5PwwGsBgzo7DSE,12951
58
+ examples/warming_up_to_rl/run_local_rollout_traced.py,sha256=_UL46Rdj_oo8gEnyBfPfVkvCj7VoU99eahn3_i_-pMI,13656
59
+ examples/warming_up_to_rl/run_rl_and_save.py,sha256=dpFr42Vk03jTlDPyOUcDbu8zGJwGsMW4PKKPuBciAJs,3649
60
+ examples/warming_up_to_rl/run_rollout_remote.py,sha256=iIW5FI5cFDcnt80Tjh-uqL_O4uVoIqdnqfIjjLjFGZg,4769
61
+ examples/warming_up_to_rl/configs/crafter_fft.toml,sha256=Hbp2tVhaGxRAip1vwhID73rCIO6bi_yI-gUen-oylcA,1137
62
+ examples/warming_up_to_rl/configs/crafter_fft_4b.toml,sha256=q_cnU3P-eGG_VFOepw9IA1U-m7L-uJH37EUFR3mNWBI,1358
63
+ examples/warming_up_to_rl/configs/eval_fft_qwen4b.toml,sha256=YP4HLWDh6iIvw6McPXw5kK1RUFQF4dvKP4yH5bHT5nI,678
64
+ examples/warming_up_to_rl/configs/eval_groq_qwen32b.toml,sha256=zQi31JYa83kW-ceEqDZi-7oajsCmEPrlJR57zN5ygO8,340
65
+ examples/warming_up_to_rl/configs/eval_modal_qwen4b.toml,sha256=6eeU1GVvK1cYSEuGXk-AhOwJLgRcf74CTOI5XlqNYBc,817
66
+ examples/warming_up_to_rl/configs/rl_from_base_qwen4b.toml,sha256=qVSypYOMUd8g6pmiovi7nsgk4jgMBjJIORpIsrmNV4U,1644
67
+ examples/warming_up_to_rl/configs/rl_from_ft.toml,sha256=d1cIoLeC80NgOjn0Wohk0a5IXE_ImHVgMsxWPkyAFKQ,1381
68
+ examples/warming_up_to_rl/old/event_rewards.md,sha256=gHJd3ZeYOnj4xPXt-7sSJamgOaJQ-BpfdaF-CKJK3-0,13450
69
+ examples/warming_up_to_rl/old/notes.md,sha256=Y9Zs_tUb2Y6kv0MmGe-kAvGM9zCtEDY3Ccf5j7PoFGU,4468
70
+ examples/warming_up_to_rl/task_app/README.md,sha256=kqDPpv7f0Oh0CoH4qSXqZoKXNIh8guNpxHrELW0z6RY,1346
71
+ examples/warming_up_to_rl/task_app/grpo_crafter.py,sha256=Cx_uNlo1hXpN5VO72O5MdBSz0Z8CZNfhlhbm868lTmg,15898
72
+ examples/warming_up_to_rl/task_app/grpo_crafter_task_app.py,sha256=lMfIcWpJdXMdQyozLAaCeK9dx2D1LPNSav2I2zG7Z9I,6046
73
+ examples/warming_up_to_rl/task_app/synth_envs_hosted/README.md,sha256=kJaN1do8V4XM2_g51WMI3edCDpv5zEw_nrMFtEwO1SQ,4614
74
+ examples/warming_up_to_rl/task_app/synth_envs_hosted/__init__.py,sha256=_zdnpK5Dl26o0-CTcljBBRfdwTy4o60aOLhex59VE6U,120
75
+ examples/warming_up_to_rl/task_app/synth_envs_hosted/branching.py,sha256=SlCgKMg8_quH8bIJSMKlkommz36XvngVvgzrjRR1SBs,5393
76
+ examples/warming_up_to_rl/task_app/synth_envs_hosted/environment_routes.py,sha256=W8MWFhRor65u0lp6FhOXJjc-j5W5ooEwWwF2UnCg1KE,50069
77
+ examples/warming_up_to_rl/task_app/synth_envs_hosted/hosted_app.py,sha256=QMQHxi6glj9cnTJc6F8H7ivv2x8Mer5WQrR5Vs-xv94,7776
78
+ examples/warming_up_to_rl/task_app/synth_envs_hosted/main.py,sha256=0g7OZl6CnrddETD1DOAQZxz_P1fZR0F7kuCeZb4BRHg,2510
79
+ examples/warming_up_to_rl/task_app/synth_envs_hosted/policy_routes.py,sha256=qP3E9XAhHihKyz1l44FD4Zb5zoZt8v6m5HNhOLe4fxk,43685
80
+ examples/warming_up_to_rl/task_app/synth_envs_hosted/registry.py,sha256=pMVwiutZe5DcPXdNmIhRJGwxIz3Xn3FtdkKKqrOEdOM,5613
81
+ examples/warming_up_to_rl/task_app/synth_envs_hosted/rollout.py,sha256=506KV0x0oOajTuNVVWLUxeIXG2YaZjWwfgbVg2EorcA,71477
82
+ examples/warming_up_to_rl/task_app/synth_envs_hosted/test_agents.py,sha256=PRkQlVKGfn2-w4EOTTHc8T-tqFW6m21mS7BII6TUUd4,5599
83
+ examples/warming_up_to_rl/task_app/synth_envs_hosted/test_service.py,sha256=PAYPP0tWU0cQUUxJuAYbDwvWeGjAcPFRHsW2vG3vOpg,5228
84
+ examples/warming_up_to_rl/task_app/synth_envs_hosted/utils.py,sha256=Qcxfa_WASxbUCbAKejiZB6QIl8eJeeIrFPt5GU-Zb6E,2013
85
+ examples/warming_up_to_rl/task_app/synth_envs_hosted/envs/__init__.py,sha256=5e-BmaXi_5EGcqF2hEGsnbtkHsNvPNMTX9wJ3yiz3XQ,34
86
+ examples/warming_up_to_rl/task_app/synth_envs_hosted/envs/crafter/__init__.py,sha256=nTmSVzOfRUnjxEN1-IHjxuvPHij-AdRu_NZoH6Ozv2M,197
87
+ examples/warming_up_to_rl/task_app/synth_envs_hosted/envs/crafter/app.py,sha256=MnaRrqkxxeOaHLD-ulH5P1BauDs3tWKdxM0n85jfp6g,19
88
+ examples/warming_up_to_rl/task_app/synth_envs_hosted/envs/crafter/environment.py,sha256=9OzSAPO5HMhMLQ2cfJMs6TO8-r4uGSw_JQgztu1MXGM,20112
89
+ examples/warming_up_to_rl/task_app/synth_envs_hosted/envs/crafter/policy.py,sha256=Bf7ypw2VqPUtiIycAP_irglYtf7sGvAWIvvIZsok-qI,19373
90
+ examples/warming_up_to_rl/task_app/synth_envs_hosted/envs/crafter/react_agent.py,sha256=dHASD8zbinK32mE4dEMQqmQpGjaomFbJQ_yIw8vYOrY,6157
91
+ examples/warming_up_to_rl/task_app/synth_envs_hosted/envs/crafter/shared.py,sha256=2ampoR9RVrh7T05nq-z4hg2KnSGVBo5A1ESYMae780s,10180
92
+ examples/warming_up_to_rl/task_app/synth_envs_hosted/envs/crafter/tools.py,sha256=-jVxok4pkDm3t9VwuUivm0y4xmYBq16wqOrSpAHoT6Q,1787
93
+ examples/warming_up_to_rl/task_app/synth_envs_hosted/inference/__init__.py,sha256=6O23CobxVe8fkuGmWDPhg4Kzf1Q6pmtQZIad8DHubjI,178
94
+ examples/warming_up_to_rl/task_app/synth_envs_hosted/inference/openai_client.py,sha256=3lIubZOcCslZTu1dK8qt76yB68l9RAx9WFKy6_9BaVk,23807
95
+ examples/warming_up_to_rl/task_app/synth_envs_hosted/storage/__init__.py,sha256=55vZdcz3qI1wt4qfNyC1LSFTPm6wKM7oF5iyNnR6Lvg,133
96
+ examples/warming_up_to_rl/task_app/synth_envs_hosted/storage/volume.py,sha256=dxAHrHnOa-_pnbHrtLYdD1EwYX8la8LwR5B6kOmt_n8,6953
1
97
  synth_ai/__init__.py,sha256=NixuXddy4lS2Wmj0F8eMt0HS_oYCTnq3iVVq5VYwWIc,1341
2
98
  synth_ai/__main__.py,sha256=Kh1xBKkTE5Vs2qNMtDuuOXerHUptMcOiF3YziOpC6DA,146
3
99
  synth_ai/demo_registry.py,sha256=pH-Pyrocp2vNBcw7J80Nu_525nBtI5G_dC4d4mQDYl8,8531
@@ -8,8 +104,8 @@ synth_ai/install_sqld.sh,sha256=AMBhlfq661PxeTTc6D4K_Nei_qwMvA84ei4NhQzmUUk,928
8
104
  synth_ai/api/train/__init__.py,sha256=aBwlmrj1HWVwDcvUrX4TqpS0BgvkE7Pv7npoIZmtTFU,118
9
105
  synth_ai/api/train/builders.py,sha256=Fe684cGh-CQGPXydESCOjTkQpxbTJb47rVYKT8uONTs,6045
10
106
  synth_ai/api/train/cli.py,sha256=OyS6-NU1BUVitjUYYCtQenLXmprU9dDqYOR6tfeW7B0,17897
11
- synth_ai/api/train/config_finder.py,sha256=iH4a-_6rtGvhxBNINag5WivEX2W-Jb1_YysjN-ooOYM,5311
12
- synth_ai/api/train/env_resolver.py,sha256=PLvuorBg3ugxZUsfDeZAMrqmqEt56aGRInmhuHD6z8g,10715
107
+ synth_ai/api/train/config_finder.py,sha256=8HwyVRZ3WuXU2c7MdJgQVT29C-53zOWGcaucbkMso6c,5194
108
+ synth_ai/api/train/env_resolver.py,sha256=PoXGD-Gpifs8FuSGF_xKNIA90QrUnLW8S5zMaUGm_yg,11451
13
109
  synth_ai/api/train/pollers.py,sha256=EbkoV601aXEpqgfjNuugivtDooiRgOxBXSYZZ0Muj24,2114
14
110
  synth_ai/api/train/task_app.py,sha256=Pk-bCqBEkjgbf9tzFeRik5uC0No_2Y536TSiLcJ47h0,6419
15
111
  synth_ai/api/train/utils.py,sha256=rkouZjOFvY9WKXIuG-rlJhH9eyLLxi_ID6dj0JMNSmI,7213
@@ -23,7 +119,7 @@ synth_ai/cli/recent.py,sha256=mHhM-QrR_MfjfKSzBvvPUEC-lkXTWUZrQwqYTmb2x0Y,4173
23
119
  synth_ai/cli/rl_demo.py,sha256=P09_atVrSTfGUhAs0Obe63erniJ3EDHtm51yL2xBouM,8796
24
120
  synth_ai/cli/root.py,sha256=0fuWNO5NeWTSCANzPBfoQsZKe3iUxnJ9hsSWS-SK2UM,11370
25
121
  synth_ai/cli/status.py,sha256=M_bt7U58Ubi-q-ZlrIpgCASKq9_k6uMjpx926f6kLLA,4591
26
- synth_ai/cli/task_apps.py,sha256=gJDoW4aH2HFZK1fLPkCQ4EpVaBq_3lL8DmHzwObtdDo,40070
122
+ synth_ai/cli/task_apps.py,sha256=AQmZtnvNDHMRhvUF0KOvnIF1tRbg0J-nwnJe1T49ajg,52077
27
123
  synth_ai/cli/traces.py,sha256=_QBdCR92u0Gv51U4DH0Ws1d5yCrbJRpaYKe7pmcHrHs,6484
28
124
  synth_ai/cli/watch.py,sha256=HBKbAcpUkkPhGvsPRofckbu8oILiVqp35NXHkIEpTTc,17808
29
125
  synth_ai/compound/cais.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
@@ -237,7 +333,6 @@ synth_ai/environments/examples/sokoban/engine_helpers/vendored/envs/sokoban_env_
237
333
  synth_ai/environments/examples/sokoban/engine_helpers/vendored/envs/sokoban_env_pull.py,sha256=ZCEr6LoSxKvVQzbRGwRBN62RAQPP5jiLoNqI8c4Ij2Q,3808
238
334
  synth_ai/environments/examples/sokoban/engine_helpers/vendored/envs/sokoban_env_two_player.py,sha256=99yZCBsbx3i5Wiuf786TiHQjq2tMEY0OKsOEa-obhXY,3763
239
335
  synth_ai/environments/examples/sokoban/engine_helpers/vendored/envs/sokoban_env_variations.py,sha256=VKMXRVmVdIxfa0q_T5Dfll5HHadc5QHpktRQztEIxGs,15455
240
- synth_ai/environments/examples/sokoban/units/astar_common.py,sha256=4vG-_JrGI-yX8HY22CTY9P3DXPqCV_AHMPwH-flr0Z4,3006
241
336
  synth_ai/environments/examples/tictactoe/__init__.py,sha256=XGoOP8GEGXjG-TI_E_-3b1jOhpGNtl_LmR9G3K59Gig,31
242
337
  synth_ai/environments/examples/tictactoe/engine.py,sha256=B2OYQ3TVi_c75BRy_zHIEWjcTSaO4vnZZQJTo6wFe7k,12430
243
338
  synth_ai/environments/examples/tictactoe/environment.py,sha256=p_ZN5-AyYKUnIJ5Df46fXMlJZ6yRerkvXC9GA1W0Ht8,9336
@@ -374,9 +469,7 @@ synth_ai/task/server.py,sha256=bYrqnwtbGEdI_lieBMslgh-sUwdyzEbbHnmjovrRef8,15187
374
469
  synth_ai/task/tracing_utils.py,sha256=kro--A6BTCVReLMNRX4_v2arLVXYIQNKtn3RDMMrOmE,2400
375
470
  synth_ai/task/validators.py,sha256=IGE9zTjHYXOehwakMkcOAaDLSaHw_0Tp8uzL2ydCZ9U,361
376
471
  synth_ai/task/vendors.py,sha256=zG-qeP2OC1s5kJECZdf02QBvn-v_qHcz-rG0C8Ws0wA,1664
377
- synth_ai/task/apps/__init__.py,sha256=M0DeEhvUhyXh1A_AnVSBXTeJY75c7BVsW0A_1vxL_08,2677
378
- synth_ai/task/apps/grpo_crafter.py,sha256=eCxD9eHYLIkvo4mFhlIY14u-Ipp_zmHj6wvg08Vu58Y,15809
379
- synth_ai/task/apps/math_single_step.py,sha256=jhoArV52jlWxN6HO2XYTnrLC3aWF23G1B9PRVx5LkVM,30278
472
+ synth_ai/task/apps/__init__.py,sha256=yLY31OII4Hbt9ibTj1vmxVCd9JBluCGh6Xgy6biKEIs,4151
380
473
  synth_ai/tracing/__init__.py,sha256=0Yy1YDMe_Duw976yu0HL1cbqPWdZEvtgEdtjDguNvcc,781
381
474
  synth_ai/tracing_v1/__init__.py,sha256=uV6qf8_rJTxRx6tCsXvqnjHhA1mR0im2rANuh0McrHA,930
382
475
  synth_ai/tracing_v3/__init__.py,sha256=9lKM-blbXo6Sk1oBpyYayjMVU43f9Y_35M1OvRynWoU,3251
@@ -440,9 +533,9 @@ synth_ai/v0/tracing_v1/events/manage.py,sha256=ZDXXP-ZwLH9LCsmw7Ru9o55d7bl_diPtJ
440
533
  synth_ai/v0/tracing_v1/events/scope.py,sha256=BuBkhSpVHUJt8iGT9HJZF82rbb88mQcd2vM2shg-w2I,2550
441
534
  synth_ai/v0/tracing_v1/events/store.py,sha256=0342lvAcalyJbVEIzQFaPuMQGgwiFm7M5rE6gr-G0E8,9041
442
535
  synth_ai/zyk/__init__.py,sha256=htVLnzTYQ5rxzYpzSYBm7_o6uNKZ3pB_PrqkBrgTRS4,771
443
- synth_ai-0.2.9.dev3.dist-info/licenses/LICENSE,sha256=ynhjRQUfqA_RdGRATApfFA_fBAy9cno04sLtLUqxVFM,1069
444
- synth_ai-0.2.9.dev3.dist-info/METADATA,sha256=Km3_Hf_1bxFLGaBHdljL_V7Xx9WKKkTRKj29ep7J5p8,5200
445
- synth_ai-0.2.9.dev3.dist-info/WHEEL,sha256=_zCd3N1l69ArxyTb8rzEoP9TpbYXkqRFSNOD5OuxnTs,91
446
- synth_ai-0.2.9.dev3.dist-info/entry_points.txt,sha256=Neq-3bT7TAijjgOIR77pKL-WYg6TWBDeO8pp_nL4vGY,91
447
- synth_ai-0.2.9.dev3.dist-info/top_level.txt,sha256=fBmtZyVHuKaGa29oHBaaUkrUIWTqSpoVMPiVdCDP3k8,9
448
- synth_ai-0.2.9.dev3.dist-info/RECORD,,
536
+ synth_ai-0.2.9.dev5.dist-info/licenses/LICENSE,sha256=ynhjRQUfqA_RdGRATApfFA_fBAy9cno04sLtLUqxVFM,1069
537
+ synth_ai-0.2.9.dev5.dist-info/METADATA,sha256=-GRGwjAZPLUJpTxbLEiu-B_fZtBPodHuem1ySlmqiXk,5200
538
+ synth_ai-0.2.9.dev5.dist-info/WHEEL,sha256=_zCd3N1l69ArxyTb8rzEoP9TpbYXkqRFSNOD5OuxnTs,91
539
+ synth_ai-0.2.9.dev5.dist-info/entry_points.txt,sha256=Neq-3bT7TAijjgOIR77pKL-WYg6TWBDeO8pp_nL4vGY,91
540
+ synth_ai-0.2.9.dev5.dist-info/top_level.txt,sha256=1moNHgctEUJ3F3eH3V-7FSMb2iTTze1V13dj1R04oUY,18
541
+ synth_ai-0.2.9.dev5.dist-info/RECORD,,
@@ -1,95 +0,0 @@
1
- """
2
- astar_common.py – one A* routine usable by both engine-level and
3
- environment-level unit tests.
4
- """
5
-
6
- import heapq
7
- import itertools
8
- import json
9
- from typing import Any, Awaitable, Callable, List, Tuple
10
-
11
- import numpy as np
12
-
13
-
14
- # ---------- generic utilities ------------------------------------ #
15
- def _boxes_left(env_pkg) -> int:
16
- """#targets – #boxes-on-targets (uses raw grids, never the counter)."""
17
- return int(np.sum(env_pkg.room_fixed == 2) - np.sum(env_pkg.room_state == 3))
18
-
19
-
20
- def solved(obj: Any) -> bool:
21
- """Expects obj to have a .package_sokoban_env attribute."""
22
- return _boxes_left(obj.package_sokoban_env) == 0
23
-
24
-
25
- def heuristic(obj: Any) -> int:
26
- """Expects obj to have a .package_sokoban_env attribute."""
27
- return _boxes_left(obj.package_sokoban_env)
28
-
29
-
30
- # ---------- single reusable A* ----------------------------------- #
31
- async def astar(
32
- root_obj: Any,
33
- step_fn: Callable[[Any, int], Awaitable[None]],
34
- deserialize_fn: Callable[[Any], Awaitable[Any]],
35
- max_nodes: int = 1000,
36
- ) -> List[int]:
37
- """
38
- Generic A* over Sokoban snapshots.
39
-
40
- • `root_obj` - current engine *or* environment
41
- • `step_fn(obj, action)` - async: apply one move to *obj*
42
- • `deserialize_fn(snapshot)` - async: new obj from snapshot
43
- """
44
- start_snap = await root_obj._serialize_engine()
45
-
46
- frontier: List[Tuple[int, int, Any, List[int]]] = []
47
- counter = itertools.count()
48
- frontier.append((heuristic(root_obj), next(counter), start_snap, []))
49
- seen: set[str] = set()
50
-
51
- nodes = 0
52
- while frontier and nodes < max_nodes:
53
- f, _, snap, path = heapq.heappop(frontier)
54
- cur = await deserialize_fn(snap)
55
- key = json.dumps(snap.engine_snapshot, sort_keys=True)
56
- if key in seen:
57
- continue
58
- seen.add(key)
59
- if solved(cur):
60
- return path
61
-
62
- nodes += 1
63
- for action in range(cur.package_sokoban_env.action_space.n):
64
- child = await deserialize_fn(snap) # fresh copy
65
- try:
66
- await step_fn(child, action)
67
- except Exception: # illegal/off-board
68
- continue
69
-
70
- child_snap = await child._serialize_engine()
71
- g = len(path) + 1
72
- heapq.heappush(
73
- frontier,
74
- (g + heuristic(child), next(counter), child_snap, path + [action]),
75
- )
76
- return []
77
-
78
-
79
- # convenience lambdas for the two concrete APIs
80
- async def _engine_step(e, a): # `SokobanEngine`
81
- await e._step_engine(a)
82
-
83
-
84
- async def _env_step(env, a): # `SokobanEnvironment` (expects Move wrapper)
85
- from synth_ai.environments.examples.sokoban.units.test_sokoban_environment import Move
86
-
87
- await env.step([[Move(a)]])
88
-
89
-
90
- ENGINE_ASTAR = lambda eng, **kw: astar(eng, _engine_step, eng.__class__._deserialize_engine, **kw)
91
- ENV_ASTAR = lambda env, **kw: astar(
92
- env.engine, _env_step, env.engine.__class__._deserialize_engine, **kw
93
- )
94
-
95
- # ----------------------------------------------------------------- #