torchrl 0.11.0__cp314-cp314-macosx_11_0_arm64.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (395) hide show
  1. benchmarks/benchmark_batched_envs.py +104 -0
  2. benchmarks/conftest.py +91 -0
  3. benchmarks/ecosystem/gym_env_throughput.py +321 -0
  4. benchmarks/ecosystem/vmas_rllib_vs_torchrl_sampling_performance.py +231 -0
  5. benchmarks/requirements.txt +7 -0
  6. benchmarks/storage/benchmark_sample_latency_over_rpc.py +193 -0
  7. benchmarks/test_collectors_benchmark.py +240 -0
  8. benchmarks/test_compressed_storage_benchmark.py +145 -0
  9. benchmarks/test_envs_benchmark.py +133 -0
  10. benchmarks/test_llm.py +101 -0
  11. benchmarks/test_non_tensor_env_benchmark.py +70 -0
  12. benchmarks/test_objectives_benchmarks.py +1199 -0
  13. benchmarks/test_replaybuffer_benchmark.py +254 -0
  14. sota-check/README.md +35 -0
  15. sota-implementations/README.md +142 -0
  16. sota-implementations/a2c/README.md +39 -0
  17. sota-implementations/a2c/a2c_atari.py +291 -0
  18. sota-implementations/a2c/a2c_mujoco.py +273 -0
  19. sota-implementations/a2c/utils_atari.py +240 -0
  20. sota-implementations/a2c/utils_mujoco.py +160 -0
  21. sota-implementations/bandits/README.md +7 -0
  22. sota-implementations/bandits/dqn.py +126 -0
  23. sota-implementations/cql/cql_offline.py +198 -0
  24. sota-implementations/cql/cql_online.py +249 -0
  25. sota-implementations/cql/discrete_cql_offline.py +180 -0
  26. sota-implementations/cql/discrete_cql_online.py +227 -0
  27. sota-implementations/cql/utils.py +471 -0
  28. sota-implementations/crossq/crossq.py +271 -0
  29. sota-implementations/crossq/utils.py +320 -0
  30. sota-implementations/ddpg/ddpg.py +231 -0
  31. sota-implementations/ddpg/utils.py +325 -0
  32. sota-implementations/decision_transformer/dt.py +163 -0
  33. sota-implementations/decision_transformer/lamb.py +167 -0
  34. sota-implementations/decision_transformer/online_dt.py +178 -0
  35. sota-implementations/decision_transformer/utils.py +562 -0
  36. sota-implementations/discrete_sac/discrete_sac.py +243 -0
  37. sota-implementations/discrete_sac/utils.py +324 -0
  38. sota-implementations/dqn/README.md +30 -0
  39. sota-implementations/dqn/dqn_atari.py +272 -0
  40. sota-implementations/dqn/dqn_cartpole.py +236 -0
  41. sota-implementations/dqn/utils_atari.py +132 -0
  42. sota-implementations/dqn/utils_cartpole.py +90 -0
  43. sota-implementations/dreamer/README.md +129 -0
  44. sota-implementations/dreamer/dreamer.py +586 -0
  45. sota-implementations/dreamer/dreamer_utils.py +1107 -0
  46. sota-implementations/expert-iteration/README.md +352 -0
  47. sota-implementations/expert-iteration/ei_utils.py +770 -0
  48. sota-implementations/expert-iteration/expert-iteration-async.py +512 -0
  49. sota-implementations/expert-iteration/expert-iteration-sync.py +508 -0
  50. sota-implementations/expert-iteration/requirements_gsm8k.txt +13 -0
  51. sota-implementations/expert-iteration/requirements_ifeval.txt +16 -0
  52. sota-implementations/gail/gail.py +327 -0
  53. sota-implementations/gail/gail_utils.py +68 -0
  54. sota-implementations/gail/ppo_utils.py +157 -0
  55. sota-implementations/grpo/README.md +273 -0
  56. sota-implementations/grpo/grpo-async.py +437 -0
  57. sota-implementations/grpo/grpo-sync.py +435 -0
  58. sota-implementations/grpo/grpo_utils.py +843 -0
  59. sota-implementations/grpo/requirements_gsm8k.txt +11 -0
  60. sota-implementations/grpo/requirements_ifeval.txt +16 -0
  61. sota-implementations/impala/README.md +33 -0
  62. sota-implementations/impala/impala_multi_node_ray.py +292 -0
  63. sota-implementations/impala/impala_multi_node_submitit.py +284 -0
  64. sota-implementations/impala/impala_single_node.py +261 -0
  65. sota-implementations/impala/utils.py +184 -0
  66. sota-implementations/iql/discrete_iql.py +230 -0
  67. sota-implementations/iql/iql_offline.py +164 -0
  68. sota-implementations/iql/iql_online.py +225 -0
  69. sota-implementations/iql/utils.py +437 -0
  70. sota-implementations/multiagent/README.md +74 -0
  71. sota-implementations/multiagent/iql.py +237 -0
  72. sota-implementations/multiagent/maddpg_iddpg.py +266 -0
  73. sota-implementations/multiagent/mappo_ippo.py +267 -0
  74. sota-implementations/multiagent/qmix_vdn.py +271 -0
  75. sota-implementations/multiagent/sac.py +337 -0
  76. sota-implementations/multiagent/utils/__init__.py +4 -0
  77. sota-implementations/multiagent/utils/logging.py +151 -0
  78. sota-implementations/multiagent/utils/utils.py +43 -0
  79. sota-implementations/ppo/README.md +29 -0
  80. sota-implementations/ppo/ppo_atari.py +305 -0
  81. sota-implementations/ppo/ppo_mujoco.py +293 -0
  82. sota-implementations/ppo/utils_atari.py +238 -0
  83. sota-implementations/ppo/utils_mujoco.py +152 -0
  84. sota-implementations/ppo_trainer/train.py +21 -0
  85. sota-implementations/redq/README.md +7 -0
  86. sota-implementations/redq/redq.py +199 -0
  87. sota-implementations/redq/utils.py +1060 -0
  88. sota-implementations/sac/sac-async.py +266 -0
  89. sota-implementations/sac/sac.py +239 -0
  90. sota-implementations/sac/utils.py +381 -0
  91. sota-implementations/sac_trainer/train.py +16 -0
  92. sota-implementations/td3/td3.py +254 -0
  93. sota-implementations/td3/utils.py +319 -0
  94. sota-implementations/td3_bc/td3_bc.py +177 -0
  95. sota-implementations/td3_bc/utils.py +251 -0
  96. torchrl/.dylibs/libc++.1.0.dylib +0 -0
  97. torchrl/__init__.py +144 -0
  98. torchrl/_extension.py +74 -0
  99. torchrl/_torchrl.cpython-314-darwin.so +0 -0
  100. torchrl/_utils.py +1431 -0
  101. torchrl/collectors/__init__.py +48 -0
  102. torchrl/collectors/_base.py +1058 -0
  103. torchrl/collectors/_constants.py +88 -0
  104. torchrl/collectors/_multi_async.py +324 -0
  105. torchrl/collectors/_multi_base.py +1805 -0
  106. torchrl/collectors/_multi_sync.py +464 -0
  107. torchrl/collectors/_runner.py +581 -0
  108. torchrl/collectors/_single.py +2009 -0
  109. torchrl/collectors/_single_async.py +259 -0
  110. torchrl/collectors/collectors.py +62 -0
  111. torchrl/collectors/distributed/__init__.py +32 -0
  112. torchrl/collectors/distributed/default_configs.py +133 -0
  113. torchrl/collectors/distributed/generic.py +1306 -0
  114. torchrl/collectors/distributed/ray.py +1092 -0
  115. torchrl/collectors/distributed/rpc.py +1006 -0
  116. torchrl/collectors/distributed/sync.py +731 -0
  117. torchrl/collectors/distributed/utils.py +160 -0
  118. torchrl/collectors/llm/__init__.py +10 -0
  119. torchrl/collectors/llm/base.py +494 -0
  120. torchrl/collectors/llm/ray_collector.py +275 -0
  121. torchrl/collectors/llm/utils.py +36 -0
  122. torchrl/collectors/llm/weight_update/__init__.py +10 -0
  123. torchrl/collectors/llm/weight_update/vllm.py +348 -0
  124. torchrl/collectors/llm/weight_update/vllm_v2.py +311 -0
  125. torchrl/collectors/utils.py +433 -0
  126. torchrl/collectors/weight_update.py +591 -0
  127. torchrl/csrc/numpy_utils.h +38 -0
  128. torchrl/csrc/pybind.cpp +27 -0
  129. torchrl/csrc/segment_tree.h +458 -0
  130. torchrl/csrc/torch_utils.h +34 -0
  131. torchrl/csrc/utils.cpp +48 -0
  132. torchrl/csrc/utils.h +31 -0
  133. torchrl/data/__init__.py +187 -0
  134. torchrl/data/datasets/__init__.py +58 -0
  135. torchrl/data/datasets/atari_dqn.py +878 -0
  136. torchrl/data/datasets/common.py +281 -0
  137. torchrl/data/datasets/d4rl.py +489 -0
  138. torchrl/data/datasets/d4rl_infos.py +187 -0
  139. torchrl/data/datasets/gen_dgrl.py +375 -0
  140. torchrl/data/datasets/minari_data.py +643 -0
  141. torchrl/data/datasets/openml.py +177 -0
  142. torchrl/data/datasets/openx.py +798 -0
  143. torchrl/data/datasets/roboset.py +363 -0
  144. torchrl/data/datasets/utils.py +11 -0
  145. torchrl/data/datasets/vd4rl.py +432 -0
  146. torchrl/data/llm/__init__.py +34 -0
  147. torchrl/data/llm/dataset.py +491 -0
  148. torchrl/data/llm/history.py +1378 -0
  149. torchrl/data/llm/prompt.py +198 -0
  150. torchrl/data/llm/reward.py +225 -0
  151. torchrl/data/llm/topk.py +186 -0
  152. torchrl/data/llm/utils.py +543 -0
  153. torchrl/data/map/__init__.py +21 -0
  154. torchrl/data/map/hash.py +185 -0
  155. torchrl/data/map/query.py +204 -0
  156. torchrl/data/map/tdstorage.py +363 -0
  157. torchrl/data/map/tree.py +1434 -0
  158. torchrl/data/map/utils.py +103 -0
  159. torchrl/data/postprocs/__init__.py +8 -0
  160. torchrl/data/postprocs/postprocs.py +391 -0
  161. torchrl/data/replay_buffers/__init__.py +99 -0
  162. torchrl/data/replay_buffers/checkpointers.py +622 -0
  163. torchrl/data/replay_buffers/ray_buffer.py +292 -0
  164. torchrl/data/replay_buffers/replay_buffers.py +2376 -0
  165. torchrl/data/replay_buffers/samplers.py +2578 -0
  166. torchrl/data/replay_buffers/scheduler.py +265 -0
  167. torchrl/data/replay_buffers/storages.py +2412 -0
  168. torchrl/data/replay_buffers/utils.py +1042 -0
  169. torchrl/data/replay_buffers/writers.py +781 -0
  170. torchrl/data/tensor_specs.py +7101 -0
  171. torchrl/data/utils.py +334 -0
  172. torchrl/envs/__init__.py +265 -0
  173. torchrl/envs/async_envs.py +1105 -0
  174. torchrl/envs/batched_envs.py +3093 -0
  175. torchrl/envs/common.py +4241 -0
  176. torchrl/envs/custom/__init__.py +11 -0
  177. torchrl/envs/custom/chess.py +617 -0
  178. torchrl/envs/custom/llm.py +214 -0
  179. torchrl/envs/custom/pendulum.py +401 -0
  180. torchrl/envs/custom/san_moves.txt +29274 -0
  181. torchrl/envs/custom/tictactoeenv.py +288 -0
  182. torchrl/envs/env_creator.py +263 -0
  183. torchrl/envs/gym_like.py +752 -0
  184. torchrl/envs/libs/__init__.py +68 -0
  185. torchrl/envs/libs/_gym_utils.py +326 -0
  186. torchrl/envs/libs/brax.py +846 -0
  187. torchrl/envs/libs/dm_control.py +544 -0
  188. torchrl/envs/libs/envpool.py +447 -0
  189. torchrl/envs/libs/gym.py +2239 -0
  190. torchrl/envs/libs/habitat.py +138 -0
  191. torchrl/envs/libs/isaac_lab.py +87 -0
  192. torchrl/envs/libs/isaacgym.py +203 -0
  193. torchrl/envs/libs/jax_utils.py +166 -0
  194. torchrl/envs/libs/jumanji.py +963 -0
  195. torchrl/envs/libs/meltingpot.py +599 -0
  196. torchrl/envs/libs/openml.py +153 -0
  197. torchrl/envs/libs/openspiel.py +652 -0
  198. torchrl/envs/libs/pettingzoo.py +1042 -0
  199. torchrl/envs/libs/procgen.py +351 -0
  200. torchrl/envs/libs/robohive.py +429 -0
  201. torchrl/envs/libs/smacv2.py +645 -0
  202. torchrl/envs/libs/unity_mlagents.py +891 -0
  203. torchrl/envs/libs/utils.py +147 -0
  204. torchrl/envs/libs/vmas.py +813 -0
  205. torchrl/envs/llm/__init__.py +63 -0
  206. torchrl/envs/llm/chat.py +730 -0
  207. torchrl/envs/llm/datasets/README.md +4 -0
  208. torchrl/envs/llm/datasets/__init__.py +17 -0
  209. torchrl/envs/llm/datasets/gsm8k.py +353 -0
  210. torchrl/envs/llm/datasets/ifeval.py +274 -0
  211. torchrl/envs/llm/envs.py +789 -0
  212. torchrl/envs/llm/libs/README.md +3 -0
  213. torchrl/envs/llm/libs/__init__.py +8 -0
  214. torchrl/envs/llm/libs/mlgym.py +869 -0
  215. torchrl/envs/llm/reward/__init__.py +10 -0
  216. torchrl/envs/llm/reward/gsm8k.py +324 -0
  217. torchrl/envs/llm/reward/ifeval/README.md +13 -0
  218. torchrl/envs/llm/reward/ifeval/__init__.py +10 -0
  219. torchrl/envs/llm/reward/ifeval/_instructions.py +1667 -0
  220. torchrl/envs/llm/reward/ifeval/_instructions_main.py +131 -0
  221. torchrl/envs/llm/reward/ifeval/_instructions_registry.py +100 -0
  222. torchrl/envs/llm/reward/ifeval/_instructions_util.py +1677 -0
  223. torchrl/envs/llm/reward/ifeval/_scorer.py +454 -0
  224. torchrl/envs/llm/transforms/__init__.py +55 -0
  225. torchrl/envs/llm/transforms/browser.py +292 -0
  226. torchrl/envs/llm/transforms/dataloading.py +859 -0
  227. torchrl/envs/llm/transforms/format.py +73 -0
  228. torchrl/envs/llm/transforms/kl.py +1544 -0
  229. torchrl/envs/llm/transforms/policy_version.py +189 -0
  230. torchrl/envs/llm/transforms/reason.py +323 -0
  231. torchrl/envs/llm/transforms/tokenizer.py +321 -0
  232. torchrl/envs/llm/transforms/tools.py +1955 -0
  233. torchrl/envs/model_based/__init__.py +9 -0
  234. torchrl/envs/model_based/common.py +180 -0
  235. torchrl/envs/model_based/dreamer.py +112 -0
  236. torchrl/envs/transforms/__init__.py +147 -0
  237. torchrl/envs/transforms/functional.py +48 -0
  238. torchrl/envs/transforms/gym_transforms.py +203 -0
  239. torchrl/envs/transforms/module.py +341 -0
  240. torchrl/envs/transforms/r3m.py +372 -0
  241. torchrl/envs/transforms/ray_service.py +663 -0
  242. torchrl/envs/transforms/rb_transforms.py +214 -0
  243. torchrl/envs/transforms/transforms.py +11835 -0
  244. torchrl/envs/transforms/utils.py +94 -0
  245. torchrl/envs/transforms/vc1.py +307 -0
  246. torchrl/envs/transforms/vecnorm.py +845 -0
  247. torchrl/envs/transforms/vip.py +407 -0
  248. torchrl/envs/utils.py +1718 -0
  249. torchrl/envs/vec_envs.py +11 -0
  250. torchrl/modules/__init__.py +206 -0
  251. torchrl/modules/distributions/__init__.py +73 -0
  252. torchrl/modules/distributions/continuous.py +830 -0
  253. torchrl/modules/distributions/discrete.py +908 -0
  254. torchrl/modules/distributions/truncated_normal.py +187 -0
  255. torchrl/modules/distributions/utils.py +233 -0
  256. torchrl/modules/llm/__init__.py +62 -0
  257. torchrl/modules/llm/backends/__init__.py +65 -0
  258. torchrl/modules/llm/backends/vllm/__init__.py +94 -0
  259. torchrl/modules/llm/backends/vllm/_models.py +46 -0
  260. torchrl/modules/llm/backends/vllm/base.py +72 -0
  261. torchrl/modules/llm/backends/vllm/vllm_async.py +2075 -0
  262. torchrl/modules/llm/backends/vllm/vllm_plugin.py +22 -0
  263. torchrl/modules/llm/backends/vllm/vllm_sync.py +446 -0
  264. torchrl/modules/llm/backends/vllm/vllm_utils.py +129 -0
  265. torchrl/modules/llm/policies/__init__.py +28 -0
  266. torchrl/modules/llm/policies/common.py +1809 -0
  267. torchrl/modules/llm/policies/transformers_wrapper.py +2756 -0
  268. torchrl/modules/llm/policies/vllm_wrapper.py +2241 -0
  269. torchrl/modules/llm/utils.py +23 -0
  270. torchrl/modules/mcts/__init__.py +21 -0
  271. torchrl/modules/mcts/scores.py +579 -0
  272. torchrl/modules/models/__init__.py +86 -0
  273. torchrl/modules/models/batchrenorm.py +119 -0
  274. torchrl/modules/models/decision_transformer.py +179 -0
  275. torchrl/modules/models/exploration.py +731 -0
  276. torchrl/modules/models/llm.py +156 -0
  277. torchrl/modules/models/model_based.py +596 -0
  278. torchrl/modules/models/models.py +1712 -0
  279. torchrl/modules/models/multiagent.py +1067 -0
  280. torchrl/modules/models/recipes/impala.py +185 -0
  281. torchrl/modules/models/utils.py +162 -0
  282. torchrl/modules/planners/__init__.py +10 -0
  283. torchrl/modules/planners/cem.py +228 -0
  284. torchrl/modules/planners/common.py +73 -0
  285. torchrl/modules/planners/mppi.py +265 -0
  286. torchrl/modules/tensordict_module/__init__.py +89 -0
  287. torchrl/modules/tensordict_module/actors.py +2457 -0
  288. torchrl/modules/tensordict_module/common.py +529 -0
  289. torchrl/modules/tensordict_module/exploration.py +814 -0
  290. torchrl/modules/tensordict_module/probabilistic.py +321 -0
  291. torchrl/modules/tensordict_module/rnn.py +1639 -0
  292. torchrl/modules/tensordict_module/sequence.py +132 -0
  293. torchrl/modules/tensordict_module/world_models.py +34 -0
  294. torchrl/modules/utils/__init__.py +38 -0
  295. torchrl/modules/utils/mappings.py +9 -0
  296. torchrl/modules/utils/utils.py +89 -0
  297. torchrl/objectives/__init__.py +78 -0
  298. torchrl/objectives/a2c.py +659 -0
  299. torchrl/objectives/common.py +753 -0
  300. torchrl/objectives/cql.py +1346 -0
  301. torchrl/objectives/crossq.py +710 -0
  302. torchrl/objectives/ddpg.py +453 -0
  303. torchrl/objectives/decision_transformer.py +371 -0
  304. torchrl/objectives/deprecated.py +516 -0
  305. torchrl/objectives/dqn.py +683 -0
  306. torchrl/objectives/dreamer.py +488 -0
  307. torchrl/objectives/functional.py +48 -0
  308. torchrl/objectives/gail.py +258 -0
  309. torchrl/objectives/iql.py +996 -0
  310. torchrl/objectives/llm/__init__.py +30 -0
  311. torchrl/objectives/llm/grpo.py +846 -0
  312. torchrl/objectives/llm/sft.py +482 -0
  313. torchrl/objectives/multiagent/__init__.py +8 -0
  314. torchrl/objectives/multiagent/qmixer.py +396 -0
  315. torchrl/objectives/ppo.py +1669 -0
  316. torchrl/objectives/redq.py +683 -0
  317. torchrl/objectives/reinforce.py +530 -0
  318. torchrl/objectives/sac.py +1580 -0
  319. torchrl/objectives/td3.py +570 -0
  320. torchrl/objectives/td3_bc.py +625 -0
  321. torchrl/objectives/utils.py +782 -0
  322. torchrl/objectives/value/__init__.py +28 -0
  323. torchrl/objectives/value/advantages.py +1956 -0
  324. torchrl/objectives/value/functional.py +1459 -0
  325. torchrl/objectives/value/utils.py +360 -0
  326. torchrl/record/__init__.py +17 -0
  327. torchrl/record/loggers/__init__.py +23 -0
  328. torchrl/record/loggers/common.py +48 -0
  329. torchrl/record/loggers/csv.py +226 -0
  330. torchrl/record/loggers/mlflow.py +142 -0
  331. torchrl/record/loggers/tensorboard.py +139 -0
  332. torchrl/record/loggers/trackio.py +163 -0
  333. torchrl/record/loggers/utils.py +78 -0
  334. torchrl/record/loggers/wandb.py +214 -0
  335. torchrl/record/recorder.py +554 -0
  336. torchrl/services/__init__.py +79 -0
  337. torchrl/services/base.py +109 -0
  338. torchrl/services/ray_service.py +453 -0
  339. torchrl/testing/__init__.py +107 -0
  340. torchrl/testing/assertions.py +179 -0
  341. torchrl/testing/dist_utils.py +122 -0
  342. torchrl/testing/env_creators.py +227 -0
  343. torchrl/testing/env_helper.py +35 -0
  344. torchrl/testing/gym_helpers.py +156 -0
  345. torchrl/testing/llm_mocks.py +119 -0
  346. torchrl/testing/mocking_classes.py +2720 -0
  347. torchrl/testing/modules.py +295 -0
  348. torchrl/testing/mp_helpers.py +15 -0
  349. torchrl/testing/ray_helpers.py +293 -0
  350. torchrl/testing/utils.py +190 -0
  351. torchrl/trainers/__init__.py +42 -0
  352. torchrl/trainers/algorithms/__init__.py +11 -0
  353. torchrl/trainers/algorithms/configs/__init__.py +705 -0
  354. torchrl/trainers/algorithms/configs/collectors.py +216 -0
  355. torchrl/trainers/algorithms/configs/common.py +41 -0
  356. torchrl/trainers/algorithms/configs/data.py +308 -0
  357. torchrl/trainers/algorithms/configs/envs.py +104 -0
  358. torchrl/trainers/algorithms/configs/envs_libs.py +361 -0
  359. torchrl/trainers/algorithms/configs/logging.py +80 -0
  360. torchrl/trainers/algorithms/configs/modules.py +570 -0
  361. torchrl/trainers/algorithms/configs/objectives.py +177 -0
  362. torchrl/trainers/algorithms/configs/trainers.py +340 -0
  363. torchrl/trainers/algorithms/configs/transforms.py +955 -0
  364. torchrl/trainers/algorithms/configs/utils.py +252 -0
  365. torchrl/trainers/algorithms/configs/weight_sync_schemes.py +191 -0
  366. torchrl/trainers/algorithms/configs/weight_update.py +159 -0
  367. torchrl/trainers/algorithms/ppo.py +373 -0
  368. torchrl/trainers/algorithms/sac.py +308 -0
  369. torchrl/trainers/helpers/__init__.py +40 -0
  370. torchrl/trainers/helpers/collectors.py +416 -0
  371. torchrl/trainers/helpers/envs.py +573 -0
  372. torchrl/trainers/helpers/logger.py +33 -0
  373. torchrl/trainers/helpers/losses.py +132 -0
  374. torchrl/trainers/helpers/models.py +658 -0
  375. torchrl/trainers/helpers/replay_buffer.py +59 -0
  376. torchrl/trainers/helpers/trainers.py +301 -0
  377. torchrl/trainers/trainers.py +2052 -0
  378. torchrl/weight_update/__init__.py +33 -0
  379. torchrl/weight_update/_distributed.py +749 -0
  380. torchrl/weight_update/_mp.py +624 -0
  381. torchrl/weight_update/_noupdate.py +102 -0
  382. torchrl/weight_update/_ray.py +1032 -0
  383. torchrl/weight_update/_rpc.py +284 -0
  384. torchrl/weight_update/_shared.py +891 -0
  385. torchrl/weight_update/llm/__init__.py +32 -0
  386. torchrl/weight_update/llm/vllm_double_buffer.py +370 -0
  387. torchrl/weight_update/llm/vllm_nccl.py +710 -0
  388. torchrl/weight_update/utils.py +73 -0
  389. torchrl/weight_update/weight_sync_schemes.py +1244 -0
  390. torchrl-0.11.0.dist-info/METADATA +1308 -0
  391. torchrl-0.11.0.dist-info/RECORD +395 -0
  392. torchrl-0.11.0.dist-info/WHEEL +5 -0
  393. torchrl-0.11.0.dist-info/entry_points.txt +2 -0
  394. torchrl-0.11.0.dist-info/licenses/LICENSE +21 -0
  395. torchrl-0.11.0.dist-info/top_level.txt +7 -0
@@ -0,0 +1,395 @@
1
+ sota-implementations/README.md,sha256=TfddOyaN0oMdok03QQc1L3zld1D8bWNfFx6cyKT0mQQ,3620
2
+ sota-implementations/gail/gail_utils.py,sha256=0S5gLw1a5v2I5Z0XiPcRLSvhSwmnHQuBFrzR7j1_qcE,2118
3
+ sota-implementations/gail/ppo_utils.py,sha256=mvLxsBQBeBBgzjw_TgeUuS9WjgJpjs84V4tIsGyXYhI,4919
4
+ sota-implementations/gail/gail.py,sha256=tJmOrCIFEvaWSryJ3q2zpiTtJf31ZIYCKPmC5KBPwZ0,11268
5
+ sota-implementations/multiagent/mappo_ippo.py,sha256=bjwjvYO5F2tXRAPf7-phr-t9VQ1_GV93mn_aJ6coJXQ,8944
6
+ sota-implementations/multiagent/qmix_vdn.py,sha256=IWQZFFd8oV0iIffmayUrLnZym-EnRytUp8YNPBcg0Lg,9302
7
+ sota-implementations/multiagent/iql.py,sha256=1vO1C45W7JyzdWSkMppk0gtf79AGglbjCYHvI2rRqIc,7997
8
+ sota-implementations/multiagent/README.md,sha256=9YbB6xfP-FnECr-8Uz-okaOPHemEgqk6rWx8p3uq2cM,2487
9
+ sota-implementations/multiagent/sac.py,sha256=dufk3wivxoBp1yNJa9TOAkAtuRhpw5H0snSAgTjfLHo,11914
10
+ sota-implementations/multiagent/maddpg_iddpg.py,sha256=oTtXjdVVgqIgZveRqcZeZDC4-6vSND_it8kY-gIFrRc,9002
11
+ sota-implementations/multiagent/utils/logging.py,sha256=jnBCT-W7JClKUUAaT_weCzzx-ql5YPPIHdPVvNM7ShI,5198
12
+ sota-implementations/multiagent/utils/__init__.py,sha256=D9ECsap08rcUtHyaR111nTjArlKkUjQwP8usXwXAAVQ,179
13
+ sota-implementations/multiagent/utils/utils.py,sha256=qQnVturblIRQ_QVyttz3vF_LE4sh471foOK7WqZebfk,1317
14
+ sota-implementations/sac/sac-async.py,sha256=fJEk3g79fMxqr7SdjApfRhylCfm_OsCLKM52e2GJGSg,9231
15
+ sota-implementations/sac/sac.py,sha256=f0rLmI0xfoqOJNSRm2yxqdZ6C5SvAT4XD0cuZbz0z_w,7995
16
+ sota-implementations/sac/utils.py,sha256=HPt8uiqQK5CSRyVcFOwDaqPgsNUeLBcmQrKn7QC6Pbc,11113
17
+ sota-implementations/bandits/README.md,sha256=QhO8uHi1cBMeHnGO0A6xDwVbaJSlBS1rR0J4qd64s-M,393
18
+ sota-implementations/bandits/dqn.py,sha256=TNgKK9ND25mZWxqZG76OxBosVt6jq0zbc0x7IRK8tX4,4199
19
+ sota-implementations/discrete_sac/discrete_sac.py,sha256=H8c3KoEFqW1fidJbhNvOwC7ODDMuUYn9Y8bdpDC9cN4,7966
20
+ sota-implementations/discrete_sac/utils.py,sha256=QUWxf8YyM47sgtT2CVcXCGxvCeYoQ-Pjx-kgZDnzOyY,9196
21
+ sota-implementations/cql/cql_offline.py,sha256=fLdWlrFwMIL5DcYwcaAfO89NfmNJisbQwTxFK5mymSQ,6209
22
+ sota-implementations/cql/discrete_cql_online.py,sha256=XxM58bzn6f-31vSSheDuKVRpBCATInhAPRGy0naYhwc,7479
23
+ sota-implementations/cql/discrete_cql_offline.py,sha256=hYvqM-Zcyi_BJwLnFIO4ylKMYXn0SulT2JtdLjjqb0Y,5692
24
+ sota-implementations/cql/cql_online.py,sha256=hrCFhlwl93YyHewOEA9j_7AtsM4VRX57pysOqLtCZ_0,8422
25
+ sota-implementations/cql/utils.py,sha256=dgjR87jcprVzChOK_WtspMLRBrihQO_2GpfFwR2R2O4,13623
26
+ sota-implementations/ppo_trainer/train.py,sha256=xsgAWgamxxG1_Oa1CmT0I8Fx5ZxDWvAzn76d1V8ynjE,646
27
+ sota-implementations/iql/discrete_iql.py,sha256=pszUITbviD8AjtT2_zoSykHb3fKEY-I_UftgBytze8s,7880
28
+ sota-implementations/iql/iql_online.py,sha256=ZoFYyrK7TCoCBvpXObWMM8zyTKsrmIfxOfUM9JH3Hro,7617
29
+ sota-implementations/iql/iql_offline.py,sha256=mMFzs9tU6vOCDc0Ofw1G66VV2eTWUy1fLJBccuJrhKA,5009
30
+ sota-implementations/iql/utils.py,sha256=28WjY29Rd7fMYAzog_US9Vm6JihGOruCt9B_NqTSfJ8,12636
31
+ sota-implementations/ddpg/utils.py,sha256=R_mUCNwjN_90zlaUde4aVjY1xkYluFMqIXok0dwvXp8,8834
32
+ sota-implementations/ddpg/ddpg.py,sha256=33wRTzd4uR1EPXO1SNRnLoA_fxWHo7tk7KB-Fy45few,7530
33
+ sota-implementations/impala/impala_multi_node_ray.py,sha256=a0ofL4FKNeA-ItjcodylLwS3RD0W6R2EIfjGEWKfU3Y,10411
34
+ sota-implementations/impala/impala_single_node.py,sha256=ofXkZKZd6ePYNglQfjSmKmekXZDTed-8q_JjCjRnxpE,8882
35
+ sota-implementations/impala/impala_multi_node_submitit.py,sha256=75m_4E_SJ1kqei4rtDdYnyTdG1KBA00UiZV_WAm4Ceo,9944
36
+ sota-implementations/impala/README.md,sha256=vOHZWML9zqai4-9MHGpDkWuU4UxINz2pRAFqF0jkx2s,1570
37
+ sota-implementations/impala/utils.py,sha256=HBTC-IEzH76BI6Vfk6WxCCuF0r5kc0EbEZ-n6pzsGyE,5383
38
+ sota-implementations/sac_trainer/train.py,sha256=3NWoSmGRx_PgGanwRB4P_naS9-oNiCeKa0ksxr77xnQ,465
39
+ sota-implementations/dqn/dqn_cartpole.py,sha256=a6pUzq8uxBGl-OkwK08DCfL2LW03h-vflwe6hyZIKfQ,8366
40
+ sota-implementations/dqn/dqn_atari.py,sha256=Qz82jsSCP0g6gHUMzdag_XvanyGnPAab_tR11TkA6W4,9213
41
+ sota-implementations/dqn/README.md,sha256=0xdIBDXORRr28rxj_rYJMjw7KcovNrIkFzCxobEQ_Zg,1275
42
+ sota-implementations/dqn/utils_atari.py,sha256=unAZg9v7cvXdNFqVimV79c7q-pYm3tT2wq5vU9zA9q8,4014
43
+ sota-implementations/dqn/utils_cartpole.py,sha256=pw2DNE_jm9SrMd34WGlAAus73LHcWekuf5jFTTQ-C-Y,2841
44
+ sota-implementations/dreamer/dreamer.py,sha256=GT1WdSF6eICP7xjXYrNHsOC6pwGJ4usY6eTV5NPzYFc,24103
45
+ sota-implementations/dreamer/dreamer_utils.py,sha256=62tufz5418hwU88fsrEh5j-19CVvb1m27lfqZIN9dDE,36322
46
+ sota-implementations/dreamer/README.md,sha256=KcgFkne8S0aRHM5yQgBIKQ3wm1Qq7JnSltWESqjBAGU,3910
47
+ sota-implementations/grpo/requirements_gsm8k.txt,sha256=O5LVRsH0IbGebLC6fzSeKZHNSVUhXNVRXbVbNZmpXGM,97
48
+ sota-implementations/grpo/requirements_ifeval.txt,sha256=o2zv-erbS7kZaAKPl0--CvrOSypr8mdASMiUjifsGis,146
49
+ sota-implementations/grpo/grpo-async.py,sha256=PwZ9zKsMUopngJPmjjmPsXI_kEGWOFh3g_dyKivXLkY,15972
50
+ sota-implementations/grpo/README.md,sha256=ElokAa5M_uTBUhsLG30bw7K3rIaPuunWblcYgwCqeu4,11452
51
+ sota-implementations/grpo/grpo_utils.py,sha256=e6cXX6k7lraRkecK3aPc4z_ARLQXCHsY8s-DfHWbap8,31738
52
+ sota-implementations/grpo/grpo-sync.py,sha256=q5ItqoCI5HF0Z8T1630ea9dKfeGifBfG59sn1oGdRbs,16206
53
+ sota-implementations/td3_bc/utils.py,sha256=a4ZCpaIvXDra1UGC8eWS-T099-8OAVr6jsyDvfUN_IY,6700
54
+ sota-implementations/td3_bc/td3_bc.py,sha256=JN-dR6RumXRUhZn4l4fC4c7Q5lanPzFvgbkTyeAdCzk,5694
55
+ sota-implementations/decision_transformer/online_dt.py,sha256=CJQiBcvzinvvzFyjE3pBr8T2ToDhH0paaWFm5GLuJgA,5915
56
+ sota-implementations/decision_transformer/lamb.py,sha256=X2gbswsaTEtvLJKXYyJeIHDFecHwT_OAUX9Eqm-PNNM,7160
57
+ sota-implementations/decision_transformer/dt.py,sha256=7Hy3Bml_KSrJ2bgBq_cSJRvqm70eDL6ijqNVrEdIyag,5191
58
+ sota-implementations/decision_transformer/utils.py,sha256=wygFxa-AILKeqll4r38vXAeD2YQYG69q2HmV0K3B5H4,15847
59
+ sota-implementations/ppo/ppo_mujoco.py,sha256=WVohjWDrq_pvdDJA4yjhsuEYop1xcM6sO2nvytiabks,10535
60
+ sota-implementations/ppo/ppo_atari.py,sha256=BgI97Y_I3mozn53tDam_BU9YgFEYw4HckVhTJfD8tro,10963
61
+ sota-implementations/ppo/README.md,sha256=hTZp2wh2QKSpxatuAGidjvCugecOHs_ekDXskxwvwOo,1409
62
+ sota-implementations/ppo/utils_atari.py,sha256=BZ-CErXGrhSdL6-Rr56ommw7ERxq9gEe7lq8QM_dDoc,6997
63
+ sota-implementations/ppo/utils_mujoco.py,sha256=suK6FOsUShlzCWjWNyE5j35AcYAmhYipbr6ISlAEIjc,4805
64
+ sota-implementations/redq/redq.py,sha256=owdTPZs87LK6Pw4-r_hPX3GxzNNGEp4b8FOgxQsafas,6120
65
+ sota-implementations/redq/README.md,sha256=YOgUjQPKu0etio4HyDeDTdD35ggTQGqupEu-9Y1Jdyk,390
66
+ sota-implementations/redq/utils.py,sha256=Z8gfmnPqVHztFDQNs2o1AefD_OVK3xJy9NTYbX62W_8,39271
67
+ sota-implementations/a2c/a2c_atari.py,sha256=2yhuSimHtmB6OiDi84fGZCDbPzvC73bifFufV2Lsdko,9619
68
+ sota-implementations/a2c/README.md,sha256=pT-PNhZJirOOdz75XG1szO24luDss-jUCNYcpxHXh6g,1732
69
+ sota-implementations/a2c/utils_atari.py,sha256=FmmnZsaTmaqyyHK4JBd4-MIsSEN_gLhm9FVzi_yJUGE,6975
70
+ sota-implementations/a2c/utils_mujoco.py,sha256=98MVXN-7Her1wEWbRwC0JuLWUvUuxefwoW93YLeFyjY,4947
71
+ sota-implementations/a2c/a2c_mujoco.py,sha256=8SBlP8YXoRyUV4grB3CB8D2ecVptoGbu4jL7MBBDcpI,9247
72
+ sota-implementations/expert-iteration/requirements_gsm8k.txt,sha256=eBTywFljWINKBunZgCfi9y3LcAm-iyP9Rg8UtBRRwPI,210
73
+ sota-implementations/expert-iteration/requirements_ifeval.txt,sha256=fUIfErsmY0rE45Th84HlZYccWOOgvtIJiAT0H4bUGVA,261
74
+ sota-implementations/expert-iteration/ei_utils.py,sha256=QkTZ_hpKXRxxsS6N9z7UdDAzp2wX2RM0L3kYwwPwsNE,28828
75
+ sota-implementations/expert-iteration/README.md,sha256=uWRUrKqVGKxrm6Z3L5NsgrQ0B9tvtGxUynBefv_XqqM,13113
76
+ sota-implementations/expert-iteration/expert-iteration-sync.py,sha256=wuo5TFDB73vKEwu5R1_DvYxl7QkFj9eoynByPEBVk2Q,19680
77
+ sota-implementations/expert-iteration/expert-iteration-async.py,sha256=Y1zWCsG_IOtj7yN19WlFaQ_IvcGz82w-EaS7smF_0sY,18667
78
+ sota-implementations/td3/td3.py,sha256=HhN4R8j3d4m9x7LJI3XoVjQrx2PcXnRS0UszK_Kuwxc,8235
79
+ sota-implementations/td3/utils.py,sha256=TJUHQb5GVCEvSzifo4rGvz6GOXzXZtmWVrPBxvddbf4,9242
80
+ sota-implementations/crossq/crossq.py,sha256=ZVxtxhfs4eDog3YIPre2Aug_iAg7FF5TwqXKND69pg4,9257
81
+ sota-implementations/crossq/utils.py,sha256=JWXTCJsOlZN98hSTjCYPuMzr9i8jtN-rkbdeGisMFoo,9259
82
+ sota-check/README.md,sha256=L_klTkIrnZdXp75Yf4lZH1peqkxrnzqAwpUizKnXlkI,1082
83
+ benchmarks/test_replaybuffer_benchmark.py,sha256=XOhG8yXnyTsF38LTtdl6SgV3kycCSmpwXbVuLZ8naKo,8020
84
+ benchmarks/conftest.py,sha256=S0kpR83vOEH0Bj-yf6KWMFD9vakmBVicE6gGLQvEXr0,2623
85
+ benchmarks/test_llm.py,sha256=iSYU0TyvLVrOCfxafb6bF0kmXZIMaVTjm8hkIb1-zIA,3937
86
+ benchmarks/test_collectors_benchmark.py,sha256=33aivFimLu833vVvcpXogA6vInGNsCEBbPlrfA4dlsc,6669
87
+ benchmarks/requirements.txt,sha256=fBZgx705zlfAmC2FhsZTQ_c_XoZHRfFNiLVFo7aTqEQ,67
88
+ benchmarks/test_envs_benchmark.py,sha256=l9nRGGb3GVaNY6Hk5z4mmPcMKch_I_u3kaCrZ2EgVTU,3520
89
+ benchmarks/test_objectives_benchmarks.py,sha256=69B2gm7JmI95Qykb8pB-KoLcYchOcL8ynfxcIF51nZ8,34949
90
+ benchmarks/test_compressed_storage_benchmark.py,sha256=UIYE3aXIBzT-YwSTC5e0rTB5o_ryCmC-rfh9bBA4FGE,5929
91
+ benchmarks/test_non_tensor_env_benchmark.py,sha256=GABZ7xb0ztA2bqxEa8UvtmUjgiKQOO5LF7HkJD38kpM,2343
92
+ benchmarks/benchmark_batched_envs.py,sha256=X2D9IorprtkS182mGzRsB4Pz3h61O-zO2Y4_qKGV1Dk,3704
93
+ benchmarks/ecosystem/gym_env_throughput.py,sha256=NkYgdrXuKOLTOl5JPP5SI2MWJpbJjH25rL96PXGfCk4,13958
94
+ benchmarks/ecosystem/vmas_rllib_vs_torchrl_sampling_performance.py,sha256=vu-aIJBM0RHWSbSAOLUdB7VuGtnYJVDzKCOy4wKeKbs,6727
95
+ benchmarks/storage/benchmark_sample_latency_over_rpc.py,sha256=kF-UaAgZ-3zy2hClUcwtVux4nhgDuQn7jF-SHH51eTs,6332
96
+ torchrl-0.11.0.dist-info/RECORD,,
97
+ torchrl-0.11.0.dist-info/WHEEL,sha256=FZ3JI6wOPuDqrjSonX6g1fWFHrGriKLVhmaSXrY6t8M,110
98
+ torchrl-0.11.0.dist-info/entry_points.txt,sha256=kjqZUboF3jzU21uy15NPn2WDfbwGE21Ls0fmfhqhmy4,110
99
+ torchrl-0.11.0.dist-info/top_level.txt,sha256=niUu8mZaEt1Z9cX9Mv7FQF9PCg3CTjUnjuqLA929JQ0,73
100
+ torchrl-0.11.0.dist-info/METADATA,sha256=9ihqFL4z5gMYuFv7q5fTuHpbUJxBGDy7wiNoFUGlhVo,49197
101
+ torchrl-0.11.0.dist-info/licenses/LICENSE,sha256=xdjS4_xk-IwnLuIFCvTYTl9Y8aXRejqpmke3dGam_nI,1098
102
+ torchrl/_torchrl.cpython-314-darwin.so,sha256=NK0vip_iDB0VybtECrVckQYEXd7InKM2iVT-xleiHPM,801232
103
+ torchrl/__init__.py,sha256=nBf8LoX4OtjRyVJks9JBrAnJW-dSAgNqVuPuebeelNg,3970
104
+ torchrl/_extension.py,sha256=-33spVuVtpcXCeRv5pgZPw87EzYKCisd7TD1es306Yc,3220
105
+ torchrl/_utils.py,sha256=NtlnazPsAjIWBIj_3I737vD590Y8oYVCe8KCf169aJo,47377
106
+ torchrl/csrc/utils.h,sha256=VpghIMsTZz_ZX345Ls4zAyHxMWUd5f5OkHvXYpqSEfQ,1101
107
+ torchrl/csrc/utils.cpp,sha256=8dQb7dRB517Wy_F6FN3s7vm5haBfXAt4Dz16drop4sY,1642
108
+ torchrl/csrc/numpy_utils.h,sha256=Z1rSVRAr1KiUfeidqk600fSxb4lgwlTQGKFcKPdEcO0,921
109
+ torchrl/csrc/torch_utils.h,sha256=QQRvSEWoquBzfsj6xcd7mXL4pPyrccE_ISHvSzw2O8Q,696
110
+ torchrl/csrc/pybind.cpp,sha256=9YJeGIee08tW8ke7QDVN15xmCxKsb0ZcBgWi4_qbW7Q,730
111
+ torchrl/csrc/segment_tree.h,sha256=feyFyCfhybNmbpPrOfoI_EtpfszU6VZQDC8xY8rucxY,17375
112
+ torchrl/weight_update/_noupdate.py,sha256=YjR-YmHQNLOmBJp2dh0-bxqbz2pyuH5E375fPF9oqGA,3001
113
+ torchrl/weight_update/_rpc.py,sha256=mpZu6_R9Apm5JTvDo2nY-MYAu6gUYN5ss8IcqYRDAJI,10584
114
+ torchrl/weight_update/weight_sync_schemes.py,sha256=at9aDYcQcsE2E7VcMlZzzYb0-J2VJG03ePhfA_bYWlU,42591
115
+ torchrl/weight_update/__init__.py,sha256=5Eg3w_n5ONFpaZQxiZ0FR3Fq-8QgiBOjlu9O3mQCEIs,1102
116
+ torchrl/weight_update/_shared.py,sha256=sx5dZBQSD_1itEV3GpMxX0qW2gtIy8OhB6XIw2OFt8A,36623
117
+ torchrl/weight_update/_distributed.py,sha256=iCKVHsol-O3F2cX4iZpTS0S82EAr3g27OH0S77R0m4g,28401
118
+ torchrl/weight_update/utils.py,sha256=dUzSX-EhyaGAgfxuwsy8bAVu0E_rATGwYmxVPqKkgT4,2834
119
+ torchrl/weight_update/_ray.py,sha256=l0TNYG7VhaeDaViM0CVRC07EqTL66MFunAICmxl9rMM,37263
120
+ torchrl/weight_update/_mp.py,sha256=-4DBEm-PBgVlWuuRbw5dnfZfBGktpdM_ZHR9nJVzEMo,26046
121
+ torchrl/weight_update/llm/vllm_nccl.py,sha256=JqOUiBuQu0lxOYHlYU9EPDYllyVTlFzhC6NjZB9RCVg,27020
122
+ torchrl/weight_update/llm/__init__.py,sha256=MeVhykNdsLgZI6_8BrztPuofrgPRvRkTB2wCmT8qNP0,863
123
+ torchrl/weight_update/llm/vllm_double_buffer.py,sha256=dS8NhEKbdeV3x-J-vw-jabfOiyw2YonKENuqIottoJQ,13563
124
+ torchrl/collectors/weight_update.py,sha256=vjp7zOToSBmWXgOy4IWommWYjwfBHZrJd07wRCUsdRU,24580
125
+ torchrl/collectors/_constants.py,sha256=3MU3-Ugjxm_8lmLW_2WDdh_1vhxvkVcbm281YGzLa4g,2729
126
+ torchrl/collectors/_base.py,sha256=8YsoA6A8lq4F6QBgHo3QXwRUynPXp6AHMWbiK-s8CHo,41730
127
+ torchrl/collectors/collectors.py,sha256=4K08e9vt6EJbT17tswESXgRudGE-YA8IqDQ3-cQ8H-E,1868
128
+ torchrl/collectors/_multi_async.py,sha256=L6EsIFxC5KGB6kaSVGCVxsdnkygjH-qnR70L9ey-gI4,14363
129
+ torchrl/collectors/_single_async.py,sha256=Tz2DvtP_1wEPYOheWoOtIPQ9kQj_D1-MRu--6ZicjuA,14239
130
+ torchrl/collectors/_multi_sync.py,sha256=2bg_DDfZa5ghaa5EhRTcDmVHcngTigDfojvddD03bLY,20536
131
+ torchrl/collectors/__init__.py,sha256=rwqjwZrIbpQgkp6PkcOI-PuZv2gEamGjzsT45JE1lfo,1425
132
+ torchrl/collectors/_multi_base.py,sha256=Sp1-l31RyzlI9gjySTpUwldOJAve4x91n6ys_60_o4A,86594
133
+ torchrl/collectors/utils.py,sha256=vRL96op3oJnReJXFlPEdhawuUCmB4YEe-Sz8kYy-Vgg,17403
134
+ torchrl/collectors/_single.py,sha256=ZCRQucSj_kVo6X4xrMZi5TkTtnGhjihB7dmALtRDFig,89439
135
+ torchrl/collectors/_runner.py,sha256=u7Al0lNOsEW9h77bRydbUulKCKZFasqRQN-P1B0mM9g,24183
136
+ torchrl/collectors/llm/ray_collector.py,sha256=APGkD2YU3iIRXFxuyoGyvenzdNZC59-pl8AtzHy7xZE,11689
137
+ torchrl/collectors/llm/__init__.py,sha256=blxPktOeYA4u_QUCE0UHubFJktk1ul1a1eF74kDcIdg,387
138
+ torchrl/collectors/llm/utils.py,sha256=-KRSlOmjj34M0c3msP7yS_0DlLmqCijEbf_bADLjzuM,1148
139
+ torchrl/collectors/llm/base.py,sha256=PNnpxJNz_j52bUHRLHY29Q2y5znGUx1jImH7JctmZk4,22845
140
+ torchrl/collectors/llm/weight_update/vllm.py,sha256=8kga6yfPJCj7g7Ysn6i-2VNV9jFORvoPqgltzDW0AXk,13739
141
+ torchrl/collectors/llm/weight_update/__init__.py,sha256=N95OwLfgte-Z2ds28QmEPMvYq9YKO7xuKxBcjWs4_mg,324
142
+ torchrl/collectors/llm/weight_update/vllm_v2.py,sha256=HHa-JZ9e2FPuwQIjlB9uDQi5z0d_TNBAlhmxW7tDvAw,12044
143
+ torchrl/collectors/distributed/sync.py,sha256=Dw8S9O7PXOaOe7Rq5uLG0xY3VqzHAJmm6g4q2aWBfEQ,31849
144
+ torchrl/collectors/distributed/generic.py,sha256=lzGcuLJ6c1GNJDirnN67QtSyEYfCP-LdHM-TwxVzovY,57757
145
+ torchrl/collectors/distributed/__init__.py,sha256=haUhY4DnaCK4ebYxPuQFTgdA0A59bmjmHTdOgm6CR9g,958
146
+ torchrl/collectors/distributed/ray.py,sha256=b76RqP2fOA45FhVkLiWIvzCXjZJGb0Ou3uNTXATAMEw,50877
147
+ torchrl/collectors/distributed/rpc.py,sha256=j21Kjc6NYf4R8ys09c6TCDWlyCXUCsgDCrN7YJWNaJQ,44698
148
+ torchrl/collectors/distributed/utils.py,sha256=2zEcllTAHbE7PXfsnnH6ddKvTECxKNnfgLTaflm0DeE,6459
149
+ torchrl/collectors/distributed/default_configs.py,sha256=sk8yaEpfOklYS4cxtvPZ61IX1i5yiZt1zeMLF8rco7U,4383
150
+ torchrl/record/recorder.py,sha256=pvJVLQqhtToSDiI-0JDPNUm1icorklgF5qipBDw7yPQ,22382
151
+ torchrl/record/__init__.py,sha256=QdLnwjbnfd3eNsH0p2Zt5HKnAMvYPxNskbtB-pFTw90,506
152
+ torchrl/record/loggers/mlflow.py,sha256=Bf2HwVzbuDZLmE9lnk6w0jUZaqhC8tqYO0Us4OwSLkQ,4956
153
+ torchrl/record/loggers/wandb.py,sha256=19E7ql9rcx9WsTDH5gZOQnGIHhAOR7pA9eYa6OcIKB4,7539
154
+ torchrl/record/loggers/trackio.py,sha256=Q5wuqZcGqxyO2kTqzFxqgUc0X48HxPr8bEwAxBGGXmY,5073
155
+ torchrl/record/loggers/__init__.py,sha256=4WcizvyExqkCD9nZEbAQQSOjxizoSbnMnDT3dsfc0lc,545
156
+ torchrl/record/loggers/common.py,sha256=7hNxQfMqnOgsqRgJl7BBaRf6oKb7uIbu7n85q-tMySU,1186
157
+ torchrl/record/loggers/utils.py,sha256=n_3SyxaWGfHQKIS8b_7uXJrSAwvk8ENvCk3j_8iMUts,2712
158
+ torchrl/record/loggers/csv.py,sha256=e7B0TvvdL51MrEgiIAuRPmFv0_VGOrfHKh_Nr6t00L8,9298
159
+ torchrl/record/loggers/tensorboard.py,sha256=6DEdW7CuITjhLuzK5v8SwSI1i_AMm0SVpTTlAH9lUSM,4866
160
+ torchrl/objectives/td3.py,sha256=vAORFHYgYA1h-rs6DQsfjr0wtiPd0ZXyVQmrC-RB93U,23873
161
+ torchrl/objectives/iql.py,sha256=4UGUwumZDKYqrGuY14OuXp_MlDzkQS-2boxM4TMI6Do,43406
162
+ torchrl/objectives/crossq.py,sha256=MqYVBkeoX7V2VRAXBIpPhYb_iE87LbeEUUgpl3U7kaI,29240
163
+ torchrl/objectives/deprecated.py,sha256=a0oxktMPI50gdu1rUJ9vd1kvZXyCcpfdlMp4Zfomryw,21102
164
+ torchrl/objectives/dreamer.py,sha256=jXWHHzgg3vT2MzS8Styu9tW2IE53WeOrlpx00rRgj7I,18955
165
+ torchrl/objectives/reinforce.py,sha256=HR9VQEm5It0YpaUESML7Pd5SYUyjL3UyJxXPGk4Rx2E,22682
166
+ torchrl/objectives/__init__.py,sha256=F6ifaqPw6UX0NXXMeVuTUnbzDeMeeq7jtd2iwbm7Ysc,2167
167
+ torchrl/objectives/cql.py,sha256=BMtzLbZXUstxANRlxAXvlKqQ2JT828G-QPu4SSwLicw,55621
168
+ torchrl/objectives/redq.py,sha256=gOPndUnMy35YM8Yaci5u04QrE6DST7Ddd4GAv2UHq3c,28933
169
+ torchrl/objectives/decision_transformer.py,sha256=37LYZQZfztbpDWqiiSb0nHuam6ApjGgIaHYs9Z_fJPI,13095
170
+ torchrl/objectives/sac.py,sha256=ktKjihsWetV6r5ZKPB1dPewbRDbqnmAjHr8XwyK5W4o,68435
171
+ torchrl/objectives/functional.py,sha256=ZaglBjEGuOTNGeFA-Ox-ugZVcNegQMUj--KWHDRBmaU,2106
172
+ torchrl/objectives/common.py,sha256=I6mepxll2s3gdQUX3QOyN5HnjsYbm5ksfbKVJXzrKBo,31093
173
+ torchrl/objectives/utils.py,sha256=hNCeOtm8brXOvTULTYHdLEiJiKkSdKZ7TqvvFjU30HQ,27158
174
+ torchrl/objectives/ddpg.py,sha256=w90amzDzgd8deXj0HtkEgjnPz9XSYbbRYAYVwor5XUM,18568
175
+ torchrl/objectives/td3_bc.py,sha256=mAdQlXCqXyT-euzgvfqZSinf8GI13gvO5-91XDBpHBg,26633
176
+ torchrl/objectives/dqn.py,sha256=GsaB_UPeESl_RlsSEF_gzArVHUnEYR3kkjjcatZDOO4,29789
177
+ torchrl/objectives/ppo.py,sha256=z-j0JQZr02JUsHP1iepFsf8pk3bdgshJLKK-vGlBR4o,80293
178
+ torchrl/objectives/a2c.py,sha256=M-Eg6W22QFfE5lHIaNsXZta8-TOB-gHLf_NWJQf1DAg,28571
179
+ torchrl/objectives/gail.py,sha256=G7Maz6ZIPxoiU2u9VVmdji0nr8PHtX2FsSqaUbsEJys,9597
180
+ torchrl/objectives/llm/__init__.py,sha256=sLjJTKiLKTY3k3vGpQthD7wJC853P9FgjDr7ellVyzA,616
181
+ torchrl/objectives/llm/grpo.py,sha256=2JVBKYm9HGiqfZNaJbfMma9HqfTxBIj88wSNqps56LI,38154
182
+ torchrl/objectives/llm/sft.py,sha256=5Y8ibTjK3s_Tvt7SPGzoNsGqJrNxcEpQC0yC6QhQbHA,20883
183
+ torchrl/objectives/multiagent/__init__.py,sha256=CHxWmq5_3kveLcAdyB7cgSVYVIald7EZo81RRgozxo0,237
184
+ torchrl/objectives/multiagent/qmixer.py,sha256=8mTJAUUaAXzmuiFPZ2_qu-M3E-z236QN1DIhbSvw1lI,17298
185
+ torchrl/objectives/value/advantages.py,sha256=EtxTRMLSVK1m6FKOWYXxroViYidLDKQ_dyGwUesVBCs,85278
186
+ torchrl/objectives/value/__init__.py,sha256=AdluF370wYzOAcP_yglUAFnNByKVZzivBYJafkDQbJA,561
187
+ torchrl/objectives/value/functional.py,sha256=knsppthKKtrukm4FY599JKzwNtcWUFIbl63wxgBiNeI,51272
188
+ torchrl/objectives/value/utils.py,sha256=R5k45Cx6HQwO4bjeQmmk_d5DTO8Vh-a4DwZUL7ZLEw4,13256
189
+ torchrl/trainers/__init__.py,sha256=4vdkLfIi4zuIBALEnJt3JsvrCk6LSb3Q3WEfLEBGSrE,867
190
+ torchrl/trainers/trainers.py,sha256=afxZEirHIVeHoN5vpVdqOZppt4NvuejU9ZgFy_7eMUU,79007
191
+ torchrl/trainers/algorithms/__init__.py,sha256=oFnJudqqyUqu3RKeXwYGmLi4QF_G0Bi1vpZBDXmMgZI,312
192
+ torchrl/trainers/algorithms/sac.py,sha256=YnfeBt3wRPy9V3hFKF0xFZvHox0f_gJP6go1CjWRmIo,13060
193
+ torchrl/trainers/algorithms/ppo.py,sha256=-Y13deUel34Qp9akiOE5CWcTocnfP-oWUWuNdXmFaCk,15400
194
+ torchrl/trainers/algorithms/configs/weight_update.py,sha256=-WW2684043isc3pw9L3qAFNybRfZgWBa4xZFYMfmfnc,4939
195
+ torchrl/trainers/algorithms/configs/logging.py,sha256=AfbPuQnc1nBWQNs9PdjJNc5RHy73oYXtslnVIgpIPtM,1757
196
+ torchrl/trainers/algorithms/configs/transforms.py,sha256=EptvAT8dRmBSD3c8jld7WqUEBQm_5ygvPhvQnlEO9rg,28813
197
+ torchrl/trainers/algorithms/configs/envs.py,sha256=kDAn8lIzZa0T0PzHP5n1ljorrIELWPhoAK13kVB4Pdk,3348
198
+ torchrl/trainers/algorithms/configs/collectors.py,sha256=0mEeodJ_lPJrjMCtg9QVnts5kr_0s9Iv426CzCt7nnQ,6889
199
+ torchrl/trainers/algorithms/configs/weight_sync_schemes.py,sha256=SRa4H_B3JxHPC30Mtpcm37E7V8dh1IuTpdDJO_HjOzY,6565
200
+ torchrl/trainers/algorithms/configs/__init__.py,sha256=83QvbZIjcx45gShMCEQsRziDTvIrtr6W2OdikVAF3BM,26253
201
+ torchrl/trainers/algorithms/configs/objectives.py,sha256=aDcjXitdapgDMoFb2Wb1vbJGywDUgZHqERGflaf3QZM,5380
202
+ torchrl/trainers/algorithms/configs/common.py,sha256=CocWEAC_ZaXpwcC-nhnbRwMj6Sw143ka9JViaBQeLsg,1123
203
+ torchrl/trainers/algorithms/configs/utils.py,sha256=ct7c7p8dzpG2lPMhqo53mYHi_zJHNd10lkGRNOSLJ6M,6690
204
+ torchrl/trainers/algorithms/configs/trainers.py,sha256=ZMtQuQMXdbW8oj9m7RHyaqmBEFuhdiuT5eGT5qAS_ao,13413
205
+ torchrl/trainers/algorithms/configs/modules.py,sha256=Df3NduvePaQCQO471cKj3C-i4QERntu8rRRofGjmUko,17627
206
+ torchrl/trainers/algorithms/configs/envs_libs.py,sha256=l-VOeaEEbogj57uufZfTqM5isVOP_KyXTyuWP0QnNYE,10755
207
+ torchrl/trainers/algorithms/configs/data.py,sha256=F5CzjYbN-vO9RQDq4455plZ0-uUZmtRz_tfRhTi_u3U,8754
208
+ torchrl/trainers/helpers/envs.py,sha256=KZU-1cXESjppfSavfSFXABXmLSLguHtMBXqYz1mFV2M,22121
209
+ torchrl/trainers/helpers/collectors.py,sha256=DSWOSYo5zJ7t5CNllCPTHCNdEilQCrx-M_RyQ9PoNWw,18660
210
+ torchrl/trainers/helpers/models.py,sha256=ihTERG2c96E8cS3Tnul6a_ys6iDEEJmHh05p9blQTW8,21807
211
+ torchrl/trainers/helpers/__init__.py,sha256=HhDB2Ubq2gZodV-hB6xw4ZgCgwaZKUoZgOfVKPp0Vsc,1097
212
+ torchrl/trainers/helpers/logger.py,sha256=FtuEiLnK4NmxVVNyEEWaoCu3nG7WbNpHP3UYGQRJmgo,1278
213
+ torchrl/trainers/helpers/trainers.py,sha256=LnYSkzog5v7xr6Bl9ub9W9kHtU4b150b7jt5ePEt0uU,12021
214
+ torchrl/trainers/helpers/replay_buffer.py,sha256=ZUZHOa0TILyeWJ3iahzTJ6UvMl_0FdxuZfJEja94Bn8,2001
215
+ torchrl/trainers/helpers/losses.py,sha256=sHlJqjh02t8cKN73X35Azd_OoWGurohLuviB8Yeo4JQ,5272
216
+ torchrl/.dylibs/libc++.1.0.dylib,sha256=i6IIARoKMtEHiwAuH31BgdQhXA8GUYzxteIpqIuz6P0,1173408
217
+ torchrl/testing/mocking_classes.py,sha256=G6QEOy2sYWqHrK70ZCGlYwFhGk4cvxw46GdeOQqXgoE,92703
218
+ torchrl/testing/gym_helpers.py,sha256=J-exTeVx00pBRwMHe-uVwUSpFOStVMuw8EvrNqa1PBQ,5047
219
+ torchrl/testing/env_creators.py,sha256=7NuLs5n2APsiG2w7VK51JLiHhPmiM70G3_9IB_KDfx8,6590
220
+ torchrl/testing/__init__.py,sha256=5AnRWxg20NOAYhCGzPwvQSbnmNhQAg5wPVBZQfg4Xtc,2552
221
+ torchrl/testing/assertions.py,sha256=5Rsa3EDeQBxFlBXGCFt9rVMmt9J-KqWpmsiqt8m4ZhU,7424
222
+ torchrl/testing/utils.py,sha256=1C-QGLBvfnHmC9vDHKEvAWzFnxXerS9X_-fIkPUdS2s,5258
223
+ torchrl/testing/mp_helpers.py,sha256=wgvQGxj5WkuoOxk6Zk0v1Dl5neopE37eKm3G-VpG8jo,398
224
+ torchrl/testing/ray_helpers.py,sha256=d8o_f7G0FWEHRAXK3dvYV73tJJv-le3G-hu0Av1Sqe0,10106
225
+ torchrl/testing/modules.py,sha256=sBTv9Yx0RRQvB86x2IuEnkUQ-vU3G-vTnzYYUAKOkF8,10677
226
+ torchrl/testing/env_helper.py,sha256=VWFa4qU_NjpesDWxOmuHQ6cy2cZhQZE-_bIvfgkqj8M,1202
227
+ torchrl/testing/dist_utils.py,sha256=DD8eEN8uppS0cTAUUMAqmrk5hxw0Cqui-XnBuJy0gmk,3804
228
+ torchrl/testing/llm_mocks.py,sha256=ULOAz-qbBsJrkvLeOKh7FTTFnvhLteswkFf--Ms0s4w,4258
229
+ torchrl/modules/__init__.py,sha256=cisn2iO2V3THP4-IFIfivJDnKSVZk9xVF_o0DhZj15s,4568
230
+ torchrl/modules/llm/__init__.py,sha256=vu4Vg78KXuH5BPyHSNq88vBhAr5h7WN_b0mQXmjW1vk,1863
231
+ torchrl/modules/llm/utils.py,sha256=gf_F-4bEMwkcI3jLQM7ifB7nsjRctGebB5E2c-AznO0,726
232
+ torchrl/modules/llm/backends/__init__.py,sha256=vhOzeHDL6BhGV9pwnycwqzMj8L0jy_eeAqa245ce-Zg,2142
233
+ torchrl/modules/llm/backends/vllm/vllm_sync.py,sha256=zpGrBADTN9dNQjqjq1vA4oS-D9MadBDunKzbWZmWQZo,16423
234
+ torchrl/modules/llm/backends/vllm/vllm_async.py,sha256=8s8RS78ibaQBJ5D33-MPiroRjdJc3zq_7tOXucV5C9c,82579
235
+ torchrl/modules/llm/backends/vllm/vllm_plugin.py,sha256=iAjbwrEzr7WtdHlrJVvrzviWrN0oTtw4N0k1XvnlIek,694
236
+ torchrl/modules/llm/backends/vllm/__init__.py,sha256=WYHeVoMu4ZdqSuE6ZJogW7oKvDAaJPUCfUzJuTogWiE,2927
237
+ torchrl/modules/llm/backends/vllm/vllm_utils.py,sha256=VuxQhgSR25zODw22XKvnjE-pvelPUJu76rZlPUxTfgA,4843
238
+ torchrl/modules/llm/backends/vllm/_models.py,sha256=YUlKC5T_OW1FwIiHlj4zsbvytBOjq6pBXEo9R7KAhq4,1357
239
+ torchrl/modules/llm/backends/vllm/base.py,sha256=MpcqaWwjnbaS93vJ_DgODJy51dGkebmPOTxiLHDTAwM,2077
240
+ torchrl/modules/llm/policies/vllm_wrapper.py,sha256=hz30seeQhtr0cMU4QWM5gO9GknP2mBln8HpxhXhB_48,96287
241
+ torchrl/modules/llm/policies/__init__.py,sha256=8Iwi5SIQF7X9jJodWr468wksA_XSI2q9CLwDeR7vlwY,849
242
+ torchrl/modules/llm/policies/common.py,sha256=3gWTCFEfGjmAhHKVDLsekdH4n7ZGSl9CK2NEPu_CgIE,73210
243
+ torchrl/modules/llm/policies/transformers_wrapper.py,sha256=LIJTVm2JgNPWShmCF4ceasrY3OXpyHSoq-OdoAMFFN4,112089
244
+ torchrl/modules/utils/__init__.py,sha256=KXaF_xEghKSPsNg0JyfxChK6KWHFRy0lwkL2RipmNh0,1127
245
+ torchrl/modules/utils/utils.py,sha256=WPfcE-AoemnrP7Ny4FxJ-_LoQsBnX-y77Zb7MnZjXV0,2916
246
+ torchrl/modules/utils/mappings.py,sha256=VMYrPxDk1ywgl2l_f6HXZaRsVOKcYR7VF5DNkmi3lHk,362
247
+ torchrl/modules/models/model_based.py,sha256=Q3qgesZetVqVufPKCuRbeSKe_rrvZeqm0PXrOnIb0PA,23111
248
+ torchrl/modules/models/models.py,sha256=5CotUF7wihy97qOjCOBKqDpmte2qsll_PTO9T4ST7WQ,66044
249
+ torchrl/modules/models/batchrenorm.py,sha256=TojpTUluIcFdTSemIVRLGtB2O5q54mRHy3vJP6DuI5I,4750
250
+ torchrl/modules/models/multiagent.py,sha256=lHZO_Lite6l8q1bvJwojP6V6UKEcRM1za8-mdOm1njE,43998
251
+ torchrl/modules/models/exploration.py,sha256=Hm9Ws9bqgYjYQT7zSFe0yQhKAkXwfxlsJoeDhSvEHZA,30610
252
+ torchrl/modules/models/__init__.py,sha256=DrOG-7hynjjUh_tc2EqysiUiNMRiDR0WLtZql9TPNcI,1743
253
+ torchrl/modules/models/llm.py,sha256=nAOlXIZbtIJrj6HzpkPwNl4s0kyCbXp2PaYb1bxOAqU,6398
254
+ torchrl/modules/models/decision_transformer.py,sha256=2ug1oE7Ml1-Kbm5C3U3WTMYKzKIDvCbKS3WsNwdb_MQ,6599
255
+ torchrl/modules/models/utils.py,sha256=Bs4v-NWrH_kCek4y-_91Yy7y_FOD7120td5tn0ntsv8,5058
256
+ torchrl/modules/models/recipes/impala.py,sha256=TRqFHaGyYSJDCokhZ9gdlrIydZ-LOHUqBWlnTvqzvfw,5667
257
+ torchrl/modules/planners/cem.py,sha256=xpQBPKaY36TClKRvuQPL-hzoL0ie1s95xxlMcv_fVmw,9539
258
+ torchrl/modules/planners/mppi.py,sha256=dPOrYcY-pT0yRK4qMxfJMUxOrNiy-AvJjca0mNFjh1g,10769
259
+ torchrl/modules/planners/__init__.py,sha256=nfLJXqhcPuB0aPBKs-mqGJ633kCNa0TaCynpH1pB4wo,332
260
+ torchrl/modules/planners/common.py,sha256=uYEuOiWwu29XS7NmlyS65xZX0BNuLGTaRi4UlRhA1hg,2441
261
+ torchrl/modules/distributions/truncated_normal.py,sha256=be---9L_Y1_rak8xtG2o64whWMlCddfWSqL9jslRqoE,6215
262
+ torchrl/modules/distributions/discrete.py,sha256=KydEwTRWtIm_24f5ww8nMoznyYYfr3HmK1LSkqN339s,35590
263
+ torchrl/modules/distributions/__init__.py,sha256=RDFoYD9IX1FhwXk5R4M8khq42gdTOcVnUnKHfWCTZBQ,1597
264
+ torchrl/modules/distributions/utils.py,sha256=sy7ry1b_aj8Uz0t0ASmpQPiZ0tfGKdSLTSrBrH54ZXM,7821
265
+ torchrl/modules/distributions/continuous.py,sha256=ZoTVmHRl3VpYZRMtBV17ksfh77Lph8PxpxUe6YdQoFA,29533
266
+ torchrl/modules/mcts/__init__.py,sha256=yShDb5tTIiqoNJ-wJm4HZRnhWu3QGYA-Jiirdaa8fzQ,420
267
+ torchrl/modules/mcts/scores.py,sha256=WmuqygCuxZgEeW2-t-vBicHp77kn6e2sThaFZEcmgOE,23352
268
+ torchrl/modules/tensordict_module/exploration.py,sha256=uIvvlbZYQunRtO9uCkBW03OIEZ-Tq5M_kgqFgOQMLWg,32160
269
+ torchrl/modules/tensordict_module/sequence.py,sha256=GqKuwWFs2T3apxLwkAkrMKk-Er0CmnFDK8SzTTTfoAE,6011
270
+ torchrl/modules/tensordict_module/__init__.py,sha256=y5f4nXk-eWkOh0qwiwRDg7c5C0cUbGgr-AlLW1IoCvs,2334
271
+ torchrl/modules/tensordict_module/common.py,sha256=lz5rrCQ_F0z6kjRGwi_G7WwFzvSYeHZnFcc_eFY62dg,21707
272
+ torchrl/modules/tensordict_module/probabilistic.py,sha256=N_KoR55DooL6oKBrQzvBSv6IY3a_H1djDPtQekyPLXw,16358
273
+ torchrl/modules/tensordict_module/world_models.py,sha256=Y3ag1locZbH5WC3ZGY90K3wi3E6ea_0ILX0X3OnzVwc,1360
274
+ torchrl/modules/tensordict_module/actors.py,sha256=J-E8QCy0WzBrKfvExi7R0VN7cLuX5SBmaKc03KSOsw4,108726
275
+ torchrl/modules/tensordict_module/rnn.py,sha256=gTcz84-D7DFYbkP01IyDXX-uGosm-ejnPFWLqo3Xk5E,65731
276
+ torchrl/envs/env_creator.py,sha256=EopTdn4BmFIeDukSxq_l_frO3bE-vwTphrIP-79wll4,10308
277
+ torchrl/envs/async_envs.py,sha256=D1-VnNYQ6wUANRD8EA7h6FEmM6PC-NziSo86gVRlnbo,46139
278
+ torchrl/envs/batched_envs.py,sha256=QD1UCr5fqKJ8FLbNkKrXHyuTenJjE-RoMQwzzMX0prA,131434
279
+ torchrl/envs/vec_envs.py,sha256=HLeoGymXhr_2DMzU8ZpLFBSLGU6qeURHGWS0Z1V7Kro,366
280
+ torchrl/envs/__init__.py,sha256=7JqZMLwe9H6SIW4qEoeuSAbWkxbZsDJhtP_A_ApU7Jc,5807
281
+ torchrl/envs/gym_like.py,sha256=7_8z1V0Q8x6LbzlNFGLvt7nXgkJcA2-6AIsgv5w_ux8,31629
282
+ torchrl/envs/common.py,sha256=6fRp9Zj3R0RVJH-akjrGz8kTJ43QZ48Ghyg-Yf3i5vA,177460
283
+ torchrl/envs/utils.py,sha256=aW-1VptmWmEj5j9qNUmPEs7HZ7J8NnbWu7TgzN5uHC4,72214
284
+ torchrl/envs/llm/envs.py,sha256=KWSQq2DaoOZ5TqSFVR-uN5mu7w-ESkQuOI6BuesOkSg,35024
285
+ torchrl/envs/llm/__init__.py,sha256=31NLrTHGnac2K5r1p7jI9BfgGJuYu_PU-i8ft7mij3Y,1441
286
+ torchrl/envs/llm/chat.py,sha256=ZvWI8c5Ej4O2a-xzYxpxWS09Q-MaWup647wkaitNmck,31799
287
+ torchrl/envs/llm/datasets/ifeval.py,sha256=hEEdGRjzgddqNuCoW6QYnAbeM0_u0bEhuQ1UX5kAmWg,12099
288
+ torchrl/envs/llm/datasets/gsm8k.py,sha256=JHX2lGjMFfqpD8VzPV0R5bnbKqMqr1YFA-M4kSZdGfA,16701
289
+ torchrl/envs/llm/datasets/__init__.py,sha256=FFethtv8unJWzphGLPQVC5QD9NMdaygEjx25O1DHHZk,473
290
+ torchrl/envs/llm/datasets/README.md,sha256=8lz6SVX3XuPte4n3s_yDLXBRRLbyKdh6rjdO7wgqj1c,112
291
+ torchrl/envs/llm/libs/__init__.py,sha256=vhEm5Fhz1sLWt107zfZLy5pzGmfQi0fNBGazTq1m7dU,266
292
+ torchrl/envs/llm/libs/README.md,sha256=FjqAs7gEwrxbLIWbfPBz4YY1xyjLL6mQdZSB9ElHjFU,90
293
+ torchrl/envs/llm/libs/mlgym.py,sha256=JUTrraE4QfdcAtblEMe0796orVa68rk1b6xvZhhHiUc,31447
294
+ torchrl/envs/llm/transforms/dataloading.py,sha256=8ArOL5VFukZolOxAkRXGWr3Vm0kP0K5b756bsK0oiLg,38084
295
+ torchrl/envs/llm/transforms/tools.py,sha256=VINvpsXJ_0LYbIvPeMF0t8qTW7kAeK6hoT4yT1ezyJk,72205
296
+ torchrl/envs/llm/transforms/__init__.py,sha256=HvajrQ80KFO6ktyMmQbLTIwaDaaKpC8bf4cuJ7Z2eZY,1349
297
+ torchrl/envs/llm/transforms/format.py,sha256=ESn0S9k5G4FQPBICq9h6ZsLKXZqiU71tYW8UnW4rgLI,2519
298
+ torchrl/envs/llm/transforms/browser.py,sha256=WVr266XvyAY0zUa7WIP026UHAKv34Jfo3XMhn3Djr5c,10445
299
+ torchrl/envs/llm/transforms/reason.py,sha256=FINmutplG6iLn38nc4R1xO8lucBbCoHsQlnjwFTEhUs,13761
300
+ torchrl/envs/llm/transforms/tokenizer.py,sha256=ScXK5LRL7zxyDCXvDyhyzcoRa1YZe677bVQ9a_PoiF4,13962
301
+ torchrl/envs/llm/transforms/policy_version.py,sha256=QMX9Vql9bf1uKiCbsKvVChJyQ1sBWirHR5QPsEIH8IU,6963
302
+ torchrl/envs/llm/transforms/kl.py,sha256=B40tDVMLZX8w0IyA4xjHcdJXHl9-TtE6rDIXp6HzYek,70947
303
+ torchrl/envs/llm/reward/gsm8k.py,sha256=M0m1MyDE7fW5YcmAQXbKGboOQhPXM3LIBczG2yhLtXc,13192
304
+ torchrl/envs/llm/reward/__init__.py,sha256=a-Xsye29z2LugO1cOCFM2FNsqNwEp-5XwQk4saVQlu8,370
305
+ torchrl/envs/llm/reward/ifeval/_scorer.py,sha256=b6wvzZSv8_sZQ6j6VN6HbMIcKqpXao7yQtmFgnMbB2A,17852
306
+ torchrl/envs/llm/reward/ifeval/_instructions_registry.py,sha256=3_guc8LZ0mWQc-n6E4cQgYMgZRYa6xfgvXgrze9aO_w,3814
307
+ torchrl/envs/llm/reward/ifeval/_instructions_main.py,sha256=y0DzhnXKZOz_jifqX9eEMND45DK3zxMYvEsucO3q4Ns,4298
308
+ torchrl/envs/llm/reward/ifeval/__init__.py,sha256=g5NtrwfwqK22hRcoIdz8-KWBh5Ogre9J-Bf3uGWE9Pg,314
309
+ torchrl/envs/llm/reward/ifeval/README.md,sha256=zWb-mPlgdsiy4vxXOEB2pXr_XL4JKJu4o29jyQXR-Rs,802
310
+ torchrl/envs/llm/reward/ifeval/_instructions_util.py,sha256=Oe_85LlrHykAr9_XW8KdIsFOJ3lx3j5GfqS4mJv1pVY,26024
311
+ torchrl/envs/llm/reward/ifeval/_instructions.py,sha256=FEdThc5Gui0J7uZHaOd-i8wc5XcMoBx8qYL9RbG3E8o,61717
312
+ torchrl/envs/libs/openspiel.py,sha256=iXmkOjsv2cI2ZYlMe7u56h4BS122jWswZ54g3o8yTsA,24801
313
+ torchrl/envs/libs/gym.py,sha256=4xduxMAsaF8lPREOwexAbK57RE0T6q9Zm1jwwPqidZU,88637
314
+ torchrl/envs/libs/_gym_utils.py,sha256=HZouqci2114LZIUToyAWZhSNRgRCIzM-DFIZXH3-zKI,12824
315
+ torchrl/envs/libs/meltingpot.py,sha256=nd8P3JW_1D6fm_-eZbgmZle20fBoN6M_08SH5ydNS3Y,26096
316
+ torchrl/envs/libs/vmas.py,sha256=0qOlhRW8z3Fx2-MQ21ANdeQMoMBs3U5cChP7sFKCd0s,35416
317
+ torchrl/envs/libs/openml.py,sha256=cuTWhedmXiDYjz8O-wsAuCKPfxaRGYaOffopGzidUw8,5713
318
+ torchrl/envs/libs/isaacgym.py,sha256=GqXwbs9Iq7A5PHr1Sa-7UgQF42DLW7BFcu8lWYhBVJ8,7133
319
+ torchrl/envs/libs/procgen.py,sha256=p0ZaCxO2bsVPcNjA5GfJ3MuM-SPFfsqb22fDPAdfVH8,13753
320
+ torchrl/envs/libs/robohive.py,sha256=zbxUyCW6bhVUO5Sdq_FsSLJCArCLcICIosLl1MCK658,15799
321
+ torchrl/envs/libs/habitat.py,sha256=PYvVqS8AGwplSY9r1x6RSLPejSKvxEyZgcDXFZvCYqA,5387
322
+ torchrl/envs/libs/__init__.py,sha256=G-lAW_jggAXo-6nYeRYVJetlTGHASaezQGBkx_ABqVA,1844
323
+ torchrl/envs/libs/pettingzoo.py,sha256=4XZi1k3xnb9pNgFYkmx2JtgNNx5vWljCCqg6V7zYfII,46616
324
+ torchrl/envs/libs/isaac_lab.py,sha256=4QiCB3tVGQ_D-gOngHyhtVrivy76B32fKGvpt-0hwxo,3436
325
+ torchrl/envs/libs/jax_utils.py,sha256=MAm0dvsG6Uk73Obh5ablkGIgkdUgGZnOqqniST0-lZk,6081
326
+ torchrl/envs/libs/utils.py,sha256=RgiR16KJWFEtQim44-AIcHByGTq_NrtpjWoYIC13aYA,5207
327
+ torchrl/envs/libs/brax.py,sha256=mus51cyPbIwZfU8Pd90sybWJOePed1IN_XpqjtJ3YrQ,31185
328
+ torchrl/envs/libs/jumanji.py,sha256=XS2dw3ekt8621VmMbASlUTyqHhLpzVgmuMyLgj07lks,40271
329
+ torchrl/envs/libs/envpool.py,sha256=Y0l1AiFA5qOjEKvjKkzGcv-8Aydv03ZWYE88-CTV--M,18019
330
+ torchrl/envs/libs/smacv2.py,sha256=TZB5srcrPSwxpL7d4mwuVgfSs1WNypplck7Pr7u5hho,29048
331
+ torchrl/envs/libs/unity_mlagents.py,sha256=Z3qSU0H3o2NXbS2lNvQ7OmYxkr3AWAMyRHfxeCtNZrk,49667
332
+ torchrl/envs/libs/dm_control.py,sha256=GTIkiYXr1EC-bVGY5i8GLNId6BFbruY4yNHr18OqReE,22582
333
+ torchrl/envs/transforms/transforms.py,sha256=Jt1qC6IlRCIrK5So7ytTMkuyWu3lrPMznMVWS8teSZU,497221
334
+ torchrl/envs/transforms/vc1.py,sha256=mho5BvdAK-f9hD9t-iah52wT2B06qPmaJO7chrfIOWY,10534
335
+ torchrl/envs/transforms/gym_transforms.py,sha256=xh1TYnZG-i7Q8Fzx3L5MWG7KH4XMP8QXvOrehep5o2M,9882
336
+ torchrl/envs/transforms/ray_service.py,sha256=5Z13-CzQOgkwHaStvoDLEeexfoQMuVR23mMJxPZ386s,23114
337
+ torchrl/envs/transforms/__init__.py,sha256=WaSoJgI6xXAgyO2VGDhpw94LPDnFA5FxSUrdYpnkzwA,3191
338
+ torchrl/envs/transforms/vecnorm.py,sha256=01b_tN5WVQykGIkRhiPEDc1-K5hkNzk1iimkSg1DE_c,35381
339
+ torchrl/envs/transforms/functional.py,sha256=8A47pcBHNI8hu-uLHlDMdRat9g-tLtqnBy26ICtYwbE,1438
340
+ torchrl/envs/transforms/vip.py,sha256=INwcCNpVzM-zBMZcVdJ5dRj0avDqr7AvMIjt6ru1ZqY,14757
341
+ torchrl/envs/transforms/utils.py,sha256=7ToVFnD4-DkOMtML91g4bqXeY0bZ-gmCaSLxC93oaKM,3264
342
+ torchrl/envs/transforms/rb_transforms.py,sha256=6ohnKXHHAEh2Hz3Seaw6eDrcFMu-1IVQrT7RVywh3YQ,7447
343
+ torchrl/envs/transforms/module.py,sha256=nHPT3VF3wUSU9PdFvmPpc_h_hZi-cXX3dlSB2tHE4tk,14241
344
+ torchrl/envs/transforms/r3m.py,sha256=sdTVLpnxHfzFVo5rO8WnXf2uUg9cr4LBOLBsWaFgGT8,13478
345
+ torchrl/envs/model_based/dreamer.py,sha256=7FVygw6BZQh4UZmz2yGTXlsirJgpXbK4UXUooUX2qwA,4265
346
+ torchrl/envs/model_based/__init__.py,sha256=AkgZvTP5AerIg6ZwXfCfk3bnSr01hlwZWDiRd3UjBE4,331
347
+ torchrl/envs/model_based/common.py,sha256=dFVd3dPhaXC1Hij-LcHSyZ55phAXHUFMnk7j8egy5Xs,7792
348
+ torchrl/envs/custom/chess.py,sha256=dtIoSKRIYxoYDM9yzFC-8_OoVG8jXkgX49h2Ykyp2KM,24663
349
+ torchrl/envs/custom/tictactoeenv.py,sha256=ni5xseTSCOAt0a5ai5HH1ZvgJ-H3V-viR7LW43OBS7c,12259
350
+ torchrl/envs/custom/san_moves.txt,sha256=UY5rPgH0iu5kyl0W8NIaVX8BTC-LOReqdLcDLIYGv6g,188218
351
+ torchrl/envs/custom/__init__.py,sha256=IqDrii7ZIdvp8wa7IbrmupO7DOWI3MDXDr-gwrsMlLk,384
352
+ torchrl/envs/custom/llm.py,sha256=lYNmaeDUREWzU06fMUa6U8aDrazVEYlnYyfkfWfRnDw,8655
353
+ torchrl/envs/custom/pendulum.py,sha256=pb5v9_kMSIicHvUKx-wvMfEdjCsaeK1PQuYqdlzkzBQ,18216
354
+ torchrl/data/tensor_specs.py,sha256=qzQa-Dnt8zwpdrcFpQa_ivoUa3p7V5Qp793qllErh3A,258112
355
+ torchrl/data/__init__.py,sha256=7WMAP7ro1KQM1TAdEGrKg8QxS022lvoCD1vLdmc6L-M,4263
356
+ torchrl/data/utils.py,sha256=Kcs2Az8fGVJbkmz4KTk25VcrG-BaF9vdSiGr0H2u0Wc,12107
357
+ torchrl/data/llm/__init__.py,sha256=B4Ekok-w5PMiWcfmAGXaseaN6hWdNOr4WebeLrHfBVQ,975
358
+ torchrl/data/llm/dataset.py,sha256=IDKEsJFCNXSc9_I1Wuk88ZqPNo8tyBdnovBxaImL9cE,20712
359
+ torchrl/data/llm/utils.py,sha256=axe3wSovfWBm5YmR_uJYpfAmYtd__2i9SCKgUSezkBk,23600
360
+ torchrl/data/llm/prompt.py,sha256=bg5LzJfwOq5Ns72KQMciIprMWAmDDinzdopwdopU04c,8380
361
+ torchrl/data/llm/reward.py,sha256=FbPchNXG3smJV9NCbB5Yk4grsCa2Se4KZ_tojVLKWQM,8404
362
+ torchrl/data/llm/topk.py,sha256=mYXCgJS4TuEVLZfTNccQd6kmC858AAh2Ygy0q_K1hlY,8365
363
+ torchrl/data/llm/history.py,sha256=HP8Lu_JPVAUCsVm04v9HIUYFvCjtMbGSUgF5WdnhfUk,59466
364
+ torchrl/data/datasets/gen_dgrl.py,sha256=62ryTA9QRIVYiA9RisEithHI_Q4lKvf7qD3xP-3VEN4,14293
365
+ torchrl/data/datasets/openml.py,sha256=64m75wX4gs1mxouMqUIrBMPkox-6mvIxHFYIPDpTFxY,7018
366
+ torchrl/data/datasets/roboset.py,sha256=oZAUJUdM6OXoMGip-4TvDLFCJkapAxC7TE2rFPPb1ts,16657
367
+ torchrl/data/datasets/__init__.py,sha256=fPjeCNa4gA_0XaVDCf-9Q9FYI73GEqVr2VNjDR6iSOc,1294
368
+ torchrl/data/datasets/common.py,sha256=JVSMJtzb5LPhrBFYmgBKFuJc15wU6nJnwxurULKNgfU,16020
369
+ torchrl/data/datasets/utils.py,sha256=nAFDTlBIPyEoPoJC-Hc_fcOhzE7UZQE4BwKxq15Vhvk,339
370
+ torchrl/data/datasets/minari_data.py,sha256=-THiIU1OolwObKMdlucPSvXqkTy_fEXU-M1YCBlUUUs,28425
371
+ torchrl/data/datasets/d4rl.py,sha256=2iQ4_e9zVGpr48jWHrD5fEcKhz2t_K3wYKkbCSMOw-I,20199
372
+ torchrl/data/datasets/d4rl_infos.py,sha256=pxHgQ2P5uHiVt6sY4NCQfqOU6dL_QwdFYtdpTnEju0o,22570
373
+ torchrl/data/datasets/vd4rl.py,sha256=fwmZdprefuVYSw7Zwi9Xf1p5DJRToK2gyxreL9h7w-M,18271
374
+ torchrl/data/datasets/openx.py,sha256=HR4ryHksYP1Q7gn4-W5kXHG6zpTseB3CD0TWBdh048w,33630
375
+ torchrl/data/datasets/atari_dqn.py,sha256=r1QB7PEibeXFGx-llQ9tIf4pEADhyEi_-3PPTBRN8XE,40748
376
+ torchrl/data/postprocs/__init__.py,sha256=Z9JpRKMGsuFGpB3ro4R9Y_hYTBqkkzbkWZR79TRZ7Ig,270
377
+ torchrl/data/postprocs/postprocs.py,sha256=AQEgOgTd1LUgelmaoJa7hAVJIloI4M1jKHswklvkeqw,15152
378
+ torchrl/data/map/tree.py,sha256=apv3YCx2OCh6xY4Kf6oxEkxf8ndrbGj-PvZ7qhqkLfM,59348
379
+ torchrl/data/map/tdstorage.py,sha256=U-Ua1FWeacoBlYnmkfqLXjyr-dzxq48gIi1iaIwYORo,14780
380
+ torchrl/data/map/query.py,sha256=WTPDToYDVe4LtA8T4wMfST0l8VCGGVhPTLJJpWYS1XI,7921
381
+ torchrl/data/map/__init__.py,sha256=1IB8lWApscQOOscsCEhQrUDy_AE1wWV51Tcl1Segsqk,555
382
+ torchrl/data/map/hash.py,sha256=a3K3zUYNkTfWodMqAN2XdKVXjhs_wNZovlxQ7XsTolU,7261
383
+ torchrl/data/map/utils.py,sha256=HQYSAtgVQ8zNMZ0MRMafcyKzcMGZ760FtdHHd8JyxhE,2919
384
+ torchrl/data/replay_buffers/__init__.py,sha256=mu7oVx3IlZyTN9x5VafiHz49eO2t7JOxaBAKehUzcq8,2496
385
+ torchrl/data/replay_buffers/writers.py,sha256=pJmkYugQMA66FZjPv304EwSjxHpj4IQqueWdx56v4fM,29713
386
+ torchrl/data/replay_buffers/replay_buffers.py,sha256=AN6eJg-ADcNnYe1XGCveW-t8o7-oemk6jAyvg8eBcFY,101817
387
+ torchrl/data/replay_buffers/utils.py,sha256=eDTxYYhlY7RUYysgv9DUlkFQNCxuskc1icnK7KII8eU,38598
388
+ torchrl/data/replay_buffers/ray_buffer.py,sha256=D6jZROBHCyYmuG03RrlTbzScBrMz7Vj2PgU6NAm5bsA,10395
389
+ torchrl/data/replay_buffers/checkpointers.py,sha256=NPA8tCKFqKjXESgtxpxQjPmKwtxFPsELVgX25rU_IuI,23585
390
+ torchrl/data/replay_buffers/scheduler.py,sha256=R34GHuzWmnA7mX_O0n0yHayyZH02FuwBJewmt1IpK34,10179
391
+ torchrl/data/replay_buffers/samplers.py,sha256=wHQ4RGCvPkq4FnTS94IcTbeAa9H1ojxUtr5USRdOiVw,111805
392
+ torchrl/data/replay_buffers/storages.py,sha256=7g0-jdUFexx_Rm_Ai4rX6ga4LRQGZ4gBC038tGC_-Ss,92437
393
+ torchrl/services/ray_service.py,sha256=5gonFMdTOzTZt1_-AM13HmmiFgfs1eWS2XZyLZsvGDE,15966
394
+ torchrl/services/__init__.py,sha256=BOd8Ow0myaJ4V2mIpl2hykCdIbY0hhr3sO49uVyg8dY,2775
395
+ torchrl/services/base.py,sha256=zG6fvBnmJWYMlNddWh3LndMUpa6yWSCv6ZnlKp227_c,3604
@@ -0,0 +1,5 @@
1
+ Wheel-Version: 1.0
2
+ Generator: setuptools (80.10.2)
3
+ Root-Is-Purelib: false
4
+ Tag: cp314-cp314-macosx_11_0_arm64
5
+
@@ -0,0 +1,2 @@
1
+ [vllm.general_plugins]
2
+ fp32_overrides = torchrl.modules.llm.backends.vllm.vllm_plugin:register_fp32_overrides
@@ -0,0 +1,21 @@
1
+ MIT License
2
+
3
+ Copyright (c) Meta Platforms, Inc. and affiliates.
4
+
5
+ Permission is hereby granted, free of charge, to any person obtaining a copy
6
+ of this software and associated documentation files (the "Software"), to deal
7
+ in the Software without restriction, including without limitation the rights
8
+ to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
9
+ copies of the Software, and to permit persons to whom the Software is
10
+ furnished to do so, subject to the following conditions:
11
+
12
+ The above copyright notice and this permission notice shall be included in all
13
+ copies or substantial portions of the Software.
14
+
15
+ THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
16
+ IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
17
+ FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
18
+ AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
19
+ LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
20
+ OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
21
+ SOFTWARE.
@@ -0,0 +1,7 @@
1
+ benchmarks
2
+ build
3
+ gallery
4
+ scripts
5
+ sota-check
6
+ sota-implementations
7
+ torchrl