rlox 1.2.0__tar.gz
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- rlox-1.2.0/Cargo.lock +6462 -0
- rlox-1.2.0/Cargo.toml +15 -0
- rlox-1.2.0/LICENSE-APACHE +190 -0
- rlox-1.2.0/LICENSE-MIT +21 -0
- rlox-1.2.0/PKG-INFO +351 -0
- rlox-1.2.0/README.md +313 -0
- rlox-1.2.0/crates/rlox-burn/Cargo.toml +18 -0
- rlox-1.2.0/crates/rlox-burn/README.md +36 -0
- rlox-1.2.0/crates/rlox-burn/src/actor_critic.rs +528 -0
- rlox-1.2.0/crates/rlox-burn/src/continuous_q.rs +347 -0
- rlox-1.2.0/crates/rlox-burn/src/convert.rs +86 -0
- rlox-1.2.0/crates/rlox-burn/src/deterministic.rs +339 -0
- rlox-1.2.0/crates/rlox-burn/src/dqn.rs +364 -0
- rlox-1.2.0/crates/rlox-burn/src/entropy.rs +139 -0
- rlox-1.2.0/crates/rlox-burn/src/lib.rs +26 -0
- rlox-1.2.0/crates/rlox-burn/src/mlp.rs +161 -0
- rlox-1.2.0/crates/rlox-burn/src/stochastic.rs +373 -0
- rlox-1.2.0/crates/rlox-burn/src/training.rs +150 -0
- rlox-1.2.0/crates/rlox-candle/Cargo.toml +20 -0
- rlox-1.2.0/crates/rlox-candle/README.md +42 -0
- rlox-1.2.0/crates/rlox-candle/src/actor_critic.rs +374 -0
- rlox-1.2.0/crates/rlox-candle/src/collector.rs +283 -0
- rlox-1.2.0/crates/rlox-candle/src/continuous_q.rs +269 -0
- rlox-1.2.0/crates/rlox-candle/src/convert.rs +65 -0
- rlox-1.2.0/crates/rlox-candle/src/deterministic.rs +206 -0
- rlox-1.2.0/crates/rlox-candle/src/dqn.rs +203 -0
- rlox-1.2.0/crates/rlox-candle/src/entropy.rs +99 -0
- rlox-1.2.0/crates/rlox-candle/src/lib.rs +22 -0
- rlox-1.2.0/crates/rlox-candle/src/mlp.rs +100 -0
- rlox-1.2.0/crates/rlox-candle/src/stochastic.rs +254 -0
- rlox-1.2.0/crates/rlox-candle/src/training.rs +137 -0
- rlox-1.2.0/crates/rlox-core/Cargo.toml +30 -0
- rlox-1.2.0/crates/rlox-core/README.md +79 -0
- rlox-1.2.0/crates/rlox-core/src/buffer/columnar.rs +214 -0
- rlox-1.2.0/crates/rlox-core/src/buffer/concurrent.rs +293 -0
- rlox-1.2.0/crates/rlox-core/src/buffer/episode.rs +530 -0
- rlox-1.2.0/crates/rlox-core/src/buffer/extra_columns.rs +271 -0
- rlox-1.2.0/crates/rlox-core/src/buffer/flat.rs +258 -0
- rlox-1.2.0/crates/rlox-core/src/buffer/her.rs +606 -0
- rlox-1.2.0/crates/rlox-core/src/buffer/mixed.rs +232 -0
- rlox-1.2.0/crates/rlox-core/src/buffer/mmap.rs +895 -0
- rlox-1.2.0/crates/rlox-core/src/buffer/mod.rs +169 -0
- rlox-1.2.0/crates/rlox-core/src/buffer/offline.rs +634 -0
- rlox-1.2.0/crates/rlox-core/src/buffer/priority.rs +1072 -0
- rlox-1.2.0/crates/rlox-core/src/buffer/provenance.rs +217 -0
- rlox-1.2.0/crates/rlox-core/src/buffer/ringbuf.rs +725 -0
- rlox-1.2.0/crates/rlox-core/src/buffer/sequence.rs +427 -0
- rlox-1.2.0/crates/rlox-core/src/buffer/varlen.rs +159 -0
- rlox-1.2.0/crates/rlox-core/src/env/batch.rs +81 -0
- rlox-1.2.0/crates/rlox-core/src/env/builtins.rs +1082 -0
- rlox-1.2.0/crates/rlox-core/src/env/mod.rs +48 -0
- rlox-1.2.0/crates/rlox-core/src/env/mujoco.rs +567 -0
- rlox-1.2.0/crates/rlox-core/src/env/parallel.rs +549 -0
- rlox-1.2.0/crates/rlox-core/src/env/spaces.rs +372 -0
- rlox-1.2.0/crates/rlox-core/src/error.rs +32 -0
- rlox-1.2.0/crates/rlox-core/src/lib.rs +23 -0
- rlox-1.2.0/crates/rlox-core/src/llm/mod.rs +1 -0
- rlox-1.2.0/crates/rlox-core/src/llm/ops.rs +462 -0
- rlox-1.2.0/crates/rlox-core/src/pipeline/channel.rs +257 -0
- rlox-1.2.0/crates/rlox-core/src/pipeline/collector.rs +335 -0
- rlox-1.2.0/crates/rlox-core/src/pipeline/mod.rs +2 -0
- rlox-1.2.0/crates/rlox-core/src/seed.rs +51 -0
- rlox-1.2.0/crates/rlox-core/src/training/augmentation.rs +291 -0
- rlox-1.2.0/crates/rlox-core/src/training/cpd.rs +414 -0
- rlox-1.2.0/crates/rlox-core/src/training/gae.rs +434 -0
- rlox-1.2.0/crates/rlox-core/src/training/kl.rs +73 -0
- rlox-1.2.0/crates/rlox-core/src/training/mod.rs +10 -0
- rlox-1.2.0/crates/rlox-core/src/training/normalization.rs +965 -0
- rlox-1.2.0/crates/rlox-core/src/training/packing.rs +330 -0
- rlox-1.2.0/crates/rlox-core/src/training/reward_shaping.rs +410 -0
- rlox-1.2.0/crates/rlox-core/src/training/simd_ops.rs +580 -0
- rlox-1.2.0/crates/rlox-core/src/training/vtrace.rs +509 -0
- rlox-1.2.0/crates/rlox-core/src/training/weight_ops.rs +285 -0
- rlox-1.2.0/crates/rlox-nn/Cargo.toml +15 -0
- rlox-1.2.0/crates/rlox-nn/README.md +48 -0
- rlox-1.2.0/crates/rlox-nn/src/distributions.rs +188 -0
- rlox-1.2.0/crates/rlox-nn/src/error.rs +19 -0
- rlox-1.2.0/crates/rlox-nn/src/lib.rs +19 -0
- rlox-1.2.0/crates/rlox-nn/src/tensor_data.rs +103 -0
- rlox-1.2.0/crates/rlox-nn/src/traits.rs +387 -0
- rlox-1.2.0/crates/rlox-python/Cargo.toml +27 -0
- rlox-1.2.0/crates/rlox-python/README.md +47 -0
- rlox-1.2.0/crates/rlox-python/src/buffer.rs +1216 -0
- rlox-1.2.0/crates/rlox-python/src/env.rs +316 -0
- rlox-1.2.0/crates/rlox-python/src/lib.rs +85 -0
- rlox-1.2.0/crates/rlox-python/src/llm.rs +196 -0
- rlox-1.2.0/crates/rlox-python/src/nn.rs +409 -0
- rlox-1.2.0/crates/rlox-python/src/training.rs +1004 -0
- rlox-1.2.0/pyproject.toml +61 -0
- rlox-1.2.0/python/rlox/__init__.py +359 -0
- rlox-1.2.0/python/rlox/__main__.py +167 -0
- rlox-1.2.0/python/rlox/_rlox_core.pyi +1176 -0
- rlox-1.2.0/python/rlox/algorithms/__init__.py +69 -0
- rlox-1.2.0/python/rlox/algorithms/a2c.py +224 -0
- rlox-1.2.0/python/rlox/algorithms/awr.py +319 -0
- rlox-1.2.0/python/rlox/algorithms/bc.py +120 -0
- rlox-1.2.0/python/rlox/algorithms/best_of_n.py +77 -0
- rlox-1.2.0/python/rlox/algorithms/calql.py +486 -0
- rlox-1.2.0/python/rlox/algorithms/cql.py +247 -0
- rlox-1.2.0/python/rlox/algorithms/decision_transformer.py +478 -0
- rlox-1.2.0/python/rlox/algorithms/diffusion_policy.py +611 -0
- rlox-1.2.0/python/rlox/algorithms/dpo.py +136 -0
- rlox-1.2.0/python/rlox/algorithms/dqn.py +469 -0
- rlox-1.2.0/python/rlox/algorithms/dreamer.py +1134 -0
- rlox-1.2.0/python/rlox/algorithms/dtp.py +452 -0
- rlox-1.2.0/python/rlox/algorithms/grpo.py +185 -0
- rlox-1.2.0/python/rlox/algorithms/hybrid_ppo.py +309 -0
- rlox-1.2.0/python/rlox/algorithms/impala.py +557 -0
- rlox-1.2.0/python/rlox/algorithms/iql.py +219 -0
- rlox-1.2.0/python/rlox/algorithms/mappo.py +737 -0
- rlox-1.2.0/python/rlox/algorithms/mpo.py +434 -0
- rlox-1.2.0/python/rlox/algorithms/online_dpo.py +115 -0
- rlox-1.2.0/python/rlox/algorithms/ppo.py +269 -0
- rlox-1.2.0/python/rlox/algorithms/qmix.py +488 -0
- rlox-1.2.0/python/rlox/algorithms/sac.py +423 -0
- rlox-1.2.0/python/rlox/algorithms/td3.py +397 -0
- rlox-1.2.0/python/rlox/algorithms/td3_bc.py +177 -0
- rlox-1.2.0/python/rlox/algorithms/trpo.py +405 -0
- rlox-1.2.0/python/rlox/algorithms/vpg.py +333 -0
- rlox-1.2.0/python/rlox/augmentation.py +52 -0
- rlox-1.2.0/python/rlox/batch.py +102 -0
- rlox-1.2.0/python/rlox/builders.py +317 -0
- rlox-1.2.0/python/rlox/callbacks.py +446 -0
- rlox-1.2.0/python/rlox/checkpoint.py +97 -0
- rlox-1.2.0/python/rlox/collectors.py +303 -0
- rlox-1.2.0/python/rlox/compat/__init__.py +0 -0
- rlox-1.2.0/python/rlox/compat/sb3.py +426 -0
- rlox-1.2.0/python/rlox/compile.py +124 -0
- rlox-1.2.0/python/rlox/config.py +1215 -0
- rlox-1.2.0/python/rlox/dashboard.py +607 -0
- rlox-1.2.0/python/rlox/deploy/__init__.py +15 -0
- rlox-1.2.0/python/rlox/deploy/docker.py +189 -0
- rlox-1.2.0/python/rlox/deploy/sagemaker.py +117 -0
- rlox-1.2.0/python/rlox/diagnostics.py +91 -0
- rlox-1.2.0/python/rlox/distributed/__init__.py +29 -0
- rlox-1.2.0/python/rlox/distributed/multi_gpu.py +251 -0
- rlox-1.2.0/python/rlox/distributed/pipeline.py +149 -0
- rlox-1.2.0/python/rlox/distributed/remote_env.py +563 -0
- rlox-1.2.0/python/rlox/distributed/vllm_backend.py +223 -0
- rlox-1.2.0/python/rlox/evaluation.py +352 -0
- rlox-1.2.0/python/rlox/experiment.py +115 -0
- rlox-1.2.0/python/rlox/exploration/__init__.py +14 -0
- rlox-1.2.0/python/rlox/exploration/go_explore.py +145 -0
- rlox-1.2.0/python/rlox/exploration/noise.py +145 -0
- rlox-1.2.0/python/rlox/gpu_buffer.py +199 -0
- rlox-1.2.0/python/rlox/gym_vec_env.py +145 -0
- rlox-1.2.0/python/rlox/hub.py +249 -0
- rlox-1.2.0/python/rlox/intrinsic/__init__.py +10 -0
- rlox-1.2.0/python/rlox/intrinsic/icm.py +214 -0
- rlox-1.2.0/python/rlox/intrinsic/rnd.py +97 -0
- rlox-1.2.0/python/rlox/llm/__init__.py +15 -0
- rlox-1.2.0/python/rlox/llm/environment.py +48 -0
- rlox-1.2.0/python/rlox/llm/reward_models.py +94 -0
- rlox-1.2.0/python/rlox/logging.py +94 -0
- rlox-1.2.0/python/rlox/losses.py +206 -0
- rlox-1.2.0/python/rlox/meta/__init__.py +9 -0
- rlox-1.2.0/python/rlox/meta/reptile.py +141 -0
- rlox-1.2.0/python/rlox/networks.py +177 -0
- rlox-1.2.0/python/rlox/off_policy_collector.py +249 -0
- rlox-1.2.0/python/rlox/offline/__init__.py +5 -0
- rlox-1.2.0/python/rlox/offline/base.py +91 -0
- rlox-1.2.0/python/rlox/offline_to_online.py +92 -0
- rlox-1.2.0/python/rlox/pbt.py +162 -0
- rlox-1.2.0/python/rlox/plugins.py +213 -0
- rlox-1.2.0/python/rlox/policies.py +298 -0
- rlox-1.2.0/python/rlox/protocols.py +393 -0
- rlox-1.2.0/python/rlox/reward_shaping.py +138 -0
- rlox-1.2.0/python/rlox/runner.py +124 -0
- rlox-1.2.0/python/rlox/self_play.py +121 -0
- rlox-1.2.0/python/rlox/trainer.py +316 -0
- rlox-1.2.0/python/rlox/trainers.py +107 -0
- rlox-1.2.0/python/rlox/utils.py +35 -0
- rlox-1.2.0/python/rlox/vec_normalize.py +288 -0
- rlox-1.2.0/python/rlox/wrappers/__init__.py +29 -0
- rlox-1.2.0/python/rlox/wrappers/language.py +186 -0
- rlox-1.2.0/python/rlox/wrappers/visual.py +322 -0
- rlox-1.2.0/python/rlox/zoo.py +212 -0
There are too many changes on this page to be displayed.
The number of changes on this page would crash your browser.
You can still verify the content by downloading the package file manually.