d9d 0.2.0__tar.gz → 0.2.1__tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (242) hide show
  1. {d9d-0.2.0 → d9d-0.2.1}/PKG-INFO +1 -1
  2. {d9d-0.2.0 → d9d-0.2.1}/d9d/loop/component/gradient_manager.py +5 -1
  3. {d9d-0.2.0 → d9d-0.2.1}/pyproject.toml +1 -1
  4. {d9d-0.2.0 → d9d-0.2.1}/LICENSE +0 -0
  5. {d9d-0.2.0 → d9d-0.2.1}/README.md +0 -0
  6. {d9d-0.2.0 → d9d-0.2.1}/d9d/__init__.py +0 -0
  7. {d9d-0.2.0 → d9d-0.2.1}/d9d/core/__init__.py +0 -0
  8. {d9d-0.2.0 → d9d-0.2.1}/d9d/core/autograd/__init__.py +0 -0
  9. {d9d-0.2.0 → d9d-0.2.1}/d9d/core/autograd/grad_context.py +0 -0
  10. {d9d-0.2.0 → d9d-0.2.1}/d9d/core/dist_context/__init__.py +0 -0
  11. {d9d-0.2.0 → d9d-0.2.1}/d9d/core/dist_context/configured.py +0 -0
  12. {d9d-0.2.0 → d9d-0.2.1}/d9d/core/dist_context/device_mesh_domains.py +0 -0
  13. {d9d-0.2.0 → d9d-0.2.1}/d9d/core/dist_context/log.py +0 -0
  14. {d9d-0.2.0 → d9d-0.2.1}/d9d/core/dist_context/params.py +0 -0
  15. {d9d-0.2.0 → d9d-0.2.1}/d9d/core/dist_ops/__init__.py +0 -0
  16. {d9d-0.2.0 → d9d-0.2.1}/d9d/core/dist_ops/object.py +0 -0
  17. {d9d-0.2.0 → d9d-0.2.1}/d9d/core/dist_ops/tensor.py +0 -0
  18. {d9d-0.2.0 → d9d-0.2.1}/d9d/core/protocol/__init__.py +0 -0
  19. {d9d-0.2.0 → d9d-0.2.1}/d9d/core/protocol/training.py +0 -0
  20. {d9d-0.2.0 → d9d-0.2.1}/d9d/core/sharding/__init__.py +0 -0
  21. {d9d-0.2.0 → d9d-0.2.1}/d9d/core/sharding/auto_spec.py +0 -0
  22. {d9d-0.2.0 → d9d-0.2.1}/d9d/core/sharding/shard.py +0 -0
  23. {d9d-0.2.0 → d9d-0.2.1}/d9d/core/sharding/spec.py +0 -0
  24. {d9d-0.2.0 → d9d-0.2.1}/d9d/core/sharding/unshard.py +0 -0
  25. {d9d-0.2.0 → d9d-0.2.1}/d9d/core/types/__init__.py +0 -0
  26. {d9d-0.2.0 → d9d-0.2.1}/d9d/core/types/data.py +0 -0
  27. {d9d-0.2.0 → d9d-0.2.1}/d9d/core/types/pytree.py +0 -0
  28. {d9d-0.2.0 → d9d-0.2.1}/d9d/dataset/__init__.py +0 -0
  29. {d9d-0.2.0 → d9d-0.2.1}/d9d/dataset/buffer_sorted.py +0 -0
  30. {d9d-0.2.0 → d9d-0.2.1}/d9d/dataset/padding.py +0 -0
  31. {d9d-0.2.0 → d9d-0.2.1}/d9d/dataset/sharded.py +0 -0
  32. {d9d-0.2.0 → d9d-0.2.1}/d9d/internals/__init__.py +0 -0
  33. {d9d-0.2.0 → d9d-0.2.1}/d9d/internals/determinism/__init__.py +0 -0
  34. {d9d-0.2.0 → d9d-0.2.1}/d9d/internals/determinism/seed.py +0 -0
  35. {d9d-0.2.0 → d9d-0.2.1}/d9d/internals/grad_norm/__init__.py +0 -0
  36. {d9d-0.2.0 → d9d-0.2.1}/d9d/internals/grad_norm/group.py +0 -0
  37. {d9d-0.2.0 → d9d-0.2.1}/d9d/internals/grad_norm/norm.py +0 -0
  38. {d9d-0.2.0 → d9d-0.2.1}/d9d/internals/grad_sync/__init__.py +0 -0
  39. {d9d-0.2.0 → d9d-0.2.1}/d9d/internals/grad_sync/bucket.py +0 -0
  40. {d9d-0.2.0 → d9d-0.2.1}/d9d/internals/grad_sync/placement_helper.py +0 -0
  41. {d9d-0.2.0 → d9d-0.2.1}/d9d/internals/grad_sync/synchronizer.py +0 -0
  42. {d9d-0.2.0 → d9d-0.2.1}/d9d/internals/pipeline_state/__init__.py +0 -0
  43. {d9d-0.2.0 → d9d-0.2.1}/d9d/internals/pipeline_state/api.py +0 -0
  44. {d9d-0.2.0 → d9d-0.2.1}/d9d/internals/pipeline_state/handler.py +0 -0
  45. {d9d-0.2.0 → d9d-0.2.1}/d9d/internals/pipeline_state/storage.py +0 -0
  46. {d9d-0.2.0 → d9d-0.2.1}/d9d/internals/profiling/__init__.py +0 -0
  47. {d9d-0.2.0 → d9d-0.2.1}/d9d/internals/profiling/profile.py +0 -0
  48. {d9d-0.2.0 → d9d-0.2.1}/d9d/internals/state/__init__.py +0 -0
  49. {d9d-0.2.0 → d9d-0.2.1}/d9d/internals/state/main_process.py +0 -0
  50. {d9d-0.2.0 → d9d-0.2.1}/d9d/kernel/__init__.py +0 -0
  51. {d9d-0.2.0 → d9d-0.2.1}/d9d/kernel/cce/__init__.py +0 -0
  52. {d9d-0.2.0 → d9d-0.2.1}/d9d/kernel/cce/cce.py +0 -0
  53. {d9d-0.2.0 → d9d-0.2.1}/d9d/kernel/cce/main.py +0 -0
  54. {d9d-0.2.0 → d9d-0.2.1}/d9d/kernel/general/__init__.py +0 -0
  55. {d9d-0.2.0 → d9d-0.2.1}/d9d/kernel/general/get_int_dtype.py +0 -0
  56. {d9d-0.2.0 → d9d-0.2.1}/d9d/kernel/gmm/__init__.py +0 -0
  57. {d9d-0.2.0 → d9d-0.2.1}/d9d/kernel/gmm/function.py +0 -0
  58. {d9d-0.2.0 → d9d-0.2.1}/d9d/kernel/moe/__init__.py +0 -0
  59. {d9d-0.2.0 → d9d-0.2.1}/d9d/kernel/moe/indices_to_multihot.py +0 -0
  60. {d9d-0.2.0 → d9d-0.2.1}/d9d/kernel/moe/permute_with_probs.py +0 -0
  61. {d9d-0.2.0 → d9d-0.2.1}/d9d/kernel/stochastic/__init__.py +0 -0
  62. {d9d-0.2.0 → d9d-0.2.1}/d9d/kernel/stochastic/adamw_step.py +0 -0
  63. {d9d-0.2.0 → d9d-0.2.1}/d9d/kernel/stochastic/copy.py +0 -0
  64. {d9d-0.2.0 → d9d-0.2.1}/d9d/kernel/stochastic/ops/__init__.py +0 -0
  65. {d9d-0.2.0 → d9d-0.2.1}/d9d/kernel/stochastic/ops/round.py +0 -0
  66. {d9d-0.2.0 → d9d-0.2.1}/d9d/kernel/swiglu/__init__.py +0 -0
  67. {d9d-0.2.0 → d9d-0.2.1}/d9d/kernel/swiglu/function.py +0 -0
  68. {d9d-0.2.0 → d9d-0.2.1}/d9d/kernel/swiglu/op.py +0 -0
  69. {d9d-0.2.0 → d9d-0.2.1}/d9d/loop/__init__.py +0 -0
  70. {d9d-0.2.0 → d9d-0.2.1}/d9d/loop/auto/__init__.py +0 -0
  71. {d9d-0.2.0 → d9d-0.2.1}/d9d/loop/auto/auto_lr_scheduler.py +0 -0
  72. {d9d-0.2.0 → d9d-0.2.1}/d9d/loop/auto/auto_optimizer.py +0 -0
  73. {d9d-0.2.0 → d9d-0.2.1}/d9d/loop/component/__init__.py +0 -0
  74. {d9d-0.2.0 → d9d-0.2.1}/d9d/loop/component/batch_maths.py +0 -0
  75. {d9d-0.2.0 → d9d-0.2.1}/d9d/loop/component/checkpointer.py +0 -0
  76. {d9d-0.2.0 → d9d-0.2.1}/d9d/loop/component/data_loader_factory.py +0 -0
  77. {d9d-0.2.0 → d9d-0.2.1}/d9d/loop/component/garbage_collector.py +0 -0
  78. {d9d-0.2.0 → d9d-0.2.1}/d9d/loop/component/gradient_clipper.py +0 -0
  79. {d9d-0.2.0 → d9d-0.2.1}/d9d/loop/component/job_logger.py +0 -0
  80. {d9d-0.2.0 → d9d-0.2.1}/d9d/loop/component/job_profiler.py +0 -0
  81. {d9d-0.2.0 → d9d-0.2.1}/d9d/loop/component/model_stage_exporter.py +0 -0
  82. {d9d-0.2.0 → d9d-0.2.1}/d9d/loop/component/model_stage_factory.py +0 -0
  83. {d9d-0.2.0 → d9d-0.2.1}/d9d/loop/component/optimizer_factory.py +0 -0
  84. {d9d-0.2.0 → d9d-0.2.1}/d9d/loop/component/pipeline_result_processing.py +0 -0
  85. {d9d-0.2.0 → d9d-0.2.1}/d9d/loop/component/stepper.py +0 -0
  86. {d9d-0.2.0 → d9d-0.2.1}/d9d/loop/component/task_operator.py +0 -0
  87. {d9d-0.2.0 → d9d-0.2.1}/d9d/loop/component/timeout_manager.py +0 -0
  88. {d9d-0.2.0 → d9d-0.2.1}/d9d/loop/config/__init__.py +0 -0
  89. {d9d-0.2.0 → d9d-0.2.1}/d9d/loop/config/config.py +0 -0
  90. {d9d-0.2.0 → d9d-0.2.1}/d9d/loop/config/types.py +0 -0
  91. {d9d-0.2.0 → d9d-0.2.1}/d9d/loop/control/__init__.py +0 -0
  92. {d9d-0.2.0 → d9d-0.2.1}/d9d/loop/control/dataset_provider.py +0 -0
  93. {d9d-0.2.0 → d9d-0.2.1}/d9d/loop/control/lr_scheduler_provider.py +0 -0
  94. {d9d-0.2.0 → d9d-0.2.1}/d9d/loop/control/model_provider.py +0 -0
  95. {d9d-0.2.0 → d9d-0.2.1}/d9d/loop/control/optimizer_provider.py +0 -0
  96. {d9d-0.2.0 → d9d-0.2.1}/d9d/loop/control/task.py +0 -0
  97. {d9d-0.2.0 → d9d-0.2.1}/d9d/loop/run/__init__.py +0 -0
  98. {d9d-0.2.0 → d9d-0.2.1}/d9d/loop/run/inference.py +0 -0
  99. {d9d-0.2.0 → d9d-0.2.1}/d9d/loop/run/train.py +0 -0
  100. {d9d-0.2.0 → d9d-0.2.1}/d9d/loop/state.py +0 -0
  101. {d9d-0.2.0 → d9d-0.2.1}/d9d/lr_scheduler/__init__.py +0 -0
  102. {d9d-0.2.0 → d9d-0.2.1}/d9d/lr_scheduler/piecewise/__init__.py +0 -0
  103. {d9d-0.2.0 → d9d-0.2.1}/d9d/lr_scheduler/piecewise/builder.py +0 -0
  104. {d9d-0.2.0 → d9d-0.2.1}/d9d/lr_scheduler/piecewise/config.py +0 -0
  105. {d9d-0.2.0 → d9d-0.2.1}/d9d/lr_scheduler/piecewise/curves.py +0 -0
  106. {d9d-0.2.0 → d9d-0.2.1}/d9d/lr_scheduler/piecewise/engine.py +0 -0
  107. {d9d-0.2.0 → d9d-0.2.1}/d9d/lr_scheduler/visualizer.py +0 -0
  108. {d9d-0.2.0 → d9d-0.2.1}/d9d/metric/__init__.py +0 -0
  109. {d9d-0.2.0 → d9d-0.2.1}/d9d/metric/abc.py +0 -0
  110. {d9d-0.2.0 → d9d-0.2.1}/d9d/metric/impl/__init__.py +0 -0
  111. {d9d-0.2.0 → d9d-0.2.1}/d9d/metric/impl/compose.py +0 -0
  112. {d9d-0.2.0 → d9d-0.2.1}/d9d/metric/impl/mean.py +0 -0
  113. {d9d-0.2.0 → d9d-0.2.1}/d9d/model_state/__init__.py +0 -0
  114. {d9d-0.2.0 → d9d-0.2.1}/d9d/model_state/io/__init__.py +0 -0
  115. {d9d-0.2.0 → d9d-0.2.1}/d9d/model_state/io/dto.py +0 -0
  116. {d9d-0.2.0 → d9d-0.2.1}/d9d/model_state/io/module_reader.py +0 -0
  117. {d9d-0.2.0 → d9d-0.2.1}/d9d/model_state/io/module_writer.py +0 -0
  118. {d9d-0.2.0 → d9d-0.2.1}/d9d/model_state/io/reader.py +0 -0
  119. {d9d-0.2.0 → d9d-0.2.1}/d9d/model_state/io/writer.py +0 -0
  120. {d9d-0.2.0 → d9d-0.2.1}/d9d/model_state/mapper/__init__.py +0 -0
  121. {d9d-0.2.0 → d9d-0.2.1}/d9d/model_state/mapper/abc.py +0 -0
  122. {d9d-0.2.0 → d9d-0.2.1}/d9d/model_state/mapper/adapters/__init__.py +0 -0
  123. {d9d-0.2.0 → d9d-0.2.1}/d9d/model_state/mapper/adapters/mapper.py +0 -0
  124. {d9d-0.2.0 → d9d-0.2.1}/d9d/model_state/mapper/adapters/module.py +0 -0
  125. {d9d-0.2.0 → d9d-0.2.1}/d9d/model_state/mapper/compose/__init__.py +0 -0
  126. {d9d-0.2.0 → d9d-0.2.1}/d9d/model_state/mapper/compose/helper.py +0 -0
  127. {d9d-0.2.0 → d9d-0.2.1}/d9d/model_state/mapper/compose/parallel.py +0 -0
  128. {d9d-0.2.0 → d9d-0.2.1}/d9d/model_state/mapper/compose/sequential.py +0 -0
  129. {d9d-0.2.0 → d9d-0.2.1}/d9d/model_state/mapper/compose/shard.py +0 -0
  130. {d9d-0.2.0 → d9d-0.2.1}/d9d/model_state/mapper/leaf/__init__.py +0 -0
  131. {d9d-0.2.0 → d9d-0.2.1}/d9d/model_state/mapper/leaf/dtensor.py +0 -0
  132. {d9d-0.2.0 → d9d-0.2.1}/d9d/model_state/mapper/leaf/identity.py +0 -0
  133. {d9d-0.2.0 → d9d-0.2.1}/d9d/model_state/mapper/leaf/rename.py +0 -0
  134. {d9d-0.2.0 → d9d-0.2.1}/d9d/model_state/mapper/leaf/select_child.py +0 -0
  135. {d9d-0.2.0 → d9d-0.2.1}/d9d/model_state/mapper/leaf/stack.py +0 -0
  136. {d9d-0.2.0 → d9d-0.2.1}/d9d/module/__init__.py +0 -0
  137. {d9d-0.2.0 → d9d-0.2.1}/d9d/module/base/__init__.py +0 -0
  138. {d9d-0.2.0 → d9d-0.2.1}/d9d/module/base/late_init.py +0 -0
  139. {d9d-0.2.0 → d9d-0.2.1}/d9d/module/block/__init__.py +0 -0
  140. {d9d-0.2.0 → d9d-0.2.1}/d9d/module/block/attention/__init__.py +0 -0
  141. {d9d-0.2.0 → d9d-0.2.1}/d9d/module/block/attention/grouped_query.py +0 -0
  142. {d9d-0.2.0 → d9d-0.2.1}/d9d/module/block/attention/sdpa/__init__.py +0 -0
  143. {d9d-0.2.0 → d9d-0.2.1}/d9d/module/block/attention/sdpa/flash.py +0 -0
  144. {d9d-0.2.0 → d9d-0.2.1}/d9d/module/block/embedding/__init__.py +0 -0
  145. {d9d-0.2.0 → d9d-0.2.1}/d9d/module/block/embedding/shard_token_embedding.py +0 -0
  146. {d9d-0.2.0 → d9d-0.2.1}/d9d/module/block/ffn/__init__.py +0 -0
  147. {d9d-0.2.0 → d9d-0.2.1}/d9d/module/block/ffn/swiglu.py +0 -0
  148. {d9d-0.2.0 → d9d-0.2.1}/d9d/module/block/head/__init__.py +0 -0
  149. {d9d-0.2.0 → d9d-0.2.1}/d9d/module/block/head/language_modelling.py +0 -0
  150. {d9d-0.2.0 → d9d-0.2.1}/d9d/module/block/hidden_states_aggregator/__init__.py +0 -0
  151. {d9d-0.2.0 → d9d-0.2.1}/d9d/module/block/hidden_states_aggregator/base.py +0 -0
  152. {d9d-0.2.0 → d9d-0.2.1}/d9d/module/block/hidden_states_aggregator/factory.py +0 -0
  153. {d9d-0.2.0 → d9d-0.2.1}/d9d/module/block/hidden_states_aggregator/mean.py +0 -0
  154. {d9d-0.2.0 → d9d-0.2.1}/d9d/module/block/hidden_states_aggregator/noop.py +0 -0
  155. {d9d-0.2.0 → d9d-0.2.1}/d9d/module/block/moe/__init__.py +0 -0
  156. {d9d-0.2.0 → d9d-0.2.1}/d9d/module/block/moe/communications/__init__.py +0 -0
  157. {d9d-0.2.0 → d9d-0.2.1}/d9d/module/block/moe/communications/base.py +0 -0
  158. {d9d-0.2.0 → d9d-0.2.1}/d9d/module/block/moe/communications/deepep.py +0 -0
  159. {d9d-0.2.0 → d9d-0.2.1}/d9d/module/block/moe/communications/naive.py +0 -0
  160. {d9d-0.2.0 → d9d-0.2.1}/d9d/module/block/moe/grouped_experts.py +0 -0
  161. {d9d-0.2.0 → d9d-0.2.1}/d9d/module/block/moe/grouped_linear.py +0 -0
  162. {d9d-0.2.0 → d9d-0.2.1}/d9d/module/block/moe/layer.py +0 -0
  163. {d9d-0.2.0 → d9d-0.2.1}/d9d/module/block/moe/router.py +0 -0
  164. {d9d-0.2.0 → d9d-0.2.1}/d9d/module/block/positional/__init__.py +0 -0
  165. {d9d-0.2.0 → d9d-0.2.1}/d9d/module/block/positional/rope.py +0 -0
  166. {d9d-0.2.0 → d9d-0.2.1}/d9d/module/model/__init__.py +0 -0
  167. {d9d-0.2.0 → d9d-0.2.1}/d9d/module/model/qwen3_moe/__init__.py +0 -0
  168. {d9d-0.2.0 → d9d-0.2.1}/d9d/module/model/qwen3_moe/decoder_layer.py +0 -0
  169. {d9d-0.2.0 → d9d-0.2.1}/d9d/module/model/qwen3_moe/model.py +0 -0
  170. {d9d-0.2.0 → d9d-0.2.1}/d9d/module/model/qwen3_moe/params.py +0 -0
  171. {d9d-0.2.0 → d9d-0.2.1}/d9d/module/parallelism/__init__.py +0 -0
  172. {d9d-0.2.0 → d9d-0.2.1}/d9d/module/parallelism/api/__init__.py +0 -0
  173. {d9d-0.2.0 → d9d-0.2.1}/d9d/module/parallelism/api/expert_parallel.py +0 -0
  174. {d9d-0.2.0 → d9d-0.2.1}/d9d/module/parallelism/api/fully_sharded.py +0 -0
  175. {d9d-0.2.0 → d9d-0.2.1}/d9d/module/parallelism/api/hybrid_sharded.py +0 -0
  176. {d9d-0.2.0 → d9d-0.2.1}/d9d/module/parallelism/api/replicate_parallel.py +0 -0
  177. {d9d-0.2.0 → d9d-0.2.1}/d9d/module/parallelism/model/__init__.py +0 -0
  178. {d9d-0.2.0 → d9d-0.2.1}/d9d/module/parallelism/model/qwen3_moe.py +0 -0
  179. {d9d-0.2.0 → d9d-0.2.1}/d9d/module/parallelism/style/__init__.py +0 -0
  180. {d9d-0.2.0 → d9d-0.2.1}/d9d/module/parallelism/style/shard_experts.py +0 -0
  181. {d9d-0.2.0 → d9d-0.2.1}/d9d/module/parallelism/style/to_local.py +0 -0
  182. {d9d-0.2.0 → d9d-0.2.1}/d9d/optim/__init__.py +0 -0
  183. {d9d-0.2.0 → d9d-0.2.1}/d9d/optim/stochastic/__init__.py +0 -0
  184. {d9d-0.2.0 → d9d-0.2.1}/d9d/optim/stochastic/adamw.py +0 -0
  185. {d9d-0.2.0 → d9d-0.2.1}/d9d/peft/__init__.py +0 -0
  186. {d9d-0.2.0 → d9d-0.2.1}/d9d/peft/all/__init__.py +0 -0
  187. {d9d-0.2.0 → d9d-0.2.1}/d9d/peft/all/config.py +0 -0
  188. {d9d-0.2.0 → d9d-0.2.1}/d9d/peft/all/method.py +0 -0
  189. {d9d-0.2.0 → d9d-0.2.1}/d9d/peft/applicator.py +0 -0
  190. {d9d-0.2.0 → d9d-0.2.1}/d9d/peft/base.py +0 -0
  191. {d9d-0.2.0 → d9d-0.2.1}/d9d/peft/full_tune/__init__.py +0 -0
  192. {d9d-0.2.0 → d9d-0.2.1}/d9d/peft/full_tune/config.py +0 -0
  193. {d9d-0.2.0 → d9d-0.2.1}/d9d/peft/full_tune/method.py +0 -0
  194. {d9d-0.2.0 → d9d-0.2.1}/d9d/peft/lora/__init__.py +0 -0
  195. {d9d-0.2.0 → d9d-0.2.1}/d9d/peft/lora/config.py +0 -0
  196. {d9d-0.2.0 → d9d-0.2.1}/d9d/peft/lora/layer.py +0 -0
  197. {d9d-0.2.0 → d9d-0.2.1}/d9d/peft/lora/method.py +0 -0
  198. {d9d-0.2.0 → d9d-0.2.1}/d9d/pipelining/__init__.py +0 -0
  199. {d9d-0.2.0 → d9d-0.2.1}/d9d/pipelining/api/__init__.py +0 -0
  200. {d9d-0.2.0 → d9d-0.2.1}/d9d/pipelining/api/module.py +0 -0
  201. {d9d-0.2.0 → d9d-0.2.1}/d9d/pipelining/api/schedule.py +0 -0
  202. {d9d-0.2.0 → d9d-0.2.1}/d9d/pipelining/api/sharding.py +0 -0
  203. {d9d-0.2.0 → d9d-0.2.1}/d9d/pipelining/api/types.py +0 -0
  204. {d9d-0.2.0 → d9d-0.2.1}/d9d/pipelining/factory/__init__.py +0 -0
  205. {d9d-0.2.0 → d9d-0.2.1}/d9d/pipelining/factory/config.py +0 -0
  206. {d9d-0.2.0 → d9d-0.2.1}/d9d/pipelining/factory/factory.py +0 -0
  207. {d9d-0.2.0 → d9d-0.2.1}/d9d/pipelining/factory/registry.py +0 -0
  208. {d9d-0.2.0 → d9d-0.2.1}/d9d/pipelining/infra/__init__.py +0 -0
  209. {d9d-0.2.0 → d9d-0.2.1}/d9d/pipelining/infra/schedule/__init__.py +0 -0
  210. {d9d-0.2.0 → d9d-0.2.1}/d9d/pipelining/infra/schedule/component/__init__.py +0 -0
  211. {d9d-0.2.0 → d9d-0.2.1}/d9d/pipelining/infra/schedule/component/program/__init__.py +0 -0
  212. {d9d-0.2.0 → d9d-0.2.1}/d9d/pipelining/infra/schedule/component/program/base.py +0 -0
  213. {d9d-0.2.0 → d9d-0.2.1}/d9d/pipelining/infra/schedule/component/program/communications.py +0 -0
  214. {d9d-0.2.0 → d9d-0.2.1}/d9d/pipelining/infra/schedule/component/program/topology.py +0 -0
  215. {d9d-0.2.0 → d9d-0.2.1}/d9d/pipelining/infra/schedule/component/runtime/__init__.py +0 -0
  216. {d9d-0.2.0 → d9d-0.2.1}/d9d/pipelining/infra/schedule/component/runtime/action.py +0 -0
  217. {d9d-0.2.0 → d9d-0.2.1}/d9d/pipelining/infra/schedule/component/runtime/callback.py +0 -0
  218. {d9d-0.2.0 → d9d-0.2.1}/d9d/pipelining/infra/schedule/component/runtime/communications.py +0 -0
  219. {d9d-0.2.0 → d9d-0.2.1}/d9d/pipelining/infra/schedule/component/runtime/executor.py +0 -0
  220. {d9d-0.2.0 → d9d-0.2.1}/d9d/pipelining/infra/schedule/component/runtime/offline.py +0 -0
  221. {d9d-0.2.0 → d9d-0.2.1}/d9d/pipelining/infra/schedule/program/__init__.py +0 -0
  222. {d9d-0.2.0 → d9d-0.2.1}/d9d/pipelining/infra/schedule/program/bfs.py +0 -0
  223. {d9d-0.2.0 → d9d-0.2.1}/d9d/pipelining/infra/schedule/program/dualpipev.py +0 -0
  224. {d9d-0.2.0 → d9d-0.2.1}/d9d/pipelining/infra/schedule/program/interleaved.py +0 -0
  225. {d9d-0.2.0 → d9d-0.2.1}/d9d/pipelining/infra/schedule/program/zerobubblev.py +0 -0
  226. {d9d-0.2.0 → d9d-0.2.1}/d9d/pipelining/infra/stage/__init__.py +0 -0
  227. {d9d-0.2.0 → d9d-0.2.1}/d9d/pipelining/infra/stage/communications.py +0 -0
  228. {d9d-0.2.0 → d9d-0.2.1}/d9d/pipelining/infra/stage/computations.py +0 -0
  229. {d9d-0.2.0 → d9d-0.2.1}/d9d/pipelining/infra/stage/splitgrad.py +0 -0
  230. {d9d-0.2.0 → d9d-0.2.1}/d9d/pipelining/infra/stage/stage.py +0 -0
  231. {d9d-0.2.0 → d9d-0.2.1}/d9d/pipelining/infra/stage/struct_helper.py +0 -0
  232. {d9d-0.2.0 → d9d-0.2.1}/d9d/pipelining/training/__init__.py +0 -0
  233. {d9d-0.2.0 → d9d-0.2.1}/d9d/pipelining/training/optimizer.py +0 -0
  234. {d9d-0.2.0 → d9d-0.2.1}/d9d/pipelining/training/scheduler.py +0 -0
  235. {d9d-0.2.0 → d9d-0.2.1}/d9d/tracker/__init__.py +0 -0
  236. {d9d-0.2.0 → d9d-0.2.1}/d9d/tracker/base.py +0 -0
  237. {d9d-0.2.0 → d9d-0.2.1}/d9d/tracker/factory.py +0 -0
  238. {d9d-0.2.0 → d9d-0.2.1}/d9d/tracker/provider/__init__.py +0 -0
  239. {d9d-0.2.0 → d9d-0.2.1}/d9d/tracker/provider/aim/__init__.py +0 -0
  240. {d9d-0.2.0 → d9d-0.2.1}/d9d/tracker/provider/aim/config.py +0 -0
  241. {d9d-0.2.0 → d9d-0.2.1}/d9d/tracker/provider/aim/tracker.py +0 -0
  242. {d9d-0.2.0 → d9d-0.2.1}/d9d/tracker/provider/null.py +0 -0
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.4
2
2
  Name: d9d
3
- Version: 0.2.0
3
+ Version: 0.2.1
4
4
  Summary: d9d - d[istribute]d - distributed training framework based on PyTorch that tries to be efficient yet hackable
5
5
  License: Apache-2.0
6
6
  License-File: LICENSE
@@ -78,8 +78,12 @@ class GradientManager:
78
78
  self._grads_to_scale = None
79
79
 
80
80
  def _scale_grads(self):
81
+ if self._grads_to_scale is None:
82
+ raise ValueError("You should bind the manager first.")
83
+
81
84
  scale_factor = 1.0 / self._loss.accumulated_weight
82
- torch._foreach_mul_(self._grads_to_scale, scale_factor)
85
+ if len(self._grads_to_scale) > 0:
86
+ torch._foreach_mul_(self._grads_to_scale, scale_factor)
83
87
 
84
88
  @contextmanager
85
89
  def install(self):
@@ -1,6 +1,6 @@
1
1
  [project]
2
2
  name = "d9d"
3
- version = "0.2.0"
3
+ version = "0.2.1"
4
4
  description = "d9d - d[istribute]d - distributed training framework based on PyTorch that tries to be efficient yet hackable"
5
5
  authors = [
6
6
  {name = "Maksim Afanasyev", email = "mr.applexz@gmail.com"}
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes