returnn 1.20241022.173306__tar.gz → 1.20241023.94437__tar.gz
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Potentially problematic release.
This version of returnn might be problematic. Click here for more details.
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/PKG-INFO +1 -1
- returnn-1.20241023.94437/_setup_info_generated.py +2 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/frontend/audio/mel.py +4 -1
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/frontend/decoder/transformer.py +2 -6
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/frontend/dtype.py +35 -1
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/tensor/utils.py +3 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/torch/data/extern_data.py +8 -1
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/torch/engine.py +55 -18
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/torch/frontend/_backend.py +10 -1
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/torch/util/exception_helper.py +4 -1
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn.egg-info/PKG-INFO +1 -1
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/tests/test_rf_base.py +28 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/tests/test_torch_engine.py +27 -0
- returnn-1.20241022.173306/_setup_info_generated.py +0 -2
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/.editorconfig +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/.gitignore +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/.gitmodules +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/.kateconfig +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/CHANGELOG.md +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/CODEOWNERS +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/CONTRIBUTING.md +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/LICENSE +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/MANIFEST.in +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/README.rst +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/__init__.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/demos/12AX.cluster_map +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/demos/_setup_returnn_env.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/demos/demo-fwd.config +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/demos/demo-horovod-mpi.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/demos/demo-horovod-mpi.py.sh +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/demos/demo-horovod-mpi.sh +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/demos/demo-hyper-param-tuning.config +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/demos/demo-iter-dataset.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/demos/demo-list-devices.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/demos/demo-lua-torch-layer.config +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/demos/demo-pretrain.config +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/demos/demo-record-and-push-to-webserver.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/demos/demo-returnn-as-framework.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/demos/demo-rf-pt-benchmark.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/demos/demo-rf.config +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/demos/demo-rhn-enwik8.config +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/demos/demo-sprint-interface.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/demos/demo-tf-att-copy.config +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/demos/demo-tf-attention.config +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/demos/demo-tf-chunking-blstm.12ax.config +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/demos/demo-tf-contribrnn-lstm.12ax.config +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/demos/demo-tf-enc-dec.config +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/demos/demo-tf-hard-att-copy.config +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/demos/demo-tf-lstm-benchmark.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/demos/demo-tf-maxgradnorm-lstm.12ax.config +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/demos/demo-tf-native-lstm-lowmem.12ax.config +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/demos/demo-tf-native-lstm.12ax.config +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/demos/demo-tf-native-lstm2.12ax.config +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/demos/demo-tf-native-lstm2.12ax.tuned.config +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/demos/demo-tf-neural-transducer.12ax.config +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/demos/demo-tf-rec-explicit-lstm.config +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/demos/demo-tf-rec-explicit-rnn.config +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/demos/demo-tf-rec-self-att.config +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/demos/demo-tf-search-compiled-graph.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/demos/demo-tf-vanilla-lstm.12ax.config +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/demos/demo-timit-lstm-ctc.config +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/demos/demo-torch.config +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/demos/demo-upd-mult-model.lstm.12ax.config +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/demos/demo.sh +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/demos/mdlstm/IAM/IAM_lines/a01-000u-00.png +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/demos/mdlstm/IAM/IAM_lines/a01-007-04.png +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/demos/mdlstm/IAM/IAM_lines/a01-007-06.png +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/demos/mdlstm/IAM/README.txt +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/demos/mdlstm/IAM/chars.txt +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/demos/mdlstm/IAM/config_demo +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/demos/mdlstm/IAM/config_fwd +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/demos/mdlstm/IAM/config_real +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/demos/mdlstm/IAM/create_IAM_dataset.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/demos/mdlstm/IAM/decode.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/demos/mdlstm/IAM/features/raw/demo.h5 +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/demos/mdlstm/IAM/go.sh +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/demos/mdlstm/IAM/lines.txt +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/demos/mdlstm/IAM/split/eval.txt +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/demos/mdlstm/IAM/split/train.txt +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/demos/mdlstm/IAM/split/valid.txt +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/demos/mdlstm/README.md +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/demos/mdlstm/artificial/create_test_h5.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/demos/mdlstm/artificial/forwardconfig +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/demos/mdlstm/artificial/go.sh +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/demos/mdlstm/artificial/trainconfig +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/demos/mdlstm/artificial_rgb/create_test_h5.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/demos/mdlstm/artificial_rgb/forwardconfig +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/demos/mdlstm/artificial_rgb/go.sh +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/demos/mdlstm/artificial_rgb/trainconfig +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/pyproject.toml +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/requirements.txt +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/__init__.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/__main__.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/__old_mod_loader__.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/__setup__.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/config.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/datasets/__init__.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/datasets/audio.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/datasets/basic.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/datasets/bundle_file.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/datasets/cached.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/datasets/cached2.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/datasets/distrib_files.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/datasets/generating.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/datasets/hdf.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/datasets/lm.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/datasets/map.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/datasets/meta.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/datasets/multi_proc.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/datasets/normalization_data.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/datasets/numpy_dump.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/datasets/postprocessing.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/datasets/raw_wav.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/datasets/sprint.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/datasets/stereo.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/datasets/util/__init__.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/datasets/util/feature_extraction.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/datasets/util/strings.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/datasets/util/vocabulary.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/engine/__init__.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/engine/base.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/engine/batch.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/extern/WarpRna/__init__.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/extern/WarpRna/__main__.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/extern/WarpRna/warp-rna/.git +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/extern/WarpRna/warp-rna/.gitignore +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/extern/WarpRna/warp-rna/LICENSE +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/extern/WarpRna/warp-rna/README.md +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/extern/WarpRna/warp-rna/aligner.gif +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/extern/WarpRna/warp-rna/check.png +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/extern/WarpRna/warp-rna/core.cu +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/extern/WarpRna/warp-rna/core.h +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/extern/WarpRna/warp-rna/core_cpu.cpp +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/extern/WarpRna/warp-rna/pytorch_binding/LICENSE +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/extern/WarpRna/warp-rna/pytorch_binding/MANIFEST.in +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/extern/WarpRna/warp-rna/pytorch_binding/README.md +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/extern/WarpRna/warp-rna/pytorch_binding/binding.cpp +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/extern/WarpRna/warp-rna/pytorch_binding/core.cu +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/extern/WarpRna/warp-rna/pytorch_binding/core.h +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/extern/WarpRna/warp-rna/pytorch_binding/requirements.txt +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/extern/WarpRna/warp-rna/pytorch_binding/setup.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/extern/WarpRna/warp-rna/pytorch_binding/warp_rna/__init__.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/extern/WarpRna/warp-rna/pytorch_binding/warp_rna/test.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/extern/WarpRna/warp-rna/ref_rna.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/extern/WarpRna/warp-rna/tensorflow_binding/setup.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/extern/WarpRna/warp-rna/tensorflow_binding/src/warp_rna_op.cc +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/extern/WarpRna/warp-rna/tensorflow_binding/src/warp_rna_op_kernel_tmpl.h +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/extern/WarpRna/warp-rna/tensorflow_binding/warp_rna/__init__.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/extern/WarpRna/warp-rna/test.cpp +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/extern/__init__.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/extern/graph_editor/README.md +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/extern/graph_editor/__init__.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/extern/graph_editor/edit.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/extern/graph_editor/reroute.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/extern/graph_editor/select.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/extern/graph_editor/subgraph.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/extern/graph_editor/transform.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/extern/graph_editor/util.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/forward_iface.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/frontend/__init__.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/frontend/_backend.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/frontend/_native/__init__.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/frontend/_native/backend.cpp +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/frontend/_native/backend.hpp +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/frontend/_native/module.cpp +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/frontend/_native/module.hpp +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/frontend/_native/py_utils.hpp +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/frontend/_native/tensor_ops.cpp +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/frontend/_native/tensor_ops.hpp +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/frontend/_numpy_backend.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/frontend/_random_journal.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/frontend/_utils.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/frontend/array_.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/frontend/attention.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/frontend/audio/__init__.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/frontend/audio/specaugment.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/frontend/backend.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/frontend/build_from_dict.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/frontend/cond.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/frontend/const.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/frontend/container.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/frontend/control_flow_ctx.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/frontend/conv.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/frontend/conversions/__init__.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/frontend/conversions/espnet_e_branchformer.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/frontend/conversions/hf_llama.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/frontend/conversions/torch_nn.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/frontend/decoder/__init__.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/frontend/device.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/frontend/dims.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/frontend/dropout.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/frontend/encoder/__init__.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/frontend/encoder/base.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/frontend/encoder/conformer.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/frontend/encoder/e_branchformer.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/frontend/encoder/transformer.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/frontend/gradient.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/frontend/graph.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/frontend/hooks.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/frontend/init.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/frontend/label_smoothing.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/frontend/linear.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/frontend/loop.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/frontend/loss.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/frontend/math_.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/frontend/matmul.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/frontend/module.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/frontend/normalization.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/frontend/parameter.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/frontend/parametrizations.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/frontend/parametrize.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/frontend/piecewise_linear.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/frontend/rand.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/frontend/rec.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/frontend/reduce.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/frontend/run_ctx.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/frontend/signal.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/frontend/state.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/frontend/stepwise_scheduler.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/frontend/tensor_array.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/frontend/types.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/import_/__init__.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/import_/common.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/import_/git.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/import_/import_.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/learning_rate_control.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/log.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/native_op.cpp +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/native_op.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/pretrain.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/sprint/__init__.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/sprint/cache.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/sprint/control.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/sprint/error_signals.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/sprint/extern_interface.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/sprint/interface.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/tensor/README.md +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/tensor/__init__.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/tensor/_dim_extra.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/tensor/_tensor_extra.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/tensor/_tensor_mixin_base.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/tensor/_tensor_op_overloads.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/tensor/control_flow_ctx.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/tensor/dim.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/tensor/marked_dim.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/tensor/tensor.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/tensor/tensor_dict.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/tf/__init__.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/tf/compat.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/tf/data_pipeline.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/tf/distributed.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/tf/engine.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/tf/frontend_layers/README.md +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/tf/frontend_layers/__init__.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/tf/frontend_layers/_backend.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/tf/frontend_layers/_utils.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/tf/frontend_layers/cond.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/tf/frontend_layers/config_entry_points.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/tf/frontend_layers/debug_eager_mode.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/tf/frontend_layers/dims.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/tf/frontend_layers/layer.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/tf/frontend_layers/loop.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/tf/frontend_layers/make_layer.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/tf/frontend_layers/masked_computation.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/tf/frontend_layers/parameter_assign.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/tf/frontend_layers/prev_tensor_ref.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/tf/frontend_low_level/__init__.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/tf/frontend_low_level/_backend.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/tf/horovod.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/tf/hyper_param_tuning.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/tf/layers/__init__.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/tf/layers/base.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/tf/layers/basic.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/tf/layers/rec.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/tf/layers/segmental_model.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/tf/layers/signal_processing.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/tf/layers/variable.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/tf/native_op.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/tf/network.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/tf/sprint.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/tf/updater.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/tf/util/__init__.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/tf/util/basic.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/tf/util/data.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/tf/util/gradient_checkpoint.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/tf/util/ken_lm.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/tf/util/open_fst.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/torch/README.md +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/torch/__init__.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/torch/data/__init__.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/torch/data/pipeline.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/torch/data/queued_data_iter.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/torch/data/returnn_dataset_wrapper.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/torch/data/tensor_utils.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/torch/distributed.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/torch/frontend/__init__.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/torch/frontend/_rand.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/torch/frontend/bridge.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/torch/frontend/raw_ops.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/torch/optim/README.md +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/torch/optim/__init__.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/torch/optim/lion.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/torch/updater.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/torch/util/README.md +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/torch/util/__init__.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/torch/util/array_.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/torch/util/diagnose_gpu.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/torch/util/gradient_checkpoint.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/torch/util/module.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/torch/util/scaled_gradient.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/util/__init__.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/util/basic.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/util/better_exchook.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/util/bpe.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/util/debug.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/util/debug_helpers.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/util/file_cache.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/util/fsa.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/util/literal_py_to_pickle.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/util/math.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/util/multi_proc_non_daemonic_spawn.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/util/native_code_compiler.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/util/pprint.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/util/py-to-pickle.cpp +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/util/py_compat.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/util/py_ext_mod_compiler.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/util/result_with_reason.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/util/sig_proc.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/util/task_system.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/util/train_proc_manager.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/util/watch_memory.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn.egg-info/SOURCES.txt +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn.egg-info/dependency_links.txt +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn.egg-info/top_level.txt +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/rnn.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/setup.cfg +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/setup.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/tests/DummySprintExec.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/tests/PyCharm-inspection-profile.xml +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/tests/PyCharm.idea/.gitignore +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/tests/PyCharm.idea/.name +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/tests/PyCharm.idea/codeStyleSettings.xml +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/tests/PyCharm.idea/codeStyles/Project.xml +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/tests/PyCharm.idea/codeStyles/codeStyleConfig.xml +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/tests/PyCharm.idea/inspectionProfiles/Project_Default.xml +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/tests/PyCharm.idea/inspectionProfiles/profiles_settings.xml +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/tests/PyCharm.idea/misc.xml +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/tests/PyCharm.idea/modules.xml +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/tests/PyCharm.idea/returnn.iml +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/tests/PyCharm.idea/scopes/scope_settings.xml +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/tests/_set_num_threads1.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/tests/_setup_returnn_env.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/tests/_setup_test_env.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/tests/bpe-unicode-demo.codes +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/tests/bpe-unicode-demo.vocab +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/tests/lexicon_opt.fst +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/tests/lexicon_opt.isyms +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/tests/lexicon_opt.jpg +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/tests/lexicon_opt.osyms +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/tests/lint_common.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/tests/pycharm-inspect.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/tests/pylint.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/tests/returnn-as-framework.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/tests/rf_utils.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/tests/spelling.dic +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/tests/test_Config.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/tests/test_Dataset.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/tests/test_Fsa.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/tests/test_GeneratingDataset.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/tests/test_HDFDataset.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/tests/test_LearningRateControl.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/tests/test_Log.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/tests/test_MultiProcDataset.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/tests/test_Pretrain.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/tests/test_ResNet.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/tests/test_SprintDataset.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/tests/test_SprintInterface.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/tests/test_TFEngine.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/tests/test_TFNativeOp.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/tests/test_TFNetworkLayer.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/tests/test_TFNetworkRecLayer.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/tests/test_TFNetworkSigProcLayer.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/tests/test_TFUpdater.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/tests/test_TFUtil.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/tests/test_TF_determinism.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/tests/test_TaskSystem.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/tests/test_TaskSystem_SharedMem.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/tests/test_TranslationDataset.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/tests/test_Util.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/tests/test_demos.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/tests/test_fork_exec.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/tests/test_hdf_dump.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/tests/test_rf_array.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/tests/test_rf_attention.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/tests/test_rf_cond.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/tests/test_rf_const.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/tests/test_rf_container.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/tests/test_rf_conv.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/tests/test_rf_decoder_transformer.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/tests/test_rf_encoder_conformer.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/tests/test_rf_gradient.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/tests/test_rf_label_smoothing.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/tests/test_rf_loop.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/tests/test_rf_math.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/tests/test_rf_normalization.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/tests/test_rf_piecewise_linear.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/tests/test_rf_rec.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/tests/test_rf_reduce.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/tests/test_rf_signal.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/tests/test_tensor.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/tests/test_tools.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/tests/test_torch_dataset.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/tests/test_torch_frontend.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/tests/test_torch_internal_frontend.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/tests/test_torch_util.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/tests/torch_utils.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/tools/_setup_returnn_env.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/tools/analyze-dataset-batches.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/tools/bliss-collect-seq-lens.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/tools/bliss-dump-text.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/tools/bliss-get-segment-names.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/tools/bliss-to-ogg-zip.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/tools/bpe-create-lexicon.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/tools/calculate-word-error-rate.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/tools/cleanup-old-models.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/tools/collect-orth-symbols.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/tools/collect-words.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/tools/compile_native_op.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/tools/compile_tf_graph.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/tools/debug-dump-search-scores.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/tools/debug-plot-search-scores.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/tools/dump-dataset-raw-strings.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/tools/dump-dataset.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/tools/dump-forward-stats.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/tools/dump-forward.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/tools/dump-network-json.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/tools/dump-pickle.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/tools/extract_state_tying_from_dataset.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/tools/get-attention-weights.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/tools/get-best-model-epoch.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/tools/hdf_dump.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/tools/hdf_dump_translation_dataset.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/tools/import-blocks-mt-model.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/tools/import-t2t-mt-model.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/tools/lattice_rescorer/.gitignore +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/tools/lattice_rescorer/Makefile +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/tools/lattice_rescorer/README.md +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/tools/lattice_rescorer/example/README.md +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/tools/lattice_rescorer/example/libs_list +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/tools/lattice_rescorer/example/network.040/i600_m600_m600.sgd_b16_lr0_cl2.newbobabs.config +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/tools/lattice_rescorer/example/network.040/i600_m600_m600.sgd_b16_lr0_cl2.newbobabs.keep_over_epoch.lstm2.config +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/tools/lattice_rescorer/example/rescore_lattice.sh +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/tools/lattice_rescorer/example/state_vars_list +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/tools/lattice_rescorer/example/tensor_names_list +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/tools/lattice_rescorer/file.h +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/tools/lattice_rescorer/htklatticerescorer.cc +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/tools/lattice_rescorer/htklatticerescorer.h +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/tools/lattice_rescorer/main.cc +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/tools/lattice_rescorer/rescorer.h +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/tools/lattice_rescorer/vocabulary.cc +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/tools/lattice_rescorer/vocabulary.h +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/tools/tf_avg_checkpoints.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/tools/tf_inspect_checkpoint.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/tools/tf_inspect_summary_log.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/tools/torch_avg_checkpoints.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/tools/torch_export_to_onnx.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/tools/torch_inspect_checkpoint.py +0 -0
- {returnn-1.20241022.173306 → returnn-1.20241023.94437}/tools/torch_inspect_checkpoint_and_opt.py +0 -0
|
@@ -56,8 +56,8 @@ def mel_filterbank(
|
|
|
56
56
|
filter_bank_matrix_np = _mel_filter_bank_matrix_np(
|
|
57
57
|
f_min=f_min, f_max=f_max, sampling_rate=sampling_rate, fft_size=fft_length, nr_of_filters=out_dim.dimension
|
|
58
58
|
)
|
|
59
|
-
filter_bank_matrix_np = filter_bank_matrix_np.astype(x.dtype)
|
|
60
59
|
filter_bank_matrix = rf.convert_to_tensor(filter_bank_matrix_np, dims=(in_dim, out_dim), _backend=backend)
|
|
60
|
+
filter_bank_matrix = rf.cast(filter_bank_matrix, dtype=x.dtype)
|
|
61
61
|
filter_bank_matrix = rf.copy_to_device(filter_bank_matrix, x.device)
|
|
62
62
|
if backend.executing_eagerly():
|
|
63
63
|
if len(_mel_filter_bank_matrix_cache) > 100:
|
|
@@ -191,6 +191,9 @@ def log_mel_filterbank_from_raw(
|
|
|
191
191
|
fft_length=n_fft,
|
|
192
192
|
)
|
|
193
193
|
power_spectrogram = rf.abs(spectrogram) ** 2.0
|
|
194
|
+
# stft might have upcasted this to float32 because some PyTorch versions don't support stft on bfloat16.
|
|
195
|
+
# https://github.com/pytorch/pytorch/issues/117844
|
|
196
|
+
power_spectrogram = rf.cast(power_spectrogram, dtype=raw_audio.dtype)
|
|
194
197
|
mel_fbank = mel_filterbank(power_spectrogram, in_dim=in_dim_, out_dim=out_dim, sampling_rate=sampling_rate)
|
|
195
198
|
log_mel_fbank = rf.safe_log(mel_fbank, eps=1e-10)
|
|
196
199
|
if log_base != math.e:
|
{returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/frontend/decoder/transformer.py
RENAMED
|
@@ -101,15 +101,11 @@ class TransformerDecoder(rf.Module):
|
|
|
101
101
|
if pos_enc is None:
|
|
102
102
|
pass
|
|
103
103
|
elif isinstance(pos_enc, dict):
|
|
104
|
-
pos_enc = rf.build_from_dict(
|
|
105
|
-
pos_enc, feat_dim=embed_dim or model_dim, dtype=self.input_embedding.weight.dtype
|
|
106
|
-
)
|
|
104
|
+
pos_enc = rf.build_from_dict(pos_enc, feat_dim=embed_dim or model_dim)
|
|
107
105
|
elif isinstance(pos_enc, rf.Module):
|
|
108
106
|
pass
|
|
109
107
|
elif isinstance(pos_enc, FunctionType):
|
|
110
|
-
pos_enc = functools.partial(
|
|
111
|
-
pos_enc, feat_dim=embed_dim or model_dim, dtype=self.input_embedding.weight.dtype
|
|
112
|
-
)
|
|
108
|
+
pos_enc = functools.partial(pos_enc, feat_dim=embed_dim or model_dim)
|
|
113
109
|
else:
|
|
114
110
|
raise TypeError(f"unexpected pos_enc type {pos_enc!r}")
|
|
115
111
|
self.pos_enc = pos_enc
|
|
@@ -3,9 +3,17 @@ DType helpers
|
|
|
3
3
|
"""
|
|
4
4
|
|
|
5
5
|
from __future__ import annotations
|
|
6
|
+
from contextlib import contextmanager
|
|
6
7
|
|
|
7
8
|
|
|
8
|
-
__all__ = [
|
|
9
|
+
__all__ = [
|
|
10
|
+
"get_default_float_dtype",
|
|
11
|
+
"set_default_float_dtype",
|
|
12
|
+
"set_default_float_dtype_ctx",
|
|
13
|
+
"get_default_int_dtype",
|
|
14
|
+
"get_default_array_index_dtype",
|
|
15
|
+
"is_float_dtype",
|
|
16
|
+
]
|
|
9
17
|
|
|
10
18
|
|
|
11
19
|
_default_float_dtype: str = "float32"
|
|
@@ -21,6 +29,32 @@ def get_default_float_dtype() -> str:
|
|
|
21
29
|
return _default_float_dtype
|
|
22
30
|
|
|
23
31
|
|
|
32
|
+
def set_default_float_dtype(dtype: str):
|
|
33
|
+
"""
|
|
34
|
+
Set the default float dtype
|
|
35
|
+
|
|
36
|
+
:param dtype: the new default float dtype
|
|
37
|
+
"""
|
|
38
|
+
global _default_float_dtype
|
|
39
|
+
assert isinstance(dtype, str)
|
|
40
|
+
_default_float_dtype = dtype
|
|
41
|
+
|
|
42
|
+
|
|
43
|
+
@contextmanager
|
|
44
|
+
def set_default_float_dtype_ctx(dtype: str):
|
|
45
|
+
"""
|
|
46
|
+
:param dtype: see :func:`get_default_float_dtype`
|
|
47
|
+
"""
|
|
48
|
+
global _default_float_dtype
|
|
49
|
+
assert isinstance(dtype, str)
|
|
50
|
+
old_default_float_dtype = _default_float_dtype
|
|
51
|
+
try:
|
|
52
|
+
_default_float_dtype = dtype
|
|
53
|
+
yield
|
|
54
|
+
finally:
|
|
55
|
+
_default_float_dtype = old_default_float_dtype
|
|
56
|
+
|
|
57
|
+
|
|
24
58
|
def get_default_int_dtype() -> str:
|
|
25
59
|
"""
|
|
26
60
|
https://data-apis.org/array-api/latest/API_specification/data_types.html#default-data-types
|
|
@@ -104,6 +104,9 @@ def tensor_fill_random_numpy_(
|
|
|
104
104
|
x.raw_tensor = rnd.randint(0, 2, size=shape, dtype=x.dtype)
|
|
105
105
|
elif x.dtype.startswith("float"):
|
|
106
106
|
x.raw_tensor = rnd.normal(0.0, 1.0, size=shape).astype(x.dtype)
|
|
107
|
+
elif x.dtype == "bfloat16":
|
|
108
|
+
# Numpy does not support bfloat16, will later be casted to bfloat16
|
|
109
|
+
x.raw_tensor = rnd.normal(0.0, 1.0, size=shape).astype("float32")
|
|
107
110
|
elif x.dtype.startswith("complex"):
|
|
108
111
|
real = rnd.normal(0.0, 1.0, size=shape)
|
|
109
112
|
imag = rnd.normal(0.0, 1.0, size=shape)
|
|
@@ -3,7 +3,7 @@ From raw dict to extern_data tensor dict.
|
|
|
3
3
|
"""
|
|
4
4
|
|
|
5
5
|
from __future__ import annotations
|
|
6
|
-
from typing import Any, Union, Dict, List, Sequence
|
|
6
|
+
from typing import Optional, Any, Union, Dict, List, Sequence
|
|
7
7
|
import numpy
|
|
8
8
|
import torch
|
|
9
9
|
from returnn.tensor import Tensor, TensorDict, Dim
|
|
@@ -27,13 +27,18 @@ def raw_dict_to_extern_data(
|
|
|
27
27
|
*,
|
|
28
28
|
extern_data_template: TensorDict,
|
|
29
29
|
device: Union[str, torch.device],
|
|
30
|
+
float_dtype: Optional[Union[str, torch.dtype]] = None,
|
|
30
31
|
) -> TensorDict:
|
|
31
32
|
"""
|
|
32
33
|
:param extern_data_raw: This comes out of the DataLoader, via our collate_batch.
|
|
33
34
|
:param extern_data_template: Specified via `extern_data` in the config.
|
|
34
35
|
:param device: E.g. the GPU.
|
|
36
|
+
:param float_dtype:
|
|
35
37
|
:return: tensor dict, like extern_data_template, but with raw tensors set to Torch tensors, on the right device.
|
|
36
38
|
"""
|
|
39
|
+
if isinstance(float_dtype, str):
|
|
40
|
+
float_dtype = getattr(torch, float_dtype)
|
|
41
|
+
assert isinstance(float_dtype, torch.dtype)
|
|
37
42
|
assert isinstance(extern_data_raw, dict) and extern_data_raw
|
|
38
43
|
batch_dim = get_batch_dim_from_extern_data(extern_data_template)
|
|
39
44
|
for dim in _get_dyn_dims_from_extern_data(extern_data_template):
|
|
@@ -51,6 +56,8 @@ def raw_dict_to_extern_data(
|
|
|
51
56
|
dim.dimension == raw_tensor.shape[i]
|
|
52
57
|
), f"shape mismatch for {k}: {raw_tensor.shape} vs {data.batch_shape}"
|
|
53
58
|
if isinstance(raw_tensor, torch.Tensor):
|
|
59
|
+
if raw_tensor.dtype.is_floating_point and float_dtype:
|
|
60
|
+
raw_tensor = raw_tensor.to(dtype=float_dtype)
|
|
54
61
|
data.dtype = str(raw_tensor.dtype).split(".")[-1] # just overwrite for now...
|
|
55
62
|
data.raw_tensor = raw_tensor.to(device)
|
|
56
63
|
elif isinstance(raw_tensor, numpy.ndarray):
|
|
@@ -4,7 +4,7 @@ Main engine for PyTorch
|
|
|
4
4
|
|
|
5
5
|
from __future__ import annotations
|
|
6
6
|
from typing import Optional, Any, Union, Callable, Dict, Set
|
|
7
|
-
from contextlib import nullcontext
|
|
7
|
+
from contextlib import nullcontext, ExitStack, contextmanager
|
|
8
8
|
|
|
9
9
|
import gc
|
|
10
10
|
import os
|
|
@@ -129,6 +129,13 @@ class Engine(EngineBase):
|
|
|
129
129
|
self._forward_auto_split_batch_on_oom = config.bool("forward_auto_split_batch_on_oom", False)
|
|
130
130
|
self._stop_on_nonfinite_train_score = config.bool("stop_on_nonfinite_train_score", True)
|
|
131
131
|
|
|
132
|
+
default_float_dtype = config.value("default_float_dtype", None)
|
|
133
|
+
if default_float_dtype is not None:
|
|
134
|
+
assert isinstance(default_float_dtype, str)
|
|
135
|
+
default_float_dtype = getattr(torch, default_float_dtype)
|
|
136
|
+
assert isinstance(default_float_dtype, torch.dtype)
|
|
137
|
+
self._default_float_dtype: Optional[torch.dtype] = default_float_dtype
|
|
138
|
+
|
|
132
139
|
amp_options = self.config.opt_typed_value("torch_amp")
|
|
133
140
|
grad_scaler_opts = self.config.typed_value("grad_scaler", NotSpecified)
|
|
134
141
|
if amp_options is not None:
|
|
@@ -380,7 +387,10 @@ class Engine(EngineBase):
|
|
|
380
387
|
cur_count_grad_accum = 0
|
|
381
388
|
|
|
382
389
|
extern_data = extern_data_util.raw_dict_to_extern_data(
|
|
383
|
-
extern_data_raw,
|
|
390
|
+
extern_data_raw,
|
|
391
|
+
extern_data_template=self.extern_data,
|
|
392
|
+
device=self._device,
|
|
393
|
+
float_dtype=self._default_float_dtype,
|
|
384
394
|
)
|
|
385
395
|
self._run_step(extern_data, train_flag=True, train_func=True)
|
|
386
396
|
|
|
@@ -389,7 +399,7 @@ class Engine(EngineBase):
|
|
|
389
399
|
losses_dict = NumbersDict(
|
|
390
400
|
{
|
|
391
401
|
name: (
|
|
392
|
-
float(loss.get_summed_loss().raw_tensor.detach().cpu().
|
|
402
|
+
float(loss.get_summed_loss().raw_tensor.detach().cpu().item())
|
|
393
403
|
if self._device != "meta"
|
|
394
404
|
else float("nan")
|
|
395
405
|
)
|
|
@@ -553,7 +563,10 @@ class Engine(EngineBase):
|
|
|
553
563
|
torch.distributed.broadcast(_has_data, src=0)
|
|
554
564
|
|
|
555
565
|
extern_data = extern_data_util.raw_dict_to_extern_data(
|
|
556
|
-
extern_data_raw,
|
|
566
|
+
extern_data_raw,
|
|
567
|
+
extern_data_template=self.extern_data,
|
|
568
|
+
device=self._device,
|
|
569
|
+
float_dtype=self._default_float_dtype,
|
|
557
570
|
)
|
|
558
571
|
|
|
559
572
|
self._run_step(extern_data, train_func=True)
|
|
@@ -566,7 +579,7 @@ class Engine(EngineBase):
|
|
|
566
579
|
losses_dict = NumbersDict(
|
|
567
580
|
{
|
|
568
581
|
name: (
|
|
569
|
-
float(loss.get_summed_loss().raw_tensor.detach().cpu().
|
|
582
|
+
float(loss.get_summed_loss().raw_tensor.detach().cpu().item())
|
|
570
583
|
if self._device != "meta"
|
|
571
584
|
else float("nan")
|
|
572
585
|
)
|
|
@@ -686,6 +699,17 @@ class Engine(EngineBase):
|
|
|
686
699
|
|
|
687
700
|
return data_loader
|
|
688
701
|
|
|
702
|
+
@contextmanager
|
|
703
|
+
def _run_ctx_mgr(self):
|
|
704
|
+
with ExitStack() as stack:
|
|
705
|
+
if self._use_autocast:
|
|
706
|
+
stack.enter_context(autocast(device_type=self._device.split(":")[0], dtype=self._autocast_dtype))
|
|
707
|
+
stack.enter_context(rf.set_default_device_ctx(self._device))
|
|
708
|
+
if self._default_float_dtype:
|
|
709
|
+
stack.enter_context(rf.set_default_float_dtype_ctx(str(self._default_float_dtype).split(".")[-1]))
|
|
710
|
+
stack.enter_context(_set_torch_default_dtype_ctx_mgr(self._default_float_dtype))
|
|
711
|
+
yield
|
|
712
|
+
|
|
689
713
|
def _run_step(
|
|
690
714
|
self, extern_data: TensorDict, *, train_flag: bool = False, train_func: bool, _inside_wrapped: bool = False
|
|
691
715
|
):
|
|
@@ -706,11 +730,7 @@ class Engine(EngineBase):
|
|
|
706
730
|
expected_outputs=self._forward_step_expected_outputs, step=self.global_train_step, epoch=self.epoch
|
|
707
731
|
)
|
|
708
732
|
|
|
709
|
-
with (
|
|
710
|
-
autocast(device_type=self._device.split(":")[0], dtype=self._autocast_dtype)
|
|
711
|
-
if self._use_autocast
|
|
712
|
-
else nullcontext()
|
|
713
|
-
), rf.set_default_device_ctx(self._device):
|
|
733
|
+
with self._run_ctx_mgr():
|
|
714
734
|
sentinel_kw = util.get_fwd_compat_kwargs()
|
|
715
735
|
if train_func:
|
|
716
736
|
self._train_step_func(model=self._orig_model, extern_data=extern_data, **sentinel_kw)
|
|
@@ -893,6 +913,8 @@ class Engine(EngineBase):
|
|
|
893
913
|
)
|
|
894
914
|
)
|
|
895
915
|
|
|
916
|
+
if self._default_float_dtype:
|
|
917
|
+
self._pt_model.to(dtype=self._default_float_dtype)
|
|
896
918
|
self._pt_model.to(self._device)
|
|
897
919
|
|
|
898
920
|
if model_epoch_filename and is_training:
|
|
@@ -906,11 +928,7 @@ class Engine(EngineBase):
|
|
|
906
928
|
|
|
907
929
|
load_model_post_hooks = self.config.typed_value("load_model_post_hooks")
|
|
908
930
|
if load_model_post_hooks:
|
|
909
|
-
with (
|
|
910
|
-
autocast(device_type=self._device.split(":")[0], dtype=self._autocast_dtype)
|
|
911
|
-
if self._use_autocast
|
|
912
|
-
else nullcontext()
|
|
913
|
-
), rf.set_default_device_ctx(self._device):
|
|
931
|
+
with self._run_ctx_mgr():
|
|
914
932
|
sentinel_kw = util.get_fwd_compat_kwargs()
|
|
915
933
|
for hook in load_model_post_hooks:
|
|
916
934
|
hook(model=self._orig_model, **sentinel_kw)
|
|
@@ -1090,7 +1108,10 @@ class Engine(EngineBase):
|
|
|
1090
1108
|
# Currently, this callback interface is intended to also be used by other backends,
|
|
1091
1109
|
# and then the user can always assume Numpy arrays.
|
|
1092
1110
|
if isinstance(raw, torch.Tensor): # might already be numpy array
|
|
1093
|
-
raw = raw.detach().cpu()
|
|
1111
|
+
raw = raw.detach().cpu()
|
|
1112
|
+
if raw.dtype == torch.bfloat16:
|
|
1113
|
+
raw = raw.float()
|
|
1114
|
+
raw = raw.numpy()
|
|
1094
1115
|
y.raw_tensor = raw
|
|
1095
1116
|
return y
|
|
1096
1117
|
|
|
@@ -1120,7 +1141,10 @@ class Engine(EngineBase):
|
|
|
1120
1141
|
# Also resets any dyn dims, which might have been set in the prev step.
|
|
1121
1142
|
self._forward_step_expected_outputs.reset_content()
|
|
1122
1143
|
extern_data = extern_data_util.raw_dict_to_extern_data(
|
|
1123
|
-
extern_data_raw,
|
|
1144
|
+
extern_data_raw,
|
|
1145
|
+
extern_data_template=self.extern_data,
|
|
1146
|
+
device=self._device,
|
|
1147
|
+
float_dtype=self._default_float_dtype,
|
|
1124
1148
|
)
|
|
1125
1149
|
try:
|
|
1126
1150
|
self._run_step(extern_data, train_func=False)
|
|
@@ -1224,7 +1248,10 @@ def _to_raw(n: Union[int, float, Tensor]):
|
|
|
1224
1248
|
if isinstance(n, (int, float)):
|
|
1225
1249
|
return n
|
|
1226
1250
|
if isinstance(n, Tensor):
|
|
1227
|
-
|
|
1251
|
+
x = n.raw_tensor.detach().cpu()
|
|
1252
|
+
if x.dtype == torch.bfloat16:
|
|
1253
|
+
x = x.float()
|
|
1254
|
+
return x.numpy()
|
|
1228
1255
|
raise TypeError(f"Unexpected {n} of type {type(n)}")
|
|
1229
1256
|
|
|
1230
1257
|
|
|
@@ -1382,3 +1409,13 @@ class _WrappedModuleRunStep(torch.nn.Module):
|
|
|
1382
1409
|
for name, loss in ctx.losses.items():
|
|
1383
1410
|
res["loss/" + name] = loss.loss.raw_tensor
|
|
1384
1411
|
return res
|
|
1412
|
+
|
|
1413
|
+
|
|
1414
|
+
@contextmanager
|
|
1415
|
+
def _set_torch_default_dtype_ctx_mgr(dtype: torch.dtype):
|
|
1416
|
+
old_dtype = torch.get_default_dtype()
|
|
1417
|
+
try:
|
|
1418
|
+
torch.set_default_dtype(dtype)
|
|
1419
|
+
yield
|
|
1420
|
+
finally:
|
|
1421
|
+
torch.set_default_dtype(old_dtype)
|
|
@@ -676,6 +676,9 @@ class TorchBackend(Backend[torch.Tensor]):
|
|
|
676
676
|
if len(batch_dims) != 1:
|
|
677
677
|
targets_raw = torch.reshape(targets_raw, (batch_n_elems, targets_raw.shape[-1])) # [B', S]
|
|
678
678
|
targets_lengths = torch.reshape(targets_lengths, (batch_n_elems,)) # [B']
|
|
679
|
+
if log_probs.dtype == torch.bfloat16:
|
|
680
|
+
# Currently (PyTorch 2.5), ctc_loss does not support bfloat16.
|
|
681
|
+
log_probs = log_probs.to(torch.float32)
|
|
679
682
|
loss_raw = torch.nn.functional.ctc_loss(
|
|
680
683
|
log_probs=log_probs,
|
|
681
684
|
targets=targets_raw,
|
|
@@ -691,7 +694,7 @@ class TorchBackend(Backend[torch.Tensor]):
|
|
|
691
694
|
name="ctc_loss",
|
|
692
695
|
dims=batch_dims,
|
|
693
696
|
raw_tensor=loss_raw,
|
|
694
|
-
dtype=
|
|
697
|
+
dtype=TorchBackend.get_dtype_name_raw(loss_raw),
|
|
695
698
|
)
|
|
696
699
|
return loss
|
|
697
700
|
|
|
@@ -2039,6 +2042,12 @@ class TorchBackend(Backend[torch.Tensor]):
|
|
|
2039
2042
|
pad_right = fft_length - frame_length - pad_left
|
|
2040
2043
|
window_pt = torch.nn.functional.pad(window_pt, (pad_left, pad_right))
|
|
2041
2044
|
|
|
2045
|
+
orig_dtype = x_raw.dtype
|
|
2046
|
+
if orig_dtype == torch.bfloat16:
|
|
2047
|
+
# PyTorch stft does not support bfloat16 currently (PyTorch 2.5):
|
|
2048
|
+
# https://github.com/pytorch/pytorch/issues/117844
|
|
2049
|
+
# (Check back later here whether that's still the case...)
|
|
2050
|
+
x_raw = x_raw.to(torch.float32)
|
|
2042
2051
|
y_raw = torch.stft(
|
|
2043
2052
|
x_raw,
|
|
2044
2053
|
n_fft=fft_length,
|
{returnn-1.20241022.173306 → returnn-1.20241023.94437}/returnn/torch/util/exception_helper.py
RENAMED
|
@@ -86,7 +86,10 @@ def _help_data_or_array(
|
|
|
86
86
|
:return: (info,(min,max))
|
|
87
87
|
"""
|
|
88
88
|
if isinstance(value, torch.Tensor):
|
|
89
|
-
value = value.detach().cpu()
|
|
89
|
+
value = value.detach().cpu()
|
|
90
|
+
if value.dtype == torch.bfloat16:
|
|
91
|
+
value = value.float()
|
|
92
|
+
value = value.numpy()
|
|
90
93
|
v_minmax = -1, -1
|
|
91
94
|
if isinstance(value, np.ndarray):
|
|
92
95
|
info = "shape %s, dtype %s" % (value.shape, value.dtype)
|
|
@@ -769,3 +769,31 @@ def test_edit_distance():
|
|
|
769
769
|
a_ = Tensor("a", [batch_dim, a_spatial_dim], dtype="int64", raw_tensor=torch.tensor(a_values))
|
|
770
770
|
b_ = Tensor("b", [batch_dim, b_spatial_dim], dtype="int64", raw_tensor=torch.tensor(b_values))
|
|
771
771
|
_check_edit_distance(a_, a_spatial_dim, b_, b_spatial_dim)
|
|
772
|
+
|
|
773
|
+
|
|
774
|
+
def test_audio_log_mel_filterbank_from_raw_bfloat16():
|
|
775
|
+
time_dim = Dim(Tensor("time", [batch_dim], dtype="int32"))
|
|
776
|
+
out_dim = Dim(80, name="freq")
|
|
777
|
+
extern_data = TensorDict(
|
|
778
|
+
{
|
|
779
|
+
"data": Tensor("data", [batch_dim, time_dim], dtype="float32"),
|
|
780
|
+
}
|
|
781
|
+
)
|
|
782
|
+
|
|
783
|
+
# noinspection PyShadowingNames
|
|
784
|
+
def _forward_step(*, extern_data: TensorDict, **_kwargs):
|
|
785
|
+
audio = extern_data["data"]
|
|
786
|
+
audio = rf.cast(audio, "bfloat16")
|
|
787
|
+
out, out_spatial_dim = rf.audio.log_mel_filterbank_from_raw(audio, in_spatial_dim=time_dim, out_dim=out_dim)
|
|
788
|
+
assert out.dtype == "bfloat16"
|
|
789
|
+
out = rf.cast(out, "float32") # the test framework doesn't support bfloat16 currently due to Numpy...
|
|
790
|
+
out.mark_as_default_output(shape=(batch_dim, out_spatial_dim, out_dim))
|
|
791
|
+
|
|
792
|
+
run_model(
|
|
793
|
+
extern_data,
|
|
794
|
+
lambda **_kwargs: rf.Module(),
|
|
795
|
+
_forward_step,
|
|
796
|
+
dyn_dim_min_sizes={time_dim: 2000},
|
|
797
|
+
dyn_dim_max_sizes={time_dim: 3000},
|
|
798
|
+
test_tensorflow=False,
|
|
799
|
+
)
|
|
@@ -606,6 +606,33 @@ def test_torch_engine_train_lion_optimizer():
|
|
|
606
606
|
engine.train()
|
|
607
607
|
|
|
608
608
|
|
|
609
|
+
def test_torch_engine_bf16():
|
|
610
|
+
config = Config(
|
|
611
|
+
dict(
|
|
612
|
+
task="train",
|
|
613
|
+
device="cpu",
|
|
614
|
+
default_float_dtype="bfloat16",
|
|
615
|
+
extern_data={"data": {"dim": 9}, "classes": {"dim": 2, "sparse": True}},
|
|
616
|
+
get_model=TrainTestModel,
|
|
617
|
+
train_step=TrainTestModel.train_step,
|
|
618
|
+
batch_size=500,
|
|
619
|
+
optimizer={"class": "adam"},
|
|
620
|
+
num_epochs=1,
|
|
621
|
+
)
|
|
622
|
+
)
|
|
623
|
+
dataset = init_dataset({"class": "Task12AXDataset", "num_seqs": 10, "name": "train"})
|
|
624
|
+
dataset.init_seq_order(epoch=1)
|
|
625
|
+
|
|
626
|
+
with global_config_ctx(config):
|
|
627
|
+
engine = Engine(config=config)
|
|
628
|
+
engine.init_train_from_config(train_data=dataset)
|
|
629
|
+
engine.train()
|
|
630
|
+
params = list(engine.get_pt_model().parameters())
|
|
631
|
+
assert params
|
|
632
|
+
for p in params:
|
|
633
|
+
assert p.dtype == torch.bfloat16
|
|
634
|
+
|
|
635
|
+
|
|
609
636
|
if __name__ == "__main__":
|
|
610
637
|
better_exchook.install()
|
|
611
638
|
if len(sys.argv) <= 1:
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
{returnn-1.20241022.173306 → returnn-1.20241023.94437}/demos/demo-record-and-push-to-webserver.py
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
{returnn-1.20241022.173306 → returnn-1.20241023.94437}/demos/demo-tf-chunking-blstm.12ax.config
RENAMED
|
File without changes
|
{returnn-1.20241022.173306 → returnn-1.20241023.94437}/demos/demo-tf-contribrnn-lstm.12ax.config
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
{returnn-1.20241022.173306 → returnn-1.20241023.94437}/demos/demo-tf-maxgradnorm-lstm.12ax.config
RENAMED
|
File without changes
|
{returnn-1.20241022.173306 → returnn-1.20241023.94437}/demos/demo-tf-native-lstm-lowmem.12ax.config
RENAMED
|
File without changes
|
{returnn-1.20241022.173306 → returnn-1.20241023.94437}/demos/demo-tf-native-lstm.12ax.config
RENAMED
|
File without changes
|
{returnn-1.20241022.173306 → returnn-1.20241023.94437}/demos/demo-tf-native-lstm2.12ax.config
RENAMED
|
File without changes
|
{returnn-1.20241022.173306 → returnn-1.20241023.94437}/demos/demo-tf-native-lstm2.12ax.tuned.config
RENAMED
|
File without changes
|
{returnn-1.20241022.173306 → returnn-1.20241023.94437}/demos/demo-tf-neural-transducer.12ax.config
RENAMED
|
File without changes
|
{returnn-1.20241022.173306 → returnn-1.20241023.94437}/demos/demo-tf-rec-explicit-lstm.config
RENAMED
|
File without changes
|
{returnn-1.20241022.173306 → returnn-1.20241023.94437}/demos/demo-tf-rec-explicit-rnn.config
RENAMED
|
File without changes
|
|
File without changes
|
{returnn-1.20241022.173306 → returnn-1.20241023.94437}/demos/demo-tf-search-compiled-graph.py
RENAMED
|
File without changes
|
{returnn-1.20241022.173306 → returnn-1.20241023.94437}/demos/demo-tf-vanilla-lstm.12ax.config
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
{returnn-1.20241022.173306 → returnn-1.20241023.94437}/demos/demo-upd-mult-model.lstm.12ax.config
RENAMED
|
File without changes
|
|
File without changes
|
{returnn-1.20241022.173306 → returnn-1.20241023.94437}/demos/mdlstm/IAM/IAM_lines/a01-000u-00.png
RENAMED
|
File without changes
|
{returnn-1.20241022.173306 → returnn-1.20241023.94437}/demos/mdlstm/IAM/IAM_lines/a01-007-04.png
RENAMED
|
File without changes
|
{returnn-1.20241022.173306 → returnn-1.20241023.94437}/demos/mdlstm/IAM/IAM_lines/a01-007-06.png
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
{returnn-1.20241022.173306 → returnn-1.20241023.94437}/demos/mdlstm/IAM/create_IAM_dataset.py
RENAMED
|
File without changes
|
|
File without changes
|
{returnn-1.20241022.173306 → returnn-1.20241023.94437}/demos/mdlstm/IAM/features/raw/demo.h5
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
{returnn-1.20241022.173306 → returnn-1.20241023.94437}/demos/mdlstm/artificial/create_test_h5.py
RENAMED
|
File without changes
|
{returnn-1.20241022.173306 → returnn-1.20241023.94437}/demos/mdlstm/artificial/forwardconfig
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
{returnn-1.20241022.173306 → returnn-1.20241023.94437}/demos/mdlstm/artificial_rgb/create_test_h5.py
RENAMED
|
File without changes
|
{returnn-1.20241022.173306 → returnn-1.20241023.94437}/demos/mdlstm/artificial_rgb/forwardconfig
RENAMED
|
File without changes
|
|
File without changes
|
{returnn-1.20241022.173306 → returnn-1.20241023.94437}/demos/mdlstm/artificial_rgb/trainconfig
RENAMED
|
File without changes
|