returnn 1.20241010.171521__tar.gz → 1.20241014.140459__tar.gz
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Potentially problematic release.
This version of returnn might be problematic. Click here for more details.
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/PKG-INFO +1 -1
- returnn-1.20241014.140459/_setup_info_generated.py +2 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/tensor/_dim_extra.py +3 -3
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/tensor/tensor_dict.py +3 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/torch/engine.py +95 -111
- returnn-1.20241014.140459/returnn/torch/util/exception_helper.py +111 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/util/basic.py +22 -3
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn.egg-info/PKG-INFO +1 -1
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn.egg-info/SOURCES.txt +1 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/tests/test_TFUtil.py +9 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/tests/test_Util.py +8 -0
- returnn-1.20241010.171521/_setup_info_generated.py +0 -2
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/.editorconfig +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/.gitignore +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/.gitmodules +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/.kateconfig +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/CHANGELOG.md +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/CODEOWNERS +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/CONTRIBUTING.md +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/LICENSE +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/MANIFEST.in +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/README.rst +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/__init__.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/demos/12AX.cluster_map +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/demos/_setup_returnn_env.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/demos/demo-fwd.config +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/demos/demo-horovod-mpi.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/demos/demo-horovod-mpi.py.sh +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/demos/demo-horovod-mpi.sh +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/demos/demo-hyper-param-tuning.config +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/demos/demo-iter-dataset.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/demos/demo-list-devices.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/demos/demo-lua-torch-layer.config +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/demos/demo-pretrain.config +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/demos/demo-record-and-push-to-webserver.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/demos/demo-returnn-as-framework.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/demos/demo-rf-pt-benchmark.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/demos/demo-rf.config +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/demos/demo-rhn-enwik8.config +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/demos/demo-sprint-interface.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/demos/demo-tf-att-copy.config +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/demos/demo-tf-attention.config +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/demos/demo-tf-chunking-blstm.12ax.config +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/demos/demo-tf-contribrnn-lstm.12ax.config +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/demos/demo-tf-enc-dec.config +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/demos/demo-tf-hard-att-copy.config +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/demos/demo-tf-lstm-benchmark.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/demos/demo-tf-maxgradnorm-lstm.12ax.config +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/demos/demo-tf-native-lstm-lowmem.12ax.config +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/demos/demo-tf-native-lstm.12ax.config +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/demos/demo-tf-native-lstm2.12ax.config +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/demos/demo-tf-native-lstm2.12ax.tuned.config +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/demos/demo-tf-neural-transducer.12ax.config +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/demos/demo-tf-rec-explicit-lstm.config +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/demos/demo-tf-rec-explicit-rnn.config +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/demos/demo-tf-rec-self-att.config +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/demos/demo-tf-search-compiled-graph.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/demos/demo-tf-vanilla-lstm.12ax.config +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/demos/demo-timit-lstm-ctc.config +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/demos/demo-torch.config +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/demos/demo-upd-mult-model.lstm.12ax.config +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/demos/demo.sh +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/demos/mdlstm/IAM/IAM_lines/a01-000u-00.png +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/demos/mdlstm/IAM/IAM_lines/a01-007-04.png +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/demos/mdlstm/IAM/IAM_lines/a01-007-06.png +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/demos/mdlstm/IAM/README.txt +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/demos/mdlstm/IAM/chars.txt +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/demos/mdlstm/IAM/config_demo +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/demos/mdlstm/IAM/config_fwd +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/demos/mdlstm/IAM/config_real +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/demos/mdlstm/IAM/create_IAM_dataset.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/demos/mdlstm/IAM/decode.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/demos/mdlstm/IAM/features/raw/demo.h5 +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/demos/mdlstm/IAM/go.sh +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/demos/mdlstm/IAM/lines.txt +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/demos/mdlstm/IAM/split/eval.txt +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/demos/mdlstm/IAM/split/train.txt +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/demos/mdlstm/IAM/split/valid.txt +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/demos/mdlstm/README.md +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/demos/mdlstm/artificial/create_test_h5.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/demos/mdlstm/artificial/forwardconfig +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/demos/mdlstm/artificial/go.sh +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/demos/mdlstm/artificial/trainconfig +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/demos/mdlstm/artificial_rgb/create_test_h5.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/demos/mdlstm/artificial_rgb/forwardconfig +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/demos/mdlstm/artificial_rgb/go.sh +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/demos/mdlstm/artificial_rgb/trainconfig +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/pyproject.toml +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/requirements.txt +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/__init__.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/__main__.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/__old_mod_loader__.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/__setup__.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/config.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/datasets/__init__.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/datasets/audio.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/datasets/basic.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/datasets/bundle_file.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/datasets/cached.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/datasets/cached2.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/datasets/distrib_files.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/datasets/generating.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/datasets/hdf.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/datasets/lm.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/datasets/map.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/datasets/meta.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/datasets/multi_proc.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/datasets/normalization_data.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/datasets/numpy_dump.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/datasets/postprocessing.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/datasets/raw_wav.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/datasets/sprint.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/datasets/stereo.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/datasets/util/__init__.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/datasets/util/feature_extraction.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/datasets/util/strings.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/datasets/util/vocabulary.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/engine/__init__.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/engine/base.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/engine/batch.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/extern/WarpRna/__init__.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/extern/WarpRna/__main__.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/extern/WarpRna/warp-rna/.git +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/extern/WarpRna/warp-rna/.gitignore +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/extern/WarpRna/warp-rna/LICENSE +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/extern/WarpRna/warp-rna/README.md +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/extern/WarpRna/warp-rna/aligner.gif +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/extern/WarpRna/warp-rna/check.png +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/extern/WarpRna/warp-rna/core.cu +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/extern/WarpRna/warp-rna/core.h +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/extern/WarpRna/warp-rna/core_cpu.cpp +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/extern/WarpRna/warp-rna/pytorch_binding/LICENSE +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/extern/WarpRna/warp-rna/pytorch_binding/MANIFEST.in +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/extern/WarpRna/warp-rna/pytorch_binding/README.md +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/extern/WarpRna/warp-rna/pytorch_binding/binding.cpp +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/extern/WarpRna/warp-rna/pytorch_binding/core.cu +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/extern/WarpRna/warp-rna/pytorch_binding/core.h +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/extern/WarpRna/warp-rna/pytorch_binding/requirements.txt +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/extern/WarpRna/warp-rna/pytorch_binding/setup.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/extern/WarpRna/warp-rna/pytorch_binding/warp_rna/__init__.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/extern/WarpRna/warp-rna/pytorch_binding/warp_rna/test.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/extern/WarpRna/warp-rna/ref_rna.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/extern/WarpRna/warp-rna/tensorflow_binding/setup.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/extern/WarpRna/warp-rna/tensorflow_binding/src/warp_rna_op.cc +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/extern/WarpRna/warp-rna/tensorflow_binding/src/warp_rna_op_kernel_tmpl.h +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/extern/WarpRna/warp-rna/tensorflow_binding/warp_rna/__init__.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/extern/WarpRna/warp-rna/test.cpp +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/extern/__init__.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/extern/graph_editor/README.md +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/extern/graph_editor/__init__.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/extern/graph_editor/edit.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/extern/graph_editor/reroute.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/extern/graph_editor/select.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/extern/graph_editor/subgraph.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/extern/graph_editor/transform.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/extern/graph_editor/util.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/forward_iface.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/frontend/__init__.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/frontend/_backend.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/frontend/_native/__init__.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/frontend/_native/backend.cpp +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/frontend/_native/backend.hpp +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/frontend/_native/module.cpp +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/frontend/_native/module.hpp +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/frontend/_native/py_utils.hpp +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/frontend/_native/tensor_ops.cpp +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/frontend/_native/tensor_ops.hpp +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/frontend/_numpy_backend.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/frontend/_random_journal.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/frontend/_utils.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/frontend/array_.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/frontend/attention.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/frontend/audio/__init__.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/frontend/audio/mel.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/frontend/audio/specaugment.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/frontend/backend.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/frontend/build_from_dict.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/frontend/cond.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/frontend/const.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/frontend/container.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/frontend/control_flow_ctx.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/frontend/conv.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/frontend/conversions/__init__.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/frontend/conversions/espnet_e_branchformer.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/frontend/conversions/hf_llama.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/frontend/conversions/torch_nn.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/frontend/decoder/__init__.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/frontend/decoder/transformer.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/frontend/device.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/frontend/dims.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/frontend/dropout.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/frontend/dtype.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/frontend/encoder/__init__.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/frontend/encoder/base.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/frontend/encoder/conformer.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/frontend/encoder/e_branchformer.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/frontend/encoder/transformer.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/frontend/gradient.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/frontend/graph.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/frontend/hooks.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/frontend/init.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/frontend/label_smoothing.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/frontend/linear.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/frontend/loop.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/frontend/loss.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/frontend/math_.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/frontend/matmul.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/frontend/module.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/frontend/normalization.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/frontend/parameter.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/frontend/parametrizations.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/frontend/parametrize.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/frontend/piecewise_linear.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/frontend/rand.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/frontend/rec.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/frontend/reduce.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/frontend/run_ctx.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/frontend/signal.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/frontend/state.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/frontend/stepwise_scheduler.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/frontend/tensor_array.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/frontend/types.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/import_/__init__.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/import_/common.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/import_/git.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/import_/import_.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/learning_rate_control.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/log.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/native_op.cpp +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/native_op.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/pretrain.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/sprint/__init__.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/sprint/cache.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/sprint/control.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/sprint/error_signals.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/sprint/extern_interface.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/sprint/interface.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/tensor/README.md +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/tensor/__init__.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/tensor/_tensor_extra.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/tensor/_tensor_mixin_base.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/tensor/_tensor_op_overloads.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/tensor/control_flow_ctx.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/tensor/dim.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/tensor/marked_dim.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/tensor/tensor.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/tensor/utils.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/tf/__init__.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/tf/compat.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/tf/data_pipeline.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/tf/distributed.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/tf/engine.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/tf/frontend_layers/README.md +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/tf/frontend_layers/__init__.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/tf/frontend_layers/_backend.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/tf/frontend_layers/_utils.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/tf/frontend_layers/cond.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/tf/frontend_layers/config_entry_points.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/tf/frontend_layers/debug_eager_mode.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/tf/frontend_layers/dims.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/tf/frontend_layers/layer.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/tf/frontend_layers/loop.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/tf/frontend_layers/make_layer.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/tf/frontend_layers/masked_computation.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/tf/frontend_layers/parameter_assign.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/tf/frontend_layers/prev_tensor_ref.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/tf/frontend_low_level/__init__.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/tf/frontend_low_level/_backend.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/tf/horovod.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/tf/hyper_param_tuning.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/tf/layers/__init__.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/tf/layers/base.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/tf/layers/basic.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/tf/layers/rec.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/tf/layers/segmental_model.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/tf/layers/signal_processing.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/tf/layers/variable.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/tf/native_op.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/tf/network.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/tf/sprint.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/tf/updater.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/tf/util/__init__.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/tf/util/basic.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/tf/util/data.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/tf/util/gradient_checkpoint.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/tf/util/ken_lm.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/tf/util/open_fst.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/torch/README.md +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/torch/__init__.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/torch/data/__init__.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/torch/data/extern_data.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/torch/data/pipeline.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/torch/data/queued_data_iter.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/torch/data/returnn_dataset_wrapper.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/torch/data/tensor_utils.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/torch/distributed.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/torch/frontend/__init__.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/torch/frontend/_backend.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/torch/frontend/_rand.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/torch/frontend/bridge.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/torch/frontend/raw_ops.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/torch/updater.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/torch/util/README.md +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/torch/util/__init__.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/torch/util/array_.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/torch/util/diagnose_gpu.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/torch/util/gradient_checkpoint.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/torch/util/module.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/torch/util/scaled_gradient.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/util/__init__.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/util/better_exchook.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/util/bpe.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/util/debug.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/util/debug_helpers.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/util/file_cache.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/util/fsa.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/util/literal_py_to_pickle.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/util/math.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/util/multi_proc_non_daemonic_spawn.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/util/native_code_compiler.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/util/pprint.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/util/py-to-pickle.cpp +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/util/py_compat.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/util/py_ext_mod_compiler.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/util/result_with_reason.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/util/sig_proc.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/util/task_system.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/util/train_proc_manager.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn/util/watch_memory.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn.egg-info/dependency_links.txt +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/returnn.egg-info/top_level.txt +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/rnn.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/setup.cfg +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/setup.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/tests/DummySprintExec.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/tests/PyCharm-inspection-profile.xml +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/tests/PyCharm.idea/.gitignore +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/tests/PyCharm.idea/.name +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/tests/PyCharm.idea/codeStyleSettings.xml +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/tests/PyCharm.idea/codeStyles/Project.xml +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/tests/PyCharm.idea/codeStyles/codeStyleConfig.xml +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/tests/PyCharm.idea/inspectionProfiles/Project_Default.xml +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/tests/PyCharm.idea/inspectionProfiles/profiles_settings.xml +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/tests/PyCharm.idea/misc.xml +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/tests/PyCharm.idea/modules.xml +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/tests/PyCharm.idea/returnn.iml +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/tests/PyCharm.idea/scopes/scope_settings.xml +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/tests/_set_num_threads1.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/tests/_setup_returnn_env.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/tests/_setup_test_env.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/tests/bpe-unicode-demo.codes +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/tests/bpe-unicode-demo.vocab +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/tests/lexicon_opt.fst +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/tests/lexicon_opt.isyms +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/tests/lexicon_opt.jpg +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/tests/lexicon_opt.osyms +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/tests/lint_common.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/tests/pycharm-inspect.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/tests/pylint.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/tests/returnn-as-framework.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/tests/rf_utils.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/tests/spelling.dic +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/tests/test_Config.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/tests/test_Dataset.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/tests/test_Fsa.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/tests/test_GeneratingDataset.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/tests/test_HDFDataset.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/tests/test_LearningRateControl.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/tests/test_Log.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/tests/test_MultiProcDataset.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/tests/test_Pretrain.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/tests/test_ResNet.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/tests/test_SprintDataset.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/tests/test_SprintInterface.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/tests/test_TFEngine.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/tests/test_TFNativeOp.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/tests/test_TFNetworkLayer.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/tests/test_TFNetworkRecLayer.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/tests/test_TFNetworkSigProcLayer.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/tests/test_TFUpdater.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/tests/test_TF_determinism.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/tests/test_TaskSystem.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/tests/test_TaskSystem_SharedMem.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/tests/test_TranslationDataset.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/tests/test_demos.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/tests/test_fork_exec.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/tests/test_hdf_dump.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/tests/test_rf_array.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/tests/test_rf_attention.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/tests/test_rf_base.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/tests/test_rf_cond.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/tests/test_rf_const.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/tests/test_rf_container.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/tests/test_rf_conv.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/tests/test_rf_decoder_transformer.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/tests/test_rf_encoder_conformer.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/tests/test_rf_gradient.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/tests/test_rf_label_smoothing.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/tests/test_rf_loop.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/tests/test_rf_math.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/tests/test_rf_normalization.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/tests/test_rf_piecewise_linear.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/tests/test_rf_rec.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/tests/test_rf_reduce.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/tests/test_rf_signal.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/tests/test_tensor.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/tests/test_tools.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/tests/test_torch_dataset.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/tests/test_torch_engine.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/tests/test_torch_frontend.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/tests/test_torch_internal_frontend.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/tests/test_torch_util.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/tests/torch_utils.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/tools/_setup_returnn_env.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/tools/analyze-dataset-batches.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/tools/bliss-collect-seq-lens.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/tools/bliss-dump-text.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/tools/bliss-get-segment-names.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/tools/bliss-to-ogg-zip.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/tools/bpe-create-lexicon.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/tools/calculate-word-error-rate.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/tools/cleanup-old-models.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/tools/collect-orth-symbols.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/tools/collect-words.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/tools/compile_native_op.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/tools/compile_tf_graph.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/tools/debug-dump-search-scores.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/tools/debug-plot-search-scores.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/tools/dump-dataset-raw-strings.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/tools/dump-dataset.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/tools/dump-forward-stats.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/tools/dump-forward.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/tools/dump-network-json.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/tools/dump-pickle.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/tools/extract_state_tying_from_dataset.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/tools/get-attention-weights.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/tools/get-best-model-epoch.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/tools/hdf_dump.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/tools/hdf_dump_translation_dataset.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/tools/import-blocks-mt-model.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/tools/import-t2t-mt-model.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/tools/lattice_rescorer/.gitignore +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/tools/lattice_rescorer/Makefile +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/tools/lattice_rescorer/README.md +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/tools/lattice_rescorer/example/README.md +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/tools/lattice_rescorer/example/libs_list +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/tools/lattice_rescorer/example/network.040/i600_m600_m600.sgd_b16_lr0_cl2.newbobabs.config +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/tools/lattice_rescorer/example/network.040/i600_m600_m600.sgd_b16_lr0_cl2.newbobabs.keep_over_epoch.lstm2.config +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/tools/lattice_rescorer/example/rescore_lattice.sh +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/tools/lattice_rescorer/example/state_vars_list +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/tools/lattice_rescorer/example/tensor_names_list +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/tools/lattice_rescorer/file.h +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/tools/lattice_rescorer/htklatticerescorer.cc +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/tools/lattice_rescorer/htklatticerescorer.h +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/tools/lattice_rescorer/main.cc +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/tools/lattice_rescorer/rescorer.h +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/tools/lattice_rescorer/vocabulary.cc +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/tools/lattice_rescorer/vocabulary.h +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/tools/tf_avg_checkpoints.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/tools/tf_inspect_checkpoint.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/tools/tf_inspect_summary_log.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/tools/torch_avg_checkpoints.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/tools/torch_export_to_onnx.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/tools/torch_inspect_checkpoint.py +0 -0
- {returnn-1.20241010.171521 → returnn-1.20241014.140459}/tools/torch_inspect_checkpoint_and_opt.py +0 -0
|
@@ -29,10 +29,10 @@ class DimTypes:
|
|
|
29
29
|
"""
|
|
30
30
|
|
|
31
31
|
Unspecified = None
|
|
32
|
-
Batch = Entity("batch")
|
|
33
|
-
Spatial = Entity("spatial") # also time
|
|
32
|
+
Batch = Entity("batch", global_base=_d, global_name="Dim.Types.Batch")
|
|
33
|
+
Spatial = Entity("spatial", global_base=_d, global_name="Dim.Types.Spatial") # also time
|
|
34
34
|
Time = Spatial # we don't treat this as different
|
|
35
|
-
Feature = Entity("feature")
|
|
35
|
+
Feature = Entity("feature", global_base=_d, global_name="Dim.Types.Feature")
|
|
36
36
|
Types = (Batch, Spatial, Feature)
|
|
37
37
|
|
|
38
38
|
|
|
@@ -12,6 +12,7 @@ import time
|
|
|
12
12
|
import socket
|
|
13
13
|
import fnmatch
|
|
14
14
|
import re
|
|
15
|
+
import math
|
|
15
16
|
|
|
16
17
|
import torch
|
|
17
18
|
import torch.distributed
|
|
@@ -19,7 +20,7 @@ from torch.nn.parallel import DistributedDataParallel
|
|
|
19
20
|
from torch.utils.data import DataLoader
|
|
20
21
|
from torch import autocast
|
|
21
22
|
from torch.cuda import amp
|
|
22
|
-
import
|
|
23
|
+
import numpy as np
|
|
23
24
|
|
|
24
25
|
import returnn
|
|
25
26
|
from returnn.config import Config
|
|
@@ -43,6 +44,7 @@ from .data.queued_data_iter import QueuedDataIter
|
|
|
43
44
|
from .frontend.bridge import rf_module_to_pt_module
|
|
44
45
|
from .util import diagnose_gpu
|
|
45
46
|
from .util import module as util_module
|
|
47
|
+
from .util.exception_helper import help_on_torch_exception
|
|
46
48
|
from .distributed import DistributedContext, get_ctx as dist_get_ctx
|
|
47
49
|
|
|
48
50
|
|
|
@@ -125,6 +127,7 @@ class Engine(EngineBase):
|
|
|
125
127
|
self._calculate_exp_loss = config.bool("calculate_exp_loss", False)
|
|
126
128
|
self._reset_dev_memory_caches = config.bool("reset_dev_memory_caches", False)
|
|
127
129
|
self._forward_auto_split_batch_on_oom = config.bool("forward_auto_split_batch_on_oom", False)
|
|
130
|
+
self._stop_on_nonfinite_train_score = config.bool("stop_on_nonfinite_train_score", True)
|
|
128
131
|
|
|
129
132
|
amp_options = self.config.opt_typed_value("torch_amp")
|
|
130
133
|
grad_scaler_opts = self.config.typed_value("grad_scaler", NotSpecified)
|
|
@@ -237,44 +240,10 @@ class Engine(EngineBase):
|
|
|
237
240
|
self._epoch_mp_shared.value = self.epoch
|
|
238
241
|
|
|
239
242
|
self.init_train_epoch()
|
|
240
|
-
|
|
241
|
-
self.train_epoch()
|
|
242
|
-
except Exception as exc:
|
|
243
|
-
self._handle_run_exception(exc)
|
|
244
|
-
raise
|
|
243
|
+
self.train_epoch()
|
|
245
244
|
|
|
246
245
|
print(f"Finished training at epoch {self.epoch}, global train step {self.global_train_step}", file=log.v3)
|
|
247
246
|
|
|
248
|
-
def _handle_run_exception(self, exc: Exception, *, always_direct_print: bool = False):
|
|
249
|
-
from returnn.util.better_exchook import get_func_from_code_object, iter_traceback
|
|
250
|
-
|
|
251
|
-
print(f"{type(exc).__name__}: {exc}", file=log.v1)
|
|
252
|
-
|
|
253
|
-
# Extend exception message by module call stack.
|
|
254
|
-
module_names_by_id = {} # id -> name
|
|
255
|
-
for name, mod in self._orig_model.named_modules():
|
|
256
|
-
if id(mod) not in module_names_by_id:
|
|
257
|
-
module_names_by_id[id(mod)] = name or "(root)"
|
|
258
|
-
exc_ext = []
|
|
259
|
-
for frame in iter_traceback(exc.__traceback__):
|
|
260
|
-
if frame.f_code.co_nlocals == 0:
|
|
261
|
-
continue
|
|
262
|
-
frame_self = frame.f_locals.get("self")
|
|
263
|
-
if isinstance(frame_self, (torch.nn.Module, rf.Module)):
|
|
264
|
-
func = get_func_from_code_object(frame.f_code, frame=frame)
|
|
265
|
-
if func and func.__name__ and func.__name__.startswith("_") and not func.__name__.startswith("__"):
|
|
266
|
-
continue
|
|
267
|
-
func_name = (func and func.__qualname__) or type(frame_self).__name__
|
|
268
|
-
exc_ext.append(f"({func_name}) {module_names_by_id.get(id(frame_self), '(unknown)')}")
|
|
269
|
-
if not exc_ext:
|
|
270
|
-
exc_ext.append("(No module call frames.)")
|
|
271
|
-
if len(exc.args) == 1 and isinstance(exc.args[0], str) and not always_direct_print:
|
|
272
|
-
exc.args = ("\n".join([exc.args[0], "", "Module call stack:"] + exc_ext),)
|
|
273
|
-
else:
|
|
274
|
-
print("Module call stack:", file=log.v3)
|
|
275
|
-
for msg in exc_ext:
|
|
276
|
-
print(msg, file=log.v3)
|
|
277
|
-
|
|
278
247
|
def init_train_epoch(self):
|
|
279
248
|
"""
|
|
280
249
|
init train (sub)epoch. LR etc
|
|
@@ -369,88 +338,103 @@ class Engine(EngineBase):
|
|
|
369
338
|
|
|
370
339
|
zero_grad_next_step = True
|
|
371
340
|
cur_count_grad_accum = 0
|
|
372
|
-
|
|
373
|
-
|
|
374
|
-
|
|
341
|
+
extern_data = None
|
|
342
|
+
try:
|
|
343
|
+
while True:
|
|
344
|
+
with torch.no_grad():
|
|
345
|
+
extern_data_raw = next(data_iter, None)
|
|
375
346
|
|
|
376
|
-
|
|
347
|
+
step_begin_time = time.time()
|
|
377
348
|
|
|
378
|
-
|
|
379
|
-
|
|
380
|
-
|
|
381
|
-
|
|
382
|
-
|
|
383
|
-
|
|
384
|
-
|
|
349
|
+
_has_data = torch.tensor([extern_data_raw is not None], dtype=torch.int8)
|
|
350
|
+
if self._torch_distributed_ctx:
|
|
351
|
+
# use all reduce to check if all workers have data, if at least one worker does not have data,
|
|
352
|
+
# all workers finish this epoch
|
|
353
|
+
torch.distributed.all_reduce(_has_data, op=torch.distributed.ReduceOp.MIN)
|
|
354
|
+
if not _has_data[0]:
|
|
355
|
+
break
|
|
385
356
|
|
|
386
|
-
|
|
387
|
-
|
|
388
|
-
|
|
389
|
-
|
|
357
|
+
# clear the gradients when every gradient accumulation loop starts
|
|
358
|
+
if zero_grad_next_step:
|
|
359
|
+
self._updater.get_optimizer().zero_grad()
|
|
360
|
+
cur_count_grad_accum = 0
|
|
390
361
|
|
|
391
|
-
|
|
392
|
-
|
|
393
|
-
|
|
394
|
-
|
|
395
|
-
|
|
396
|
-
|
|
397
|
-
|
|
398
|
-
|
|
399
|
-
|
|
400
|
-
|
|
401
|
-
|
|
402
|
-
|
|
403
|
-
|
|
362
|
+
extern_data = extern_data_util.raw_dict_to_extern_data(
|
|
363
|
+
extern_data_raw, extern_data_template=self.extern_data, device=self._device
|
|
364
|
+
)
|
|
365
|
+
self._run_step(extern_data, train_flag=True, train_func=True)
|
|
366
|
+
|
|
367
|
+
train_ctx = rf.get_run_ctx()
|
|
368
|
+
total_loss = train_ctx.total_loss()
|
|
369
|
+
losses_dict = NumbersDict(
|
|
370
|
+
{
|
|
371
|
+
name: (
|
|
372
|
+
float(loss.get_summed_loss().raw_tensor.detach().cpu().numpy())
|
|
373
|
+
if self._device != "meta"
|
|
374
|
+
else float("nan")
|
|
375
|
+
)
|
|
376
|
+
for name, loss in train_ctx.losses.items()
|
|
377
|
+
}
|
|
378
|
+
)
|
|
379
|
+
inv_norm_factors_dict = NumbersDict(
|
|
380
|
+
{name: float(_to_raw(loss.get_inv_norm_factor())) for name, loss in train_ctx.losses.items()}
|
|
381
|
+
)
|
|
382
|
+
|
|
383
|
+
if accum_grad_multiple_step_dyn:
|
|
384
|
+
accum_grad_multiple_step = accum_grad_multiple_step_dyn(
|
|
385
|
+
epoch=self.epoch, global_train_step=self.global_train_step
|
|
404
386
|
)
|
|
405
|
-
|
|
406
|
-
|
|
407
|
-
|
|
408
|
-
|
|
409
|
-
|
|
410
|
-
|
|
387
|
+
cur_count_grad_accum += 1
|
|
388
|
+
perform_update_step = cur_count_grad_accum >= accum_grad_multiple_step
|
|
389
|
+
with (
|
|
390
|
+
self._ddp_pt_model.no_sync()
|
|
391
|
+
if (self._ddp_pt_model is not None and not perform_update_step)
|
|
392
|
+
else nullcontext()
|
|
393
|
+
):
|
|
394
|
+
if self._grad_scaler is not None:
|
|
395
|
+
self._grad_scaler.scale(total_loss.raw_tensor).backward()
|
|
396
|
+
else:
|
|
397
|
+
total_loss.raw_tensor.backward()
|
|
411
398
|
|
|
412
|
-
|
|
413
|
-
|
|
414
|
-
|
|
415
|
-
|
|
416
|
-
cur_count_grad_accum += 1
|
|
417
|
-
perform_update_step = cur_count_grad_accum >= accum_grad_multiple_step
|
|
418
|
-
with (
|
|
419
|
-
self._ddp_pt_model.no_sync()
|
|
420
|
-
if (self._ddp_pt_model is not None and not perform_update_step)
|
|
421
|
-
else nullcontext()
|
|
422
|
-
):
|
|
423
|
-
if self._grad_scaler is not None:
|
|
424
|
-
self._grad_scaler.scale(total_loss.raw_tensor).backward()
|
|
425
|
-
else:
|
|
426
|
-
total_loss.raw_tensor.backward()
|
|
399
|
+
# only update the weights when every gradient accumulation loop ends
|
|
400
|
+
if perform_update_step:
|
|
401
|
+
self._updater.step(grad_scaler=self._grad_scaler)
|
|
402
|
+
zero_grad_next_step = perform_update_step
|
|
427
403
|
|
|
428
|
-
|
|
429
|
-
|
|
430
|
-
self._updater.step(grad_scaler=self._grad_scaler)
|
|
431
|
-
zero_grad_next_step = perform_update_step
|
|
404
|
+
if self._torch_distributed_ctx:
|
|
405
|
+
self._torch_distributed_ctx.step_after_param_update(module=self._pt_model, epoch_step_idx=step_idx)
|
|
432
406
|
|
|
433
|
-
|
|
434
|
-
|
|
435
|
-
|
|
436
|
-
step_duration = time.time() - step_begin_time
|
|
437
|
-
elapsed_computation_time += step_duration
|
|
438
|
-
|
|
439
|
-
accumulated_losses_dict += losses_dict
|
|
440
|
-
accumulated_inv_norm_factors_dict += inv_norm_factors_dict
|
|
441
|
-
eval_info = self._maybe_extend_losses_info(losses_dict / inv_norm_factors_dict)
|
|
442
|
-
_print_process(
|
|
443
|
-
f"ep {self.epoch} train",
|
|
444
|
-
step=step_idx,
|
|
445
|
-
eval_info=dict(eval_info),
|
|
446
|
-
step_duration=step_duration,
|
|
447
|
-
batch_size_info=_get_batch_size_info(extern_data) if self._log_batch_size else None,
|
|
448
|
-
log_memory_usage_device=self._device if self._log_memory_usage else None,
|
|
449
|
-
)
|
|
407
|
+
step_duration = time.time() - step_begin_time
|
|
408
|
+
elapsed_computation_time += step_duration
|
|
450
409
|
|
|
451
|
-
|
|
452
|
-
|
|
453
|
-
|
|
410
|
+
accumulated_losses_dict += losses_dict
|
|
411
|
+
accumulated_inv_norm_factors_dict += inv_norm_factors_dict
|
|
412
|
+
eval_info = self._maybe_extend_losses_info(losses_dict / inv_norm_factors_dict)
|
|
413
|
+
_print_process(
|
|
414
|
+
f"ep {self.epoch} train",
|
|
415
|
+
step=step_idx,
|
|
416
|
+
eval_info=dict(eval_info),
|
|
417
|
+
step_duration=step_duration,
|
|
418
|
+
batch_size_info=_get_batch_size_info(extern_data) if self._log_batch_size else None,
|
|
419
|
+
log_memory_usage_device=self._device if self._log_memory_usage else None,
|
|
420
|
+
)
|
|
421
|
+
|
|
422
|
+
if self._stop_on_nonfinite_train_score:
|
|
423
|
+
if any(np.isinf(v) or np.isnan(v) for v in accumulated_losses_dict.values()):
|
|
424
|
+
print("Model seems broken, got inf or nan score.", file=log.v1)
|
|
425
|
+
print(
|
|
426
|
+
"Accumulated scores:",
|
|
427
|
+
accumulated_losses_dict / accumulated_inv_norm_factors_dict,
|
|
428
|
+
file=log.v1,
|
|
429
|
+
)
|
|
430
|
+
raise Exception(f"Inf/nan score in step {step_idx}.")
|
|
431
|
+
|
|
432
|
+
step_idx += 1
|
|
433
|
+
self.global_train_step += 1
|
|
434
|
+
self._updater.set_current_train_step(global_train_step=self.global_train_step, epoch=self.epoch)
|
|
435
|
+
except Exception as exc:
|
|
436
|
+
help_on_torch_exception(exc, step_idx=step_idx, model=self._orig_model, extern_data=extern_data)
|
|
437
|
+
raise
|
|
454
438
|
|
|
455
439
|
elapsed = time.time() - epoch_start_time
|
|
456
440
|
elapsed_computation_percentage = elapsed_computation_time / elapsed
|
|
@@ -1118,13 +1102,13 @@ class Engine(EngineBase):
|
|
|
1118
1102
|
and self._forward_auto_split_batch_on_oom
|
|
1119
1103
|
and extern_data_util.raw_dict_can_split_batch(extern_data_raw)
|
|
1120
1104
|
):
|
|
1121
|
-
|
|
1105
|
+
help_on_torch_exception(exc, model=self._orig_model, always_direct_print=True)
|
|
1122
1106
|
util.traceback_clear_frames(exc.__traceback__)
|
|
1123
1107
|
diagnose_gpu.garbage_collect()
|
|
1124
1108
|
print(f"{report_prefix}, split step {step_idx} batch and try again...", file=log.v3)
|
|
1125
1109
|
data_loader.extend(extern_data_util.raw_dict_split_batch(extern_data_raw, splits=2))
|
|
1126
1110
|
continue
|
|
1127
|
-
self.
|
|
1111
|
+
help_on_torch_exception(exc, model=self._orig_model)
|
|
1128
1112
|
raise
|
|
1129
1113
|
ctx = rf.get_run_ctx()
|
|
1130
1114
|
ctx.check_outputs_complete()
|
|
@@ -0,0 +1,111 @@
|
|
|
1
|
+
"""
|
|
2
|
+
Helper for any type of PyTorch exceptions
|
|
3
|
+
"""
|
|
4
|
+
|
|
5
|
+
from __future__ import annotations
|
|
6
|
+
|
|
7
|
+
from typing import Optional, Union, Tuple
|
|
8
|
+
|
|
9
|
+
import torch
|
|
10
|
+
import numpy as np
|
|
11
|
+
|
|
12
|
+
from returnn.log import log
|
|
13
|
+
import returnn.frontend as rf
|
|
14
|
+
from returnn.tensor import TensorDict
|
|
15
|
+
|
|
16
|
+
|
|
17
|
+
def help_on_torch_exception(
|
|
18
|
+
exc: Exception,
|
|
19
|
+
*,
|
|
20
|
+
step_idx: Optional[int] = None,
|
|
21
|
+
extern_data: Optional[TensorDict] = None,
|
|
22
|
+
model: Union[rf.Module, torch.nn.Module],
|
|
23
|
+
always_direct_print: bool = False,
|
|
24
|
+
):
|
|
25
|
+
"""
|
|
26
|
+
Gather some information which might be helpful for debugging a PyTorch exception.
|
|
27
|
+
"""
|
|
28
|
+
from returnn.util.better_exchook import get_func_from_code_object, iter_traceback
|
|
29
|
+
|
|
30
|
+
print(f"{type(exc).__name__}: {exc}", file=log.v1)
|
|
31
|
+
|
|
32
|
+
exc_ext = [f"Step idx: {step_idx}"]
|
|
33
|
+
if extern_data:
|
|
34
|
+
exc_ext.append("Extern data:")
|
|
35
|
+
if "seq_tag" in extern_data:
|
|
36
|
+
exc_ext.append(f" Seq tags: {extern_data['seq_tag'].raw_tensor}")
|
|
37
|
+
covered_dim_tags = set()
|
|
38
|
+
for data_key, data in extern_data.data.items():
|
|
39
|
+
info, v_minmax = _help_data_or_array(data.raw_tensor)
|
|
40
|
+
exc_ext.append(f" {data_key}: {info}, {data}")
|
|
41
|
+
if data.sparse:
|
|
42
|
+
if v_minmax[0] < 0 or v_minmax[1] >= data.dim:
|
|
43
|
+
exc_ext.append(f" WARNING, invalid label for data sparse dim {data.sparse_dim}")
|
|
44
|
+
for dim in data.dims:
|
|
45
|
+
if dim in covered_dim_tags:
|
|
46
|
+
continue
|
|
47
|
+
covered_dim_tags.add(dim)
|
|
48
|
+
if not dim.dyn_size_ext:
|
|
49
|
+
continue
|
|
50
|
+
info, _ = _help_data_or_array(dim.dyn_size_ext.raw_tensor)
|
|
51
|
+
exc_ext.append(f" dim {dim.short_repr()} size: {info}")
|
|
52
|
+
|
|
53
|
+
# Extend exception message by module call stack.
|
|
54
|
+
exc_ext.append("Module call stack:")
|
|
55
|
+
module_names_by_id = {} # id -> name
|
|
56
|
+
count_frames = 0
|
|
57
|
+
for name, mod in model.named_modules():
|
|
58
|
+
if id(mod) not in module_names_by_id:
|
|
59
|
+
module_names_by_id[id(mod)] = name or "(root)"
|
|
60
|
+
for frame in iter_traceback(exc.__traceback__):
|
|
61
|
+
if frame.f_code.co_nlocals == 0:
|
|
62
|
+
continue
|
|
63
|
+
frame_self = frame.f_locals.get("self")
|
|
64
|
+
if isinstance(frame_self, (torch.nn.Module, rf.Module)):
|
|
65
|
+
func = get_func_from_code_object(frame.f_code, frame=frame)
|
|
66
|
+
if func and func.__name__ and func.__name__.startswith("_") and not func.__name__.startswith("__"):
|
|
67
|
+
continue
|
|
68
|
+
func_name = (func and func.__qualname__) or type(frame_self).__name__
|
|
69
|
+
exc_ext.append(f"({func_name}) {module_names_by_id.get(id(frame_self), '(unknown)')}")
|
|
70
|
+
count_frames += 1
|
|
71
|
+
if not count_frames:
|
|
72
|
+
exc_ext.append("(No module call frames.)")
|
|
73
|
+
|
|
74
|
+
if len(exc.args) == 1 and isinstance(exc.args[0], str) and not always_direct_print:
|
|
75
|
+
exc.args = ("\n".join([exc.args[0], ""] + exc_ext),)
|
|
76
|
+
else:
|
|
77
|
+
for msg in exc_ext:
|
|
78
|
+
print(msg, file=log.v3)
|
|
79
|
+
|
|
80
|
+
|
|
81
|
+
def _help_data_or_array(
|
|
82
|
+
value: Union[torch.Tensor, np.ndarray, bool, object]
|
|
83
|
+
) -> Tuple[str, Tuple[Union[int, float], Union[int, float]]]:
|
|
84
|
+
"""
|
|
85
|
+
:param value:
|
|
86
|
+
:return: (info,(min,max))
|
|
87
|
+
"""
|
|
88
|
+
if isinstance(value, torch.Tensor):
|
|
89
|
+
value = value.detach().cpu().numpy()
|
|
90
|
+
v_minmax = -1, -1
|
|
91
|
+
if isinstance(value, np.ndarray):
|
|
92
|
+
info = "shape %s, dtype %s" % (value.shape, value.dtype)
|
|
93
|
+
if value.dtype.kind in "biuf":
|
|
94
|
+
if value.size > 1:
|
|
95
|
+
v_minmax = np.min(value), np.max(value)
|
|
96
|
+
info += ", min/max %s/%s" % v_minmax
|
|
97
|
+
if value.dtype.kind == "f":
|
|
98
|
+
info += ", mean/stddev %s/%s" % (np.mean(value), np.std(value))
|
|
99
|
+
if value.ndim <= 1:
|
|
100
|
+
info += " (%s)" % np.array2string(value)
|
|
101
|
+
elif value.size == 1:
|
|
102
|
+
info += " (%s)" % np.array2string(value)
|
|
103
|
+
else:
|
|
104
|
+
info += ", EMPTY"
|
|
105
|
+
elif isinstance(value, (np.floating, np.integer, np.bool_, float, int, bool, str, bytes)):
|
|
106
|
+
info = "%s(%s)" % (type(value).__name__, value)
|
|
107
|
+
elif value is None:
|
|
108
|
+
info = "None"
|
|
109
|
+
else:
|
|
110
|
+
info = "type %r" % type(value)
|
|
111
|
+
return info, v_minmax
|
|
@@ -83,19 +83,38 @@ class Entity:
|
|
|
83
83
|
This is more efficient than using just the string directly in an enum.
|
|
84
84
|
"""
|
|
85
85
|
|
|
86
|
-
def __init__(
|
|
86
|
+
def __init__(
|
|
87
|
+
self, name: Optional[str] = None, *, global_base: Optional[Any] = None, global_name: Optional[str] = None
|
|
88
|
+
):
|
|
87
89
|
"""
|
|
88
90
|
:param str|None name:
|
|
89
91
|
"""
|
|
90
92
|
self.name = name
|
|
93
|
+
if global_name and not global_base:
|
|
94
|
+
frame = try_get_stack_frame(1)
|
|
95
|
+
global_base = sys.modules[frame.f_globals["__name__"]]
|
|
96
|
+
self.global_base = global_base
|
|
97
|
+
self.global_name = global_name
|
|
91
98
|
|
|
92
99
|
def __str__(self):
|
|
93
|
-
return self.name
|
|
100
|
+
return self.name or self.global_name or "<unnamed Entity>"
|
|
94
101
|
|
|
95
102
|
def __repr__(self):
|
|
96
|
-
return "<%s>" % self.name
|
|
103
|
+
return "<%s Entity>" % (self.name or self.global_name or "unnamed")
|
|
104
|
+
|
|
105
|
+
def __reduce__(self):
|
|
106
|
+
if self.global_name:
|
|
107
|
+
# Sanity check that the global ref is correct.
|
|
108
|
+
attrs = self.global_name.split(".")
|
|
109
|
+
assert attr_chain(self.global_base, attrs) is self
|
|
110
|
+
parent = attr_chain(self.global_base, attrs[:-1])
|
|
111
|
+
assert getattr(parent, attrs[-1]) is self
|
|
112
|
+
return getattr, (parent, attrs[-1])
|
|
113
|
+
raise Exception("Cannot pickle Entity object. (%r)" % self)
|
|
97
114
|
|
|
98
115
|
def __getstate__(self):
|
|
116
|
+
if self.global_name:
|
|
117
|
+
raise Exception("We expect that __reduce__ is used, not __getstate__.")
|
|
99
118
|
raise Exception("Cannot pickle Entity object. (%r)" % self)
|
|
100
119
|
|
|
101
120
|
|
|
@@ -302,6 +302,7 @@ returnn/torch/util/README.md
|
|
|
302
302
|
returnn/torch/util/__init__.py
|
|
303
303
|
returnn/torch/util/array_.py
|
|
304
304
|
returnn/torch/util/diagnose_gpu.py
|
|
305
|
+
returnn/torch/util/exception_helper.py
|
|
305
306
|
returnn/torch/util/gradient_checkpoint.py
|
|
306
307
|
returnn/torch/util/module.py
|
|
307
308
|
returnn/torch/util/scaled_gradient.py
|
|
@@ -1554,6 +1554,15 @@ def test_Dim_pickle():
|
|
|
1554
1554
|
assert single_step_dim_copy == single_step_dim
|
|
1555
1555
|
|
|
1556
1556
|
|
|
1557
|
+
def test_DimType_pickle():
|
|
1558
|
+
from returnn.tensor import Dim
|
|
1559
|
+
import pickle
|
|
1560
|
+
|
|
1561
|
+
a = Dim.Types.Spatial
|
|
1562
|
+
a_copy = pickle.loads(pickle.dumps(a))
|
|
1563
|
+
assert a is a_copy
|
|
1564
|
+
|
|
1565
|
+
|
|
1557
1566
|
def test_Dim_sorted():
|
|
1558
1567
|
from returnn.util.basic import obj_diff_str
|
|
1559
1568
|
|
|
@@ -369,6 +369,14 @@ def test_deepcopy_builtins():
|
|
|
369
369
|
assert o["__builtins__"] is user_ns["__builtins__"] # no copy, directly reference this module dict
|
|
370
370
|
|
|
371
371
|
|
|
372
|
+
_demo_entity = Entity("demo entity", global_name="_demo_entity")
|
|
373
|
+
|
|
374
|
+
|
|
375
|
+
def test_deepcopy_Entity():
|
|
376
|
+
entity_copy = deepcopy(_demo_entity)
|
|
377
|
+
assert entity_copy is _demo_entity # no copy, directly reference this entity
|
|
378
|
+
|
|
379
|
+
|
|
372
380
|
def test_get_func_kwargs():
|
|
373
381
|
def dummy_func(net, var, update_ops):
|
|
374
382
|
pass
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
{returnn-1.20241010.171521 → returnn-1.20241014.140459}/demos/demo-hyper-param-tuning.config
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
{returnn-1.20241010.171521 → returnn-1.20241014.140459}/demos/demo-record-and-push-to-webserver.py
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
{returnn-1.20241010.171521 → returnn-1.20241014.140459}/demos/demo-tf-chunking-blstm.12ax.config
RENAMED
|
File without changes
|
{returnn-1.20241010.171521 → returnn-1.20241014.140459}/demos/demo-tf-contribrnn-lstm.12ax.config
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
{returnn-1.20241010.171521 → returnn-1.20241014.140459}/demos/demo-tf-maxgradnorm-lstm.12ax.config
RENAMED
|
File without changes
|
{returnn-1.20241010.171521 → returnn-1.20241014.140459}/demos/demo-tf-native-lstm-lowmem.12ax.config
RENAMED
|
File without changes
|
{returnn-1.20241010.171521 → returnn-1.20241014.140459}/demos/demo-tf-native-lstm.12ax.config
RENAMED
|
File without changes
|
{returnn-1.20241010.171521 → returnn-1.20241014.140459}/demos/demo-tf-native-lstm2.12ax.config
RENAMED
|
File without changes
|
{returnn-1.20241010.171521 → returnn-1.20241014.140459}/demos/demo-tf-native-lstm2.12ax.tuned.config
RENAMED
|
File without changes
|
{returnn-1.20241010.171521 → returnn-1.20241014.140459}/demos/demo-tf-neural-transducer.12ax.config
RENAMED
|
File without changes
|
{returnn-1.20241010.171521 → returnn-1.20241014.140459}/demos/demo-tf-rec-explicit-lstm.config
RENAMED
|
File without changes
|
{returnn-1.20241010.171521 → returnn-1.20241014.140459}/demos/demo-tf-rec-explicit-rnn.config
RENAMED
|
File without changes
|
|
File without changes
|
{returnn-1.20241010.171521 → returnn-1.20241014.140459}/demos/demo-tf-search-compiled-graph.py
RENAMED
|
File without changes
|
{returnn-1.20241010.171521 → returnn-1.20241014.140459}/demos/demo-tf-vanilla-lstm.12ax.config
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|