returnn 1.20250204.4017__tar.gz → 1.20250206.144022__tar.gz
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Potentially problematic release.
This version of returnn might be problematic. Click here for more details.
- {returnn-1.20250204.4017/returnn.egg-info → returnn-1.20250206.144022}/PKG-INFO +1 -1
- returnn-1.20250206.144022/_setup_info_generated.py +2 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/datasets/util/vocabulary.py +2 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/frontend/encoder/transformer.py +19 -11
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/tensor/tensor_dict.py +1 -1
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/torch/engine.py +24 -1
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/torch/util/debug_inf_nan.py +37 -5
- {returnn-1.20250204.4017 → returnn-1.20250206.144022/returnn.egg-info}/PKG-INFO +1 -1
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/tests/rf_utils.py +43 -2
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/tests/test_rf_array.py +28 -1
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/tests/test_torch_util.py +2 -2
- returnn-1.20250204.4017/_setup_info_generated.py +0 -2
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/.editorconfig +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/.gitignore +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/.gitmodules +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/.kateconfig +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/CHANGELOG.md +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/CODEOWNERS +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/CONTRIBUTING.md +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/LICENSE +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/MANIFEST.in +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/README.rst +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/__init__.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/demos/12AX.cluster_map +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/demos/_setup_returnn_env.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/demos/demo-fwd.config +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/demos/demo-horovod-mpi.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/demos/demo-horovod-mpi.py.sh +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/demos/demo-horovod-mpi.sh +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/demos/demo-hyper-param-tuning.config +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/demos/demo-iter-dataset.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/demos/demo-list-devices.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/demos/demo-lua-torch-layer.config +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/demos/demo-pretrain.config +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/demos/demo-record-and-push-to-webserver.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/demos/demo-returnn-as-framework.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/demos/demo-rf-pt-benchmark.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/demos/demo-rf.config +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/demos/demo-rhn-enwik8.config +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/demos/demo-sprint-interface.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/demos/demo-tf-att-copy.config +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/demos/demo-tf-attention.config +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/demos/demo-tf-chunking-blstm.12ax.config +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/demos/demo-tf-contribrnn-lstm.12ax.config +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/demos/demo-tf-enc-dec.config +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/demos/demo-tf-hard-att-copy.config +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/demos/demo-tf-lstm-benchmark.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/demos/demo-tf-maxgradnorm-lstm.12ax.config +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/demos/demo-tf-native-lstm-lowmem.12ax.config +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/demos/demo-tf-native-lstm.12ax.config +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/demos/demo-tf-native-lstm2.12ax.config +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/demos/demo-tf-native-lstm2.12ax.tuned.config +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/demos/demo-tf-neural-transducer.12ax.config +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/demos/demo-tf-rec-explicit-lstm.config +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/demos/demo-tf-rec-explicit-rnn.config +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/demos/demo-tf-rec-self-att.config +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/demos/demo-tf-search-compiled-graph.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/demos/demo-tf-vanilla-lstm.12ax.config +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/demos/demo-timit-lstm-ctc.config +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/demos/demo-torch.config +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/demos/demo-upd-mult-model.lstm.12ax.config +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/demos/demo.sh +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/demos/mdlstm/IAM/IAM_lines/a01-000u-00.png +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/demos/mdlstm/IAM/IAM_lines/a01-007-04.png +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/demos/mdlstm/IAM/IAM_lines/a01-007-06.png +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/demos/mdlstm/IAM/README.txt +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/demos/mdlstm/IAM/chars.txt +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/demos/mdlstm/IAM/config_demo +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/demos/mdlstm/IAM/config_fwd +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/demos/mdlstm/IAM/config_real +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/demos/mdlstm/IAM/create_IAM_dataset.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/demos/mdlstm/IAM/decode.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/demos/mdlstm/IAM/features/raw/demo.h5 +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/demos/mdlstm/IAM/go.sh +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/demos/mdlstm/IAM/lines.txt +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/demos/mdlstm/IAM/split/eval.txt +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/demos/mdlstm/IAM/split/train.txt +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/demos/mdlstm/IAM/split/valid.txt +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/demos/mdlstm/README.md +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/demos/mdlstm/artificial/create_test_h5.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/demos/mdlstm/artificial/forwardconfig +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/demos/mdlstm/artificial/go.sh +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/demos/mdlstm/artificial/trainconfig +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/demos/mdlstm/artificial_rgb/create_test_h5.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/demos/mdlstm/artificial_rgb/forwardconfig +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/demos/mdlstm/artificial_rgb/go.sh +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/demos/mdlstm/artificial_rgb/trainconfig +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/pyproject.toml +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/requirements.txt +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/__init__.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/__main__.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/__old_mod_loader__.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/__setup__.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/config.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/datasets/__init__.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/datasets/audio.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/datasets/basic.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/datasets/bundle_file.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/datasets/cached.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/datasets/cached2.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/datasets/distrib_files.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/datasets/generating.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/datasets/hdf.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/datasets/lm.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/datasets/map.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/datasets/meta.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/datasets/multi_proc.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/datasets/normalization_data.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/datasets/numpy_dump.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/datasets/postprocessing.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/datasets/raw_wav.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/datasets/sprint.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/datasets/stereo.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/datasets/text_dict.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/datasets/util/__init__.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/datasets/util/feature_extraction.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/datasets/util/strings.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/engine/__init__.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/engine/base.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/engine/batch.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/extern/WarpRna/__init__.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/extern/WarpRna/__main__.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/extern/WarpRna/warp-rna/.git +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/extern/WarpRna/warp-rna/.gitignore +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/extern/WarpRna/warp-rna/LICENSE +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/extern/WarpRna/warp-rna/README.md +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/extern/WarpRna/warp-rna/aligner.gif +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/extern/WarpRna/warp-rna/check.png +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/extern/WarpRna/warp-rna/core.cu +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/extern/WarpRna/warp-rna/core.h +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/extern/WarpRna/warp-rna/core_cpu.cpp +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/extern/WarpRna/warp-rna/pytorch_binding/LICENSE +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/extern/WarpRna/warp-rna/pytorch_binding/MANIFEST.in +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/extern/WarpRna/warp-rna/pytorch_binding/README.md +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/extern/WarpRna/warp-rna/pytorch_binding/binding.cpp +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/extern/WarpRna/warp-rna/pytorch_binding/core.cu +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/extern/WarpRna/warp-rna/pytorch_binding/core.h +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/extern/WarpRna/warp-rna/pytorch_binding/requirements.txt +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/extern/WarpRna/warp-rna/pytorch_binding/setup.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/extern/WarpRna/warp-rna/pytorch_binding/warp_rna/__init__.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/extern/WarpRna/warp-rna/pytorch_binding/warp_rna/test.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/extern/WarpRna/warp-rna/ref_rna.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/extern/WarpRna/warp-rna/tensorflow_binding/setup.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/extern/WarpRna/warp-rna/tensorflow_binding/src/warp_rna_op.cc +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/extern/WarpRna/warp-rna/tensorflow_binding/src/warp_rna_op_kernel_tmpl.h +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/extern/WarpRna/warp-rna/tensorflow_binding/warp_rna/__init__.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/extern/WarpRna/warp-rna/test.cpp +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/extern/__init__.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/extern/graph_editor/README.md +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/extern/graph_editor/__init__.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/extern/graph_editor/edit.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/extern/graph_editor/reroute.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/extern/graph_editor/select.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/extern/graph_editor/subgraph.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/extern/graph_editor/transform.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/extern/graph_editor/util.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/forward_iface.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/frontend/__init__.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/frontend/_backend.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/frontend/_cache.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/frontend/_native/__init__.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/frontend/_native/backend.cpp +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/frontend/_native/backend.hpp +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/frontend/_native/module.cpp +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/frontend/_native/module.hpp +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/frontend/_native/py_utils.hpp +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/frontend/_native/tensor_ops.cpp +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/frontend/_native/tensor_ops.hpp +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/frontend/_numpy_backend.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/frontend/_random_journal.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/frontend/_utils.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/frontend/array_.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/frontend/attention.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/frontend/audio/__init__.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/frontend/audio/mel.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/frontend/audio/specaugment.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/frontend/backend.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/frontend/build_from_dict.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/frontend/cond.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/frontend/const.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/frontend/container.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/frontend/control_flow_ctx.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/frontend/conv.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/frontend/conversions/__init__.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/frontend/conversions/espnet_e_branchformer.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/frontend/conversions/hf_llama.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/frontend/conversions/torch_nn.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/frontend/decoder/__init__.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/frontend/decoder/transformer.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/frontend/device.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/frontend/dims.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/frontend/dropout.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/frontend/dtype.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/frontend/encoder/__init__.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/frontend/encoder/base.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/frontend/encoder/conformer.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/frontend/encoder/conformer_v2.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/frontend/encoder/e_branchformer.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/frontend/gradient.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/frontend/graph.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/frontend/hooks.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/frontend/init.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/frontend/label_smoothing.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/frontend/linear.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/frontend/loop.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/frontend/loss.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/frontend/math_.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/frontend/matmul.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/frontend/module.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/frontend/nested.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/frontend/normalization.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/frontend/parameter.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/frontend/parametrizations.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/frontend/parametrize.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/frontend/piecewise_linear.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/frontend/rand.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/frontend/rec.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/frontend/reduce.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/frontend/run_ctx.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/frontend/signal.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/frontend/state.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/frontend/stepwise_scheduler.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/frontend/tensor_array.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/frontend/types.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/import_/__init__.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/import_/common.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/import_/git.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/import_/import_.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/learning_rate_control.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/log.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/native_op.cpp +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/native_op.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/pretrain.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/sprint/__init__.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/sprint/cache.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/sprint/control.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/sprint/error_signals.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/sprint/extern_interface.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/sprint/interface.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/tensor/README.md +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/tensor/__init__.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/tensor/_dim_extra.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/tensor/_tensor_extra.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/tensor/_tensor_mixin_base.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/tensor/_tensor_op_overloads.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/tensor/control_flow_ctx.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/tensor/dim.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/tensor/marked_dim.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/tensor/tensor.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/tensor/utils.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/tf/__init__.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/tf/compat.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/tf/data_pipeline.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/tf/distributed.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/tf/engine.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/tf/frontend_layers/README.md +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/tf/frontend_layers/__init__.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/tf/frontend_layers/_backend.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/tf/frontend_layers/_utils.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/tf/frontend_layers/cond.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/tf/frontend_layers/config_entry_points.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/tf/frontend_layers/debug_eager_mode.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/tf/frontend_layers/dims.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/tf/frontend_layers/layer.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/tf/frontend_layers/loop.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/tf/frontend_layers/make_layer.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/tf/frontend_layers/masked_computation.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/tf/frontend_layers/parameter_assign.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/tf/frontend_layers/prev_tensor_ref.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/tf/frontend_low_level/__init__.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/tf/frontend_low_level/_backend.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/tf/horovod.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/tf/hyper_param_tuning.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/tf/layers/__init__.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/tf/layers/base.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/tf/layers/basic.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/tf/layers/rec.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/tf/layers/segmental_model.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/tf/layers/signal_processing.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/tf/layers/variable.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/tf/native_op.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/tf/network.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/tf/sprint.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/tf/updater.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/tf/util/__init__.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/tf/util/basic.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/tf/util/data.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/tf/util/gradient_checkpoint.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/tf/util/ken_lm.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/tf/util/open_fst.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/torch/README.md +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/torch/__init__.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/torch/data/__init__.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/torch/data/extern_data.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/torch/data/pipeline.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/torch/data/queued_data_iter.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/torch/data/returnn_dataset_wrapper.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/torch/data/tensor_utils.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/torch/distributed.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/torch/frontend/__init__.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/torch/frontend/_backend.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/torch/frontend/_rand.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/torch/frontend/bridge.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/torch/frontend/raw_ops.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/torch/optim/README.md +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/torch/optim/__init__.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/torch/optim/lion.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/torch/updater.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/torch/util/README.md +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/torch/util/__init__.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/torch/util/array_.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/torch/util/diagnose_gpu.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/torch/util/exception_helper.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/torch/util/gradient_checkpoint.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/torch/util/module.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/torch/util/scaled_gradient.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/util/__init__.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/util/basic.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/util/better_exchook.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/util/bpe.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/util/debug.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/util/debug_helpers.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/util/file_cache.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/util/fsa.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/util/literal_py_to_pickle.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/util/lru_cache.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/util/math.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/util/multi_proc_non_daemonic_spawn.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/util/native_code_compiler.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/util/pprint.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/util/py-to-pickle.cpp +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/util/py_ext_mod_compiler.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/util/result_with_reason.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/util/sig_proc.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/util/task_system.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/util/train_proc_manager.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/util/watch_memory.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn.egg-info/SOURCES.txt +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn.egg-info/dependency_links.txt +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn.egg-info/requires.txt +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn.egg-info/top_level.txt +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/rnn.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/setup.cfg +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/setup.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/tests/DummySprintExec.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/tests/PyCharm-inspection-profile.xml +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/tests/PyCharm.idea/.gitignore +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/tests/PyCharm.idea/.name +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/tests/PyCharm.idea/codeStyleSettings.xml +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/tests/PyCharm.idea/codeStyles/Project.xml +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/tests/PyCharm.idea/codeStyles/codeStyleConfig.xml +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/tests/PyCharm.idea/inspectionProfiles/Project_Default.xml +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/tests/PyCharm.idea/inspectionProfiles/profiles_settings.xml +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/tests/PyCharm.idea/misc.xml +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/tests/PyCharm.idea/modules.xml +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/tests/PyCharm.idea/returnn.iml +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/tests/PyCharm.idea/scopes/scope_settings.xml +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/tests/_set_num_threads1.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/tests/_setup_returnn_env.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/tests/_setup_test_env.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/tests/bpe-unicode-demo.codes +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/tests/bpe-unicode-demo.vocab +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/tests/lexicon_opt.fst +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/tests/lexicon_opt.isyms +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/tests/lexicon_opt.jpg +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/tests/lexicon_opt.osyms +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/tests/lint_common.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/tests/pycharm-inspect.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/tests/pylint.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/tests/returnn-as-framework.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/tests/spelling.dic +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/tests/test_Config.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/tests/test_Dataset.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/tests/test_Fsa.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/tests/test_GeneratingDataset.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/tests/test_HDFDataset.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/tests/test_LearningRateControl.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/tests/test_Log.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/tests/test_MultiProcDataset.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/tests/test_Pretrain.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/tests/test_ResNet.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/tests/test_SprintDataset.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/tests/test_SprintInterface.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/tests/test_TFEngine.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/tests/test_TFNativeOp.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/tests/test_TFNetworkLayer.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/tests/test_TFNetworkRecLayer.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/tests/test_TFNetworkSigProcLayer.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/tests/test_TFUpdater.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/tests/test_TFUtil.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/tests/test_TF_determinism.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/tests/test_TaskSystem.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/tests/test_TaskSystem_SharedMem.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/tests/test_TranslationDataset.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/tests/test_Util.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/tests/test_demos.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/tests/test_fork_exec.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/tests/test_hdf_dump.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/tests/test_rf_attention.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/tests/test_rf_base.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/tests/test_rf_cond.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/tests/test_rf_const.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/tests/test_rf_container.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/tests/test_rf_conv.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/tests/test_rf_decoder_transformer.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/tests/test_rf_encoder_conformer.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/tests/test_rf_gradient.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/tests/test_rf_label_smoothing.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/tests/test_rf_loop.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/tests/test_rf_math.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/tests/test_rf_normalization.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/tests/test_rf_piecewise_linear.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/tests/test_rf_rec.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/tests/test_rf_reduce.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/tests/test_rf_signal.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/tests/test_tensor.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/tests/test_threading.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/tests/test_tools.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/tests/test_torch_dataset.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/tests/test_torch_engine.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/tests/test_torch_frontend.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/tests/test_torch_internal_frontend.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/tests/torch_utils.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/tools/_setup_returnn_env.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/tools/analyze-dataset-batches.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/tools/bliss-collect-seq-lens.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/tools/bliss-dump-text.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/tools/bliss-get-segment-names.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/tools/bliss-to-ogg-zip.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/tools/bpe-create-lexicon.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/tools/calculate-word-error-rate.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/tools/cleanup-old-models.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/tools/collect-orth-symbols.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/tools/collect-words.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/tools/compile_native_op.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/tools/compile_tf_graph.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/tools/debug-dump-search-scores.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/tools/debug-plot-search-scores.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/tools/dump-dataset-raw-strings.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/tools/dump-dataset.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/tools/dump-forward-stats.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/tools/dump-forward.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/tools/dump-network-json.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/tools/dump-pickle.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/tools/extract_state_tying_from_dataset.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/tools/get-attention-weights.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/tools/get-best-model-epoch.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/tools/hdf_dump.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/tools/hdf_dump_translation_dataset.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/tools/import-blocks-mt-model.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/tools/import-t2t-mt-model.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/tools/lattice_rescorer/.gitignore +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/tools/lattice_rescorer/Makefile +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/tools/lattice_rescorer/README.md +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/tools/lattice_rescorer/example/README.md +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/tools/lattice_rescorer/example/libs_list +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/tools/lattice_rescorer/example/network.040/i600_m600_m600.sgd_b16_lr0_cl2.newbobabs.config +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/tools/lattice_rescorer/example/network.040/i600_m600_m600.sgd_b16_lr0_cl2.newbobabs.keep_over_epoch.lstm2.config +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/tools/lattice_rescorer/example/rescore_lattice.sh +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/tools/lattice_rescorer/example/state_vars_list +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/tools/lattice_rescorer/example/tensor_names_list +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/tools/lattice_rescorer/file.h +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/tools/lattice_rescorer/htklatticerescorer.cc +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/tools/lattice_rescorer/htklatticerescorer.h +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/tools/lattice_rescorer/main.cc +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/tools/lattice_rescorer/rescorer.h +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/tools/lattice_rescorer/vocabulary.cc +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/tools/lattice_rescorer/vocabulary.h +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/tools/tf_avg_checkpoints.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/tools/tf_inspect_checkpoint.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/tools/tf_inspect_summary_log.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/tools/torch_avg_checkpoints.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/tools/torch_export_to_onnx.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/tools/torch_inspect_checkpoint.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/tools/torch_inspect_checkpoint_and_opt.py +0 -0
- {returnn-1.20250204.4017 → returnn-1.20250206.144022}/tools/torch_scale_tuning.py +0 -0
|
@@ -78,6 +78,8 @@ class Vocabulary:
|
|
|
78
78
|
:param seq_postfix: labels will be added to the seq in self.get_seq
|
|
79
79
|
:param labels:
|
|
80
80
|
"""
|
|
81
|
+
if vocab_file and not isinstance(vocab_file, str): # sometimes it is a Path
|
|
82
|
+
vocab_file = str(vocab_file)
|
|
81
83
|
self.vocab_file = vocab_file
|
|
82
84
|
|
|
83
85
|
if special_symbols_via_file:
|
{returnn-1.20250204.4017 → returnn-1.20250206.144022}/returnn/frontend/encoder/transformer.py
RENAMED
|
@@ -35,6 +35,7 @@ class TransformerEncoder(rf.Module):
|
|
|
35
35
|
layer: Optional[Union[TransformerEncoderLayer, rf.Module, type, Dict[str, Any], Any]] = None,
|
|
36
36
|
layer_opts: Optional[Dict[str, Any]] = None,
|
|
37
37
|
embed_dim: Optional[Dim] = None,
|
|
38
|
+
input_embedding: Union[None, rf.Module, type, Dict[str, Any]] = rf.Embedding,
|
|
38
39
|
input_embedding_scale: float = None,
|
|
39
40
|
input_dropout: float = None,
|
|
40
41
|
sequential=rf.Sequential,
|
|
@@ -53,6 +54,7 @@ class TransformerEncoder(rf.Module):
|
|
|
53
54
|
:param layer: an instance of :class:`TransformerEncoderLayer` or similar
|
|
54
55
|
:param layer_opts: options for the encoder layer
|
|
55
56
|
:param embed_dim: if given, will first have an embedding [vocab,embed] and then a linear [embed,model].
|
|
57
|
+
:param input_embedding:
|
|
56
58
|
:param input_embedding_scale:
|
|
57
59
|
:param input_dropout:
|
|
58
60
|
:param sequential:
|
|
@@ -77,9 +79,15 @@ class TransformerEncoder(rf.Module):
|
|
|
77
79
|
self.model_dim = model_dim
|
|
78
80
|
self.embed_dim = embed_dim
|
|
79
81
|
|
|
80
|
-
|
|
81
|
-
|
|
82
|
-
|
|
82
|
+
if input_embedding is None or isinstance(input_embedding, rf.Module):
|
|
83
|
+
pass
|
|
84
|
+
elif isinstance(input_embedding, type):
|
|
85
|
+
input_embedding: rf.Embedding = input_embedding(vocab_dim, embed_dim or model_dim)
|
|
86
|
+
elif isinstance(input_embedding, dict):
|
|
87
|
+
input_embedding = rf.build_from_dict(input_embedding, vocab_dim, embed_dim or model_dim)
|
|
88
|
+
else:
|
|
89
|
+
raise TypeError(f"unexpected input_embedding {input_embedding!r} type {type(input_embedding)}")
|
|
90
|
+
self.input_embedding = input_embedding
|
|
83
91
|
|
|
84
92
|
self.input_embedding_proj = None
|
|
85
93
|
if embed_dim:
|
|
@@ -88,17 +96,13 @@ class TransformerEncoder(rf.Module):
|
|
|
88
96
|
if pos_enc is None:
|
|
89
97
|
pass
|
|
90
98
|
elif isinstance(pos_enc, dict):
|
|
91
|
-
pos_enc = rf.build_from_dict(
|
|
92
|
-
pos_enc, feat_dim=embed_dim or model_dim, dtype=self.input_embedding.weight.dtype
|
|
93
|
-
)
|
|
99
|
+
pos_enc = rf.build_from_dict(pos_enc, feat_dim=embed_dim or model_dim, dtype=rf.get_default_float_dtype())
|
|
94
100
|
elif isinstance(pos_enc, rf.Module):
|
|
95
101
|
pass
|
|
96
102
|
elif isinstance(pos_enc, FunctionType):
|
|
97
|
-
pos_enc = functools.partial(
|
|
98
|
-
pos_enc, feat_dim=embed_dim or model_dim, dtype=self.input_embedding.weight.dtype
|
|
99
|
-
)
|
|
103
|
+
pos_enc = functools.partial(pos_enc, feat_dim=embed_dim or model_dim, dtype=rf.get_default_float_dtype())
|
|
100
104
|
else:
|
|
101
|
-
raise TypeError(f"unexpected pos_enc
|
|
105
|
+
raise TypeError(f"unexpected pos_enc {pos_enc!r} type {type(pos_enc)}")
|
|
102
106
|
self.pos_enc = pos_enc
|
|
103
107
|
if input_embedding_scale is None:
|
|
104
108
|
input_embedding_scale = model_dim.dimension**0.5
|
|
@@ -157,7 +161,11 @@ class TransformerEncoder(rf.Module):
|
|
|
157
161
|
:param collected_outputs:
|
|
158
162
|
:return: final encoder output, after final layer norm
|
|
159
163
|
"""
|
|
160
|
-
|
|
164
|
+
if self.input_embedding is not None:
|
|
165
|
+
decoded = self.input_embedding(source) * self.input_embedding_scale
|
|
166
|
+
else:
|
|
167
|
+
assert self.model_dim in source.dims
|
|
168
|
+
decoded = source
|
|
161
169
|
if self.pos_enc is not None:
|
|
162
170
|
decoded = decoded + self.pos_enc(spatial_dim=spatial_dim)
|
|
163
171
|
decoded = rf.dropout(decoded, self.input_dropout)
|
|
@@ -139,7 +139,7 @@ class TensorDict:
|
|
|
139
139
|
"""
|
|
140
140
|
visited_dims = set()
|
|
141
141
|
for key, value in self.data.items():
|
|
142
|
-
assert key in raw_tensor_dict
|
|
142
|
+
assert key in raw_tensor_dict, f"key {key} not in raw_tensor_dict {list(raw_tensor_dict.keys())}"
|
|
143
143
|
value.raw_tensor = raw_tensor_dict[key]
|
|
144
144
|
for i, dim in enumerate(value.dims):
|
|
145
145
|
dim: Dim
|
|
@@ -505,12 +505,35 @@ class Engine(EngineBase):
|
|
|
505
505
|
file=log.v1,
|
|
506
506
|
)
|
|
507
507
|
|
|
508
|
+
print("Checking for inf/nan in model parameters...", file=log.v1)
|
|
509
|
+
count_nan_inf_params = 0
|
|
510
|
+
for name, param in self._pt_model.named_parameters():
|
|
511
|
+
got_nan_inf_t = torch.stack([torch.isnan(param).any(), torch.isinf(param).any()]).cpu()
|
|
512
|
+
got_nan = got_nan_inf_t[0].item()
|
|
513
|
+
got_inf = got_nan_inf_t[1].item()
|
|
514
|
+
if got_nan or got_inf:
|
|
515
|
+
s = "/".join([s_ for s_, b in [("nan", got_nan), ("inf", got_inf)] if b])
|
|
516
|
+
print(f" {name} {param}: {s}", file=log.v1)
|
|
517
|
+
count_nan_inf_params += 1
|
|
518
|
+
if count_nan_inf_params == 0:
|
|
519
|
+
print("(No inf/nan in model parameters.)", file=log.v1)
|
|
520
|
+
|
|
508
521
|
def _debug_func() -> torch.Tensor:
|
|
509
522
|
self._run_step(extern_data, train_flag=True, train_func=True)
|
|
510
|
-
|
|
523
|
+
loss = rf.get_run_ctx().total_loss()
|
|
524
|
+
assert isinstance(loss, Tensor)
|
|
525
|
+
return loss.raw_tensor
|
|
511
526
|
|
|
512
527
|
print("Running debug_inf_nan...", file=log.v1)
|
|
513
528
|
debug_inf_nan(_debug_func, with_grad=True)
|
|
529
|
+
if count_nan_inf_params > 0 and self.global_train_step == 1:
|
|
530
|
+
print(
|
|
531
|
+
"This was the second step, so likely the first step grad was broken."
|
|
532
|
+
" Try again with reset model...",
|
|
533
|
+
file=log.v1,
|
|
534
|
+
)
|
|
535
|
+
self._load_model()
|
|
536
|
+
debug_inf_nan(_debug_func, with_grad=True)
|
|
514
537
|
raise Exception(f"Inf/nan score in step {step_idx}.")
|
|
515
538
|
|
|
516
539
|
step_idx += 1
|
|
@@ -52,6 +52,7 @@ def debug_inf_nan(
|
|
|
52
52
|
*,
|
|
53
53
|
with_grad: bool = False,
|
|
54
54
|
report_every_op_call: bool = True,
|
|
55
|
+
stop_reporting_after_first_inf_nan: bool = True,
|
|
55
56
|
file: Optional[Union[TextIO, TextIOBase]] = None,
|
|
56
57
|
):
|
|
57
58
|
"""
|
|
@@ -61,6 +62,7 @@ def debug_inf_nan(
|
|
|
61
62
|
and we will call `loss = func(); loss.backward()`.
|
|
62
63
|
:param with_grad: whether to compute and debug gradients for inf/nan.
|
|
63
64
|
:param report_every_op_call: whether to report every op call.
|
|
65
|
+
:param stop_reporting_after_first_inf_nan: whether to stop reporting after the first inf/nan.
|
|
64
66
|
:param file: where to write the output to. Default is stdout.
|
|
65
67
|
"""
|
|
66
68
|
|
|
@@ -69,13 +71,18 @@ def debug_inf_nan(
|
|
|
69
71
|
|
|
70
72
|
# noinspection PyUnresolvedReferences,PyProtectedMember
|
|
71
73
|
cur_frame: FrameType = sys._getframe()
|
|
72
|
-
trace_ops = _TraceOps(
|
|
74
|
+
trace_ops = _TraceOps(
|
|
75
|
+
root_frame=cur_frame,
|
|
76
|
+
file=file,
|
|
77
|
+
report_every_op_call=report_every_op_call,
|
|
78
|
+
stop_reporting_after_first_inf_nan=stop_reporting_after_first_inf_nan,
|
|
79
|
+
)
|
|
73
80
|
|
|
74
81
|
if with_grad:
|
|
75
|
-
|
|
76
82
|
with torch.autograd.detect_anomaly():
|
|
77
83
|
with trace_ops: # currently only for forward (but we might want to trace the backward too)
|
|
78
84
|
loss = func()
|
|
85
|
+
file.flush() # the backward detect_anomaly might screw up the output otherwise
|
|
79
86
|
try:
|
|
80
87
|
loss.backward()
|
|
81
88
|
except RuntimeError as exc:
|
|
@@ -89,23 +96,46 @@ def debug_inf_nan(
|
|
|
89
96
|
|
|
90
97
|
# For efficiency, and to be less spammy
|
|
91
98
|
_TraceFuncNameBlacklist = {
|
|
92
|
-
"aten::detach",
|
|
93
99
|
"aten::zeros_like",
|
|
94
100
|
"aten::ones_like",
|
|
101
|
+
"aten::full",
|
|
102
|
+
"aten::scalar_tensor", # when we deliberately create a scalar inf tensor
|
|
103
|
+
"aten::_local_scalar_dense",
|
|
104
|
+
"aten::where.self", # when we intentionally mask with inf
|
|
105
|
+
"aten::detach",
|
|
106
|
+
"aten::_to_copy",
|
|
107
|
+
"aten::clone",
|
|
108
|
+
"aten::stack",
|
|
109
|
+
"aten::view",
|
|
110
|
+
"aten::_unsafe_view",
|
|
111
|
+
"aten::permute",
|
|
112
|
+
"aten::t",
|
|
113
|
+
"aten::split_with_sizes",
|
|
114
|
+
"aten::slice.Tensor",
|
|
115
|
+
"aten::select.int",
|
|
95
116
|
}
|
|
96
117
|
|
|
97
118
|
|
|
98
119
|
class _TraceOps(TorchDispatchMode):
|
|
99
|
-
def __init__(
|
|
120
|
+
def __init__(
|
|
121
|
+
self,
|
|
122
|
+
*,
|
|
123
|
+
root_frame: FrameType,
|
|
124
|
+
file: Union[TextIO, TextIOBase],
|
|
125
|
+
report_every_op_call: bool = True,
|
|
126
|
+
stop_reporting_after_first_inf_nan: bool = True,
|
|
127
|
+
):
|
|
100
128
|
super().__init__()
|
|
101
129
|
self.root_frame = root_frame
|
|
102
130
|
self.file = file
|
|
131
|
+
self.enabled = True
|
|
103
132
|
self.report_every_op_call = report_every_op_call
|
|
133
|
+
self.stop_reporting_after_first_inf_nan = stop_reporting_after_first_inf_nan
|
|
104
134
|
|
|
105
135
|
def __torch_dispatch__(self, func, types, args=(), kwargs=None):
|
|
106
136
|
if kwargs is None:
|
|
107
137
|
kwargs = {}
|
|
108
|
-
if func.name() in _TraceFuncNameBlacklist:
|
|
138
|
+
if not self.enabled or func.name() in _TraceFuncNameBlacklist:
|
|
109
139
|
return func(*args, **kwargs)
|
|
110
140
|
if self.report_every_op_call:
|
|
111
141
|
print(f"--- op {func.name()}", file=self.file)
|
|
@@ -121,6 +151,8 @@ class _TraceOps(TorchDispatchMode):
|
|
|
121
151
|
traceback.print_list(
|
|
122
152
|
_extract_stack_up_to(skip_top_num_frames=1, root_frame=self.root_frame), file=self.file
|
|
123
153
|
)
|
|
154
|
+
if self.stop_reporting_after_first_inf_nan:
|
|
155
|
+
self.enabled = False
|
|
124
156
|
return out
|
|
125
157
|
|
|
126
158
|
|
|
@@ -55,6 +55,7 @@ def run_model(
|
|
|
55
55
|
dyn_dim_max_sizes: Optional[Dict[Dim, int]] = None,
|
|
56
56
|
dyn_dim_min_sizes: Optional[Dict[Dim, int]] = None,
|
|
57
57
|
test_tensorflow: bool = True,
|
|
58
|
+
allow_inf_nan_in_output: bool = False,
|
|
58
59
|
) -> TensorDict:
|
|
59
60
|
"""run"""
|
|
60
61
|
print(f"* run_model with dyn_dim_max_sizes={dyn_dim_max_sizes!r}")
|
|
@@ -70,6 +71,10 @@ def run_model(
|
|
|
70
71
|
# get the values now because dims might get overwritten
|
|
71
72
|
out_pt_raw = out_pt.as_raw_tensor_dict(include_const_sizes=True)
|
|
72
73
|
|
|
74
|
+
if not allow_inf_nan_in_output:
|
|
75
|
+
for k, v in out_pt.data.items():
|
|
76
|
+
assert numpy.isfinite(v.raw_tensor).all(), f"output {k!r} has non-finite values: {v.raw_tensor}"
|
|
77
|
+
|
|
73
78
|
if not test_tensorflow:
|
|
74
79
|
return out_pt
|
|
75
80
|
if disable_tf:
|
|
@@ -86,8 +91,10 @@ def run_model(
|
|
|
86
91
|
random_journal: RandomJournal
|
|
87
92
|
assert random_journal.reached_end()
|
|
88
93
|
|
|
89
|
-
print(out_pt, out_tf)
|
|
90
|
-
assert set(out_pt.data.keys()) == set(
|
|
94
|
+
print("Output PT/TF:", out_pt, out_tf)
|
|
95
|
+
assert set(out_pt.data.keys()) == set(
|
|
96
|
+
out_tf.data.keys()
|
|
97
|
+
), f"PT output {list(out_pt.data.keys())} vs TF output {list(out_tf.data.keys())}"
|
|
91
98
|
for k, v_pt in out_pt.data.items():
|
|
92
99
|
v_tf = out_tf[k]
|
|
93
100
|
# We cannot really check the dims directly for equality,
|
|
@@ -123,11 +130,31 @@ def _run_model_torch(extern_data: TensorDict, get_model: rf.GetModelFunc, forwar
|
|
|
123
130
|
# We recover extern_data in the end.
|
|
124
131
|
tensor_dict_numpy_to_torch_(extern_data)
|
|
125
132
|
|
|
133
|
+
for k, v in extern_data.data.items():
|
|
134
|
+
if v.raw_tensor.dtype.is_floating_point:
|
|
135
|
+
v.raw_tensor.requires_grad = True
|
|
136
|
+
|
|
126
137
|
model = get_model(epoch=1, step=0)
|
|
127
138
|
rf.init_forward_step_run_ctx(epoch=1, step=0)
|
|
128
139
|
forward_step(model=model, extern_data=extern_data)
|
|
129
140
|
outputs = rf.get_run_ctx().outputs
|
|
130
141
|
assert outputs.data
|
|
142
|
+
|
|
143
|
+
if "loss" in outputs.data:
|
|
144
|
+
loss = outputs.data["loss"]
|
|
145
|
+
assert isinstance(loss, Tensor)
|
|
146
|
+
assert loss.raw_tensor.dtype.is_floating_point
|
|
147
|
+
loss = rf.reduce_sum(loss, axis=loss.dims)
|
|
148
|
+
print("loss:", loss.raw_tensor.detach().numpy().item())
|
|
149
|
+
loss.raw_tensor.backward()
|
|
150
|
+
for k, v in list(extern_data.data.items()):
|
|
151
|
+
if v.raw_tensor.dtype.is_floating_point:
|
|
152
|
+
assert v.raw_tensor.grad is not None, f"no grad for {k}"
|
|
153
|
+
v_grad = v.copy_template()
|
|
154
|
+
v_grad.raw_tensor = v.raw_tensor.grad
|
|
155
|
+
assert f"{k}_grad" not in outputs.data
|
|
156
|
+
outputs.data[f"{k}_grad"] = v_grad
|
|
157
|
+
|
|
131
158
|
tensor_dict_torch_to_numpy_(outputs)
|
|
132
159
|
|
|
133
160
|
extern_data.assign_from_raw_tensor_dict_(extern_data_raw)
|
|
@@ -242,6 +269,20 @@ def _run_model_net_dict_tf(
|
|
|
242
269
|
layer = net.get_layer(layer_name)
|
|
243
270
|
outputs_tf.data[k] = layer.output.copy()
|
|
244
271
|
|
|
272
|
+
if "loss" in outputs_tf.data:
|
|
273
|
+
data_ = {name: data for name, data in net.extern_data.data.items() if data.dtype.startswith("float")}
|
|
274
|
+
loss = outputs_tf.data["loss"]
|
|
275
|
+
assert isinstance(loss, Tensor)
|
|
276
|
+
assert loss.dtype.startswith("float")
|
|
277
|
+
loss = rf.reduce_sum(loss, axis=loss.dims)
|
|
278
|
+
d_grads = tf.gradients(loss.raw_tensor, [d.raw_tensor for d in data_.values()])
|
|
279
|
+
for (name, data), d_grad_tf in zip(data_.items(), d_grads):
|
|
280
|
+
assert isinstance(data, Tensor)
|
|
281
|
+
assert isinstance(d_grad_tf, tf.Tensor)
|
|
282
|
+
d_grad = data.copy_template()
|
|
283
|
+
d_grad.raw_tensor = d_grad_tf
|
|
284
|
+
outputs_tf.data[f"{name}_grad"] = d_grad
|
|
285
|
+
|
|
245
286
|
fetches = outputs_tf.as_raw_tensor_dict(expected_value_type=tf.Tensor)
|
|
246
287
|
assert set(extern_data.data.keys()) == set(net.extern_data.data.keys())
|
|
247
288
|
extern_data_tf_placeholders = net.extern_data.as_raw_tensor_dict(expected_value_type=tf.Tensor)
|
|
@@ -627,6 +627,27 @@ def test_gather_time_static_clip_to_valid():
|
|
|
627
627
|
run_model(extern_data_template, lambda *, epoch, step: rf.Module(), _forward_step)
|
|
628
628
|
|
|
629
629
|
|
|
630
|
+
def test_gather_3d_embed():
|
|
631
|
+
time_dim = Dim(Tensor("time", [batch_dim], dtype="int32"))
|
|
632
|
+
in_dim = Dim(7, name="in")
|
|
633
|
+
num_embeddings_dim = Dim(2, name="num_embeddings")
|
|
634
|
+
embed_dim = Dim(11, name="embed")
|
|
635
|
+
extern_data_template = TensorDict(
|
|
636
|
+
{
|
|
637
|
+
"data": Tensor("data", [batch_dim, time_dim], sparse_dim=in_dim, dtype="int32"),
|
|
638
|
+
"embed": Tensor("embed", [in_dim, num_embeddings_dim, embed_dim], dtype="float32"),
|
|
639
|
+
}
|
|
640
|
+
)
|
|
641
|
+
|
|
642
|
+
def _forward_step(*, extern_data: TensorDict, **_kwargs):
|
|
643
|
+
x, embed = extern_data["data"], extern_data["embed"]
|
|
644
|
+
out = rf.gather(embed, indices=x)
|
|
645
|
+
out.mark_as_default_output(shape=(batch_dim, time_dim, num_embeddings_dim, embed_dim))
|
|
646
|
+
rf.reduce_sum(out, axis=out.dims).mark_as_output("loss")
|
|
647
|
+
|
|
648
|
+
run_model(extern_data_template, lambda *, epoch, step: rf.Module(), _forward_step)
|
|
649
|
+
|
|
650
|
+
|
|
630
651
|
def test_scatter_fill_inf():
|
|
631
652
|
batch_dim_ = Dim(3, name="batch")
|
|
632
653
|
states_dim = Dim(7, name="states")
|
|
@@ -645,7 +666,13 @@ def test_scatter_fill_inf():
|
|
|
645
666
|
) # [S], per state
|
|
646
667
|
scores.mark_as_default_output(shape=[states_dim])
|
|
647
668
|
|
|
648
|
-
res = run_model(
|
|
669
|
+
res = run_model(
|
|
670
|
+
TensorDict(),
|
|
671
|
+
lambda *, epoch, step: rf.Module(),
|
|
672
|
+
_forward_step,
|
|
673
|
+
test_tensorflow=False,
|
|
674
|
+
allow_inf_nan_in_output=True,
|
|
675
|
+
)
|
|
649
676
|
batch_size = res["batch_size"].raw_tensor.item()
|
|
650
677
|
assert res["start_states"].raw_tensor.shape == (batch_size,)
|
|
651
678
|
assert res["output"].raw_tensor.shape == (states_dim.dimension,)
|
|
@@ -286,12 +286,12 @@ def test_debug_inf_nan():
|
|
|
286
286
|
|
|
287
287
|
# Run directly, to just test that it goes through without exception.
|
|
288
288
|
# For some reason, the detect_anomaly does not print the forward op?
|
|
289
|
-
debug_inf_nan(func, with_grad=True)
|
|
289
|
+
debug_inf_nan(func, with_grad=True, stop_reporting_after_first_inf_nan=False)
|
|
290
290
|
|
|
291
291
|
from io import StringIO
|
|
292
292
|
|
|
293
293
|
out = StringIO()
|
|
294
|
-
debug_inf_nan(func, file=out)
|
|
294
|
+
debug_inf_nan(func, file=out, stop_reporting_after_first_inf_nan=False)
|
|
295
295
|
assert "inf in aten.exp" in out.getvalue()
|
|
296
296
|
assert "nan in aten.div" in out.getvalue()
|
|
297
297
|
assert "mod5" in out.getvalue()
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
{returnn-1.20250204.4017 → returnn-1.20250206.144022}/demos/demo-record-and-push-to-webserver.py
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
{returnn-1.20250204.4017 → returnn-1.20250206.144022}/demos/demo-tf-chunking-blstm.12ax.config
RENAMED
|
File without changes
|
{returnn-1.20250204.4017 → returnn-1.20250206.144022}/demos/demo-tf-contribrnn-lstm.12ax.config
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
{returnn-1.20250204.4017 → returnn-1.20250206.144022}/demos/demo-tf-maxgradnorm-lstm.12ax.config
RENAMED
|
File without changes
|
{returnn-1.20250204.4017 → returnn-1.20250206.144022}/demos/demo-tf-native-lstm-lowmem.12ax.config
RENAMED
|
File without changes
|
|
File without changes
|
{returnn-1.20250204.4017 → returnn-1.20250206.144022}/demos/demo-tf-native-lstm2.12ax.config
RENAMED
|
File without changes
|
{returnn-1.20250204.4017 → returnn-1.20250206.144022}/demos/demo-tf-native-lstm2.12ax.tuned.config
RENAMED
|
File without changes
|
{returnn-1.20250204.4017 → returnn-1.20250206.144022}/demos/demo-tf-neural-transducer.12ax.config
RENAMED
|
File without changes
|
{returnn-1.20250204.4017 → returnn-1.20250206.144022}/demos/demo-tf-rec-explicit-lstm.config
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
{returnn-1.20250204.4017 → returnn-1.20250206.144022}/demos/demo-tf-search-compiled-graph.py
RENAMED
|
File without changes
|
{returnn-1.20250204.4017 → returnn-1.20250206.144022}/demos/demo-tf-vanilla-lstm.12ax.config
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
{returnn-1.20250204.4017 → returnn-1.20250206.144022}/demos/demo-upd-mult-model.lstm.12ax.config
RENAMED
|
File without changes
|
|
File without changes
|
{returnn-1.20250204.4017 → returnn-1.20250206.144022}/demos/mdlstm/IAM/IAM_lines/a01-000u-00.png
RENAMED
|
File without changes
|
{returnn-1.20250204.4017 → returnn-1.20250206.144022}/demos/mdlstm/IAM/IAM_lines/a01-007-04.png
RENAMED
|
File without changes
|
{returnn-1.20250204.4017 → returnn-1.20250206.144022}/demos/mdlstm/IAM/IAM_lines/a01-007-06.png
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
{returnn-1.20250204.4017 → returnn-1.20250206.144022}/demos/mdlstm/IAM/create_IAM_dataset.py
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
{returnn-1.20250204.4017 → returnn-1.20250206.144022}/demos/mdlstm/artificial/create_test_h5.py
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
{returnn-1.20250204.4017 → returnn-1.20250206.144022}/demos/mdlstm/artificial_rgb/create_test_h5.py
RENAMED
|
File without changes
|
{returnn-1.20250204.4017 → returnn-1.20250206.144022}/demos/mdlstm/artificial_rgb/forwardconfig
RENAMED
|
File without changes
|
|
File without changes
|
{returnn-1.20250204.4017 → returnn-1.20250206.144022}/demos/mdlstm/artificial_rgb/trainconfig
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|