returnn 1.20250514.151721__py3-none-any.whl → 1.20250516.145734__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Potentially problematic release.
This version of returnn might be problematic. Click here for more details.
- returnn/PKG-INFO +1 -1
- returnn/_setup_info_generated.py +2 -2
- returnn/datasets/lm.py +8 -5
- returnn/frontend/nested.py +3 -0
- {returnn-1.20250514.151721.dist-info → returnn-1.20250516.145734.dist-info}/METADATA +1 -1
- {returnn-1.20250514.151721.dist-info → returnn-1.20250516.145734.dist-info}/RECORD +9 -9
- {returnn-1.20250514.151721.dist-info → returnn-1.20250516.145734.dist-info}/LICENSE +0 -0
- {returnn-1.20250514.151721.dist-info → returnn-1.20250516.145734.dist-info}/WHEEL +0 -0
- {returnn-1.20250514.151721.dist-info → returnn-1.20250516.145734.dist-info}/top_level.txt +0 -0
returnn/PKG-INFO
CHANGED
returnn/_setup_info_generated.py
CHANGED
|
@@ -1,2 +1,2 @@
|
|
|
1
|
-
version = '1.20250514.151721'
|
|
2
|
-
long_version = '1.
|
|
1
|
+
version = '1.20250516.145734'
|
|
2
|
+
long_version = '1.20250516.145734+git.6bf8581'
|
returnn/datasets/lm.py
CHANGED
|
@@ -85,6 +85,7 @@ class LmDataset(CachedDataset2):
|
|
|
85
85
|
add_delayed_seq_data=False,
|
|
86
86
|
delayed_seq_data_start_symbol="[START]",
|
|
87
87
|
dtype: Optional[str] = None,
|
|
88
|
+
tag_prefix: Optional[str] = None,
|
|
88
89
|
**kwargs,
|
|
89
90
|
):
|
|
90
91
|
"""
|
|
@@ -288,7 +289,9 @@ class LmDataset(CachedDataset2):
|
|
|
288
289
|
self.num_outputs = {"data": [num_labels, 1]}
|
|
289
290
|
self.num_inputs = num_labels
|
|
290
291
|
self.seq_order = None
|
|
291
|
-
|
|
292
|
+
|
|
293
|
+
# sequence tag is "line-n", where n is the line number (to be compatible with translation)
|
|
294
|
+
self.tag_prefix = tag_prefix or "line-"
|
|
292
295
|
self.auto_replace_unknown_symbol = auto_replace_unknown_symbol
|
|
293
296
|
self.log_auto_replace_unknown_symbols = log_auto_replace_unknown_symbols
|
|
294
297
|
self.log_skipped_seqs = log_skipped_seqs
|
|
@@ -504,8 +507,8 @@ class LmDataset(CachedDataset2):
|
|
|
504
507
|
elif seq_list is not None:
|
|
505
508
|
# Might not be initialized. Can even do without init. Thus check seq_list_file.
|
|
506
509
|
if self._seq_list_file is None:
|
|
507
|
-
assert all(s.startswith(self.
|
|
508
|
-
self.seq_order = [int(s[len(self.
|
|
510
|
+
assert all(s.startswith(self.tag_prefix) for s in seq_list)
|
|
511
|
+
self.seq_order = [int(s[len(self.tag_prefix) :]) for s in seq_list]
|
|
509
512
|
else:
|
|
510
513
|
# Need seq list for this. Just do the lazy init now.
|
|
511
514
|
self._lazy_init()
|
|
@@ -555,7 +558,7 @@ class LmDataset(CachedDataset2):
|
|
|
555
558
|
if self._seq_list is not None:
|
|
556
559
|
return self._seq_list
|
|
557
560
|
num_seqs = self.get_total_num_seqs()
|
|
558
|
-
return [self.
|
|
561
|
+
return [self.tag_prefix + str(line_nr) for line_nr in range(num_seqs)]
|
|
559
562
|
|
|
560
563
|
def _reduce_log_skipped_seqs(self):
|
|
561
564
|
if isinstance(self.log_skipped_seqs, bool):
|
|
@@ -594,7 +597,7 @@ class LmDataset(CachedDataset2):
|
|
|
594
597
|
idx, offset, len_ = self._orths_offsets_and_lens[true_idx]
|
|
595
598
|
orth = self._orth_mmaps[idx][offset : offset + len_].decode("utf8").strip()
|
|
596
599
|
if self._seq_list is None:
|
|
597
|
-
seq_tag = self.
|
|
600
|
+
seq_tag = self.tag_prefix + str(true_idx)
|
|
598
601
|
else:
|
|
599
602
|
seq_tag = self._seq_list[true_idx]
|
|
600
603
|
self.next_orth_idx += 1
|
returnn/frontend/nested.py
CHANGED
|
@@ -160,6 +160,7 @@ def _gather_prepare_dims(s: T, *, indices: Tensor, dim_map: Dict[Dim, Dim]) -> T
|
|
|
160
160
|
return new_dim
|
|
161
161
|
return s
|
|
162
162
|
# everything else ignored at this stage
|
|
163
|
+
return s
|
|
163
164
|
|
|
164
165
|
|
|
165
166
|
def _gather(s: T, *, indices: Tensor, dim_map: Optional[Dict[Dim, Dim]] = None) -> T:
|
|
@@ -243,6 +244,7 @@ def _masked_select_prepare_dims(s, *, mask: Tensor, dims: Sequence[Dim], out_dim
|
|
|
243
244
|
dim_map[s] = new_dim
|
|
244
245
|
return new_dim
|
|
245
246
|
# everything else ignored at this stage
|
|
247
|
+
return s
|
|
246
248
|
|
|
247
249
|
|
|
248
250
|
def _masked_select(
|
|
@@ -370,6 +372,7 @@ def _masked_scatter_merge_dims(
|
|
|
370
372
|
merged_dim_map[backup] = new_dim
|
|
371
373
|
return new_dim
|
|
372
374
|
# everything else ignored at this stage
|
|
375
|
+
return s
|
|
373
376
|
|
|
374
377
|
|
|
375
378
|
def _masked_scatter(
|
|
@@ -1,9 +1,9 @@
|
|
|
1
|
-
returnn/PKG-INFO,sha256=
|
|
1
|
+
returnn/PKG-INFO,sha256=sMynyg2d9ysTRZSFCwKggJBVS0ONCs7jJ9p7Y9Myf7o,5215
|
|
2
2
|
returnn/__init__.py,sha256=biBtRsM0WZ406vShaeH-9WFoqJ8XwTbn6g0EeFJ7l8E,1012
|
|
3
3
|
returnn/__main__.py,sha256=qBFbuB1yN3adgVM5pXt2-Yq9vorjRNchNPL8kDKx44M,31752
|
|
4
4
|
returnn/__old_mod_loader__.py,sha256=nvsNY-xELdS_IPNkv66Q9Rmvg4dbGW0-EBRDcCmctos,7654
|
|
5
5
|
returnn/__setup__.py,sha256=22kQn2fh11iPM0hLb2Fy5sLmoU1JGvmDxXRYuRgQkwU,4659
|
|
6
|
-
returnn/_setup_info_generated.py,sha256=
|
|
6
|
+
returnn/_setup_info_generated.py,sha256=uEuN_v07wAjAI2gdED6tkP7FaGiO4JlHaTlxuhwQHM4,77
|
|
7
7
|
returnn/config.py,sha256=3tmKhB6FnQZaNdtcYsiB61JnEY--iZ2qmJ4yq0b6tE0,29140
|
|
8
8
|
returnn/forward_iface.py,sha256=A_OJiaXsX4MlXQRzST86ylyxSUZbC402PQL1REcqHjM,911
|
|
9
9
|
returnn/learning_rate_control.py,sha256=ZvWryAn_tv9DhV8sh1LV3eE34Yltl3On3mYZAG4hR9s,34684
|
|
@@ -20,7 +20,7 @@ returnn/datasets/cached2.py,sha256=_6pza3IG68JexaExhj1ld3fP6pE7T-G804driJ9Z_qo,1
|
|
|
20
20
|
returnn/datasets/distrib_files.py,sha256=9-3pJaF8Ws1Cs4AlelFCODz6b5YiaTsrD7tMCB76PDY,29865
|
|
21
21
|
returnn/datasets/generating.py,sha256=9U_w6URIrv-Rb-hDbPOzYW9qYXzJbw32N6G268IKyoM,99833
|
|
22
22
|
returnn/datasets/hdf.py,sha256=v5sjBenURR9Z-g7AQ9tsL84yDSye5RtbLpym3M6HSDE,67833
|
|
23
|
-
returnn/datasets/lm.py,sha256=
|
|
23
|
+
returnn/datasets/lm.py,sha256=IqUsOzbdSWUynL0YFL25HbtMR4AxaQGHvjjqRE9IwBo,99215
|
|
24
24
|
returnn/datasets/map.py,sha256=kOBJVZmwDhLsOplzDNByIfa0NRSUaMo2Lsy36lBvxrM,10907
|
|
25
25
|
returnn/datasets/meta.py,sha256=KQtidTgSh-1gNgbpJ8OhXt6v2lkhPPH5dpjfzwsr3E4,95251
|
|
26
26
|
returnn/datasets/multi_proc.py,sha256=aVjsLt2qjHnHOrEYCgIPCwNYE-f1fiGP6eZ8NGAr3A4,22583
|
|
@@ -104,7 +104,7 @@ returnn/frontend/loss.py,sha256=uSvou2MPd13JiLAg_OIQ3AyyLvD3RHjMEVgFEN0gKqU,7440
|
|
|
104
104
|
returnn/frontend/math_.py,sha256=KlJxdIib8ENlid7cc4lcwHv5e21tzTjTEV8VgEDAijo,16984
|
|
105
105
|
returnn/frontend/matmul.py,sha256=xkueyxzSDz8MsYaWxPSjmV2Yy-tcaiOQDXbFt1IQM2A,1944
|
|
106
106
|
returnn/frontend/module.py,sha256=219rh5mE0CD0-NdxXLsKyhv3BNtOI9jSyiI1Rb8MOyU,10700
|
|
107
|
-
returnn/frontend/nested.py,sha256=
|
|
107
|
+
returnn/frontend/nested.py,sha256=P84u_cjoYdYRJ_0Cbt0vlKXxskmXTDfsnw_vFCCNKtU,15107
|
|
108
108
|
returnn/frontend/normalization.py,sha256=-lYJ9IWcheOQu1gXJehSOA76qgVtxd1C07Jqps6Qg1o,14116
|
|
109
109
|
returnn/frontend/parameter.py,sha256=zvrkhSYC1c_O9kVwgHvOtOnWNurl5J28lkS0i1LQpWU,10627
|
|
110
110
|
returnn/frontend/parametrizations.py,sha256=ptNgBw5IiPXVpB3QGse7AGAhdXp8X1rCqYUl2Mae8aI,2876
|
|
@@ -253,8 +253,8 @@ returnn/util/sig_proc.py,sha256=Tjz0VOAVyqu2qDCF5HZ1JjALjcFsHcNkcd96WgZeKfE,7265
|
|
|
253
253
|
returnn/util/task_system.py,sha256=y4sMVXQ25Qd2z0rx03uOlXlkE-jbCYC1Sjfn-XlraVU,26003
|
|
254
254
|
returnn/util/train_proc_manager.py,sha256=Pjht28k6uz6BNQ47uW6Gf880iyq5q4wx7P_K2tmoAM8,3266
|
|
255
255
|
returnn/util/watch_memory.py,sha256=BR5P2kvBN6UI81cE0_1WAA6Hd1SByLbBaiDxvLhPOew,4213
|
|
256
|
-
returnn-1.20250514.151721.dist-info/LICENSE,sha256=ywBD_U2aD4vpuoIgNAsjIGBYydl0tVKll3De0Z8s77c,11041
|
|
257
|
-
returnn-1.
|
|
258
|
-
returnn-1.20250514.151721.dist-info/WHEEL,sha256=iAkIy5fosb7FzIOwONchHf19Qu7_1wCWyFNR5gu9nU0,91
|
|
259
|
-
returnn-1.20250514.151721.dist-info/top_level.txt,sha256=Lsn4WZc5Pbfk0-xDQOgnFCxOoqxL4CyeM3N1TFbJncw,8
|
|
260
|
-
returnn-1.20250514.151721.dist-info/RECORD,,
|
|
256
|
+
returnn-1.20250516.145734.dist-info/LICENSE,sha256=ywBD_U2aD4vpuoIgNAsjIGBYydl0tVKll3De0Z8s77c,11041
|
|
257
|
+
returnn-1.20250516.145734.dist-info/METADATA,sha256=sMynyg2d9ysTRZSFCwKggJBVS0ONCs7jJ9p7Y9Myf7o,5215
|
|
258
|
+
returnn-1.20250516.145734.dist-info/WHEEL,sha256=iAkIy5fosb7FzIOwONchHf19Qu7_1wCWyFNR5gu9nU0,91
|
|
259
|
+
returnn-1.20250516.145734.dist-info/top_level.txt,sha256=Lsn4WZc5Pbfk0-xDQOgnFCxOoqxL4CyeM3N1TFbJncw,8
|
|
260
|
+
returnn-1.20250516.145734.dist-info/RECORD,,
|
|
File without changes
|
|
File without changes
|
|
File without changes
|