translate-package 0.0.2__tar.gz → 0.0.4__tar.gz
This diff compares the contents of publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between those package versions as they appear in their respective public registries.
- {translate_package-0.0.2 → translate_package-0.0.4}/PKG-INFO +1 -1
- {translate_package-0.0.2 → translate_package-0.0.4}/setup.py +1 -1
- {translate_package-0.0.2 → translate_package-0.0.4}/translate_package/models/machine_translation.py +32 -13
- {translate_package-0.0.2 → translate_package-0.0.4}/translate_package.egg-info/PKG-INFO +1 -1
- {translate_package-0.0.2 → translate_package-0.0.4}/setup.cfg +0 -0
- {translate_package-0.0.2 → translate_package-0.0.4}/translate_package/__init__.py +0 -0
- {translate_package-0.0.2 → translate_package-0.0.4}/translate_package/data/__init__.py +0 -0
- {translate_package-0.0.2 → translate_package-0.0.4}/translate_package/data/__pycache__/__init__.cpython-310.pyc +0 -0
- {translate_package-0.0.2 → translate_package-0.0.4}/translate_package/data/__pycache__/data_preparation.cpython-310.pyc +0 -0
- {translate_package-0.0.2 → translate_package-0.0.4}/translate_package/data/data_preparation.py +0 -0
- {translate_package-0.0.2 → translate_package-0.0.4}/translate_package/errors/__init__.py +0 -0
- {translate_package-0.0.2 → translate_package-0.0.4}/translate_package/errors/__pycache__/__init__.cpython-310.pyc +0 -0
- {translate_package-0.0.2 → translate_package-0.0.4}/translate_package/models/__init__.py +0 -0
- {translate_package-0.0.2 → translate_package-0.0.4}/translate_package/models/__pycache__/__init__.cpython-310.pyc +0 -0
- {translate_package-0.0.2 → translate_package-0.0.4}/translate_package/models/__pycache__/code_generation.cpython-310.pyc +0 -0
- {translate_package-0.0.2 → translate_package-0.0.4}/translate_package/models/__pycache__/machine_translation.cpython-310.pyc +0 -0
- {translate_package-0.0.2 → translate_package-0.0.4}/translate_package/models/gradient_observation.py +0 -0
- {translate_package-0.0.2 → translate_package-0.0.4}/translate_package/models/lstm.py +0 -0
- {translate_package-0.0.2 → translate_package-0.0.4}/translate_package/tokenization/__init__.py +0 -0
- {translate_package-0.0.2 → translate_package-0.0.4}/translate_package/tokenization/__pycache__/__init__.cpython-310.pyc +0 -0
- {translate_package-0.0.2 → translate_package-0.0.4}/translate_package/tokenization/__pycache__/load_tokenizer.cpython-310.pyc +0 -0
- {translate_package-0.0.2 → translate_package-0.0.4}/translate_package/tokenization/__pycache__/train_tokenizer.cpython-310.pyc +0 -0
- {translate_package-0.0.2 → translate_package-0.0.4}/translate_package/tokenization/load_tokenizer.py +0 -0
- {translate_package-0.0.2 → translate_package-0.0.4}/translate_package/tokenization/train_tokenizer.py +0 -0
- {translate_package-0.0.2 → translate_package-0.0.4}/translate_package/utils/__init__.py +0 -0
- {translate_package-0.0.2 → translate_package-0.0.4}/translate_package/utils/__pycache__/__init__.cpython-310.pyc +0 -0
- {translate_package-0.0.2 → translate_package-0.0.4}/translate_package/utils/__pycache__/checkpoint.cpython-310.pyc +0 -0
- {translate_package-0.0.2 → translate_package-0.0.4}/translate_package/utils/checkpoint.py +0 -0
- {translate_package-0.0.2 → translate_package-0.0.4}/translate_package.egg-info/SOURCES.txt +0 -0
- {translate_package-0.0.2 → translate_package-0.0.4}/translate_package.egg-info/dependency_links.txt +0 -0
- {translate_package-0.0.2 → translate_package-0.0.4}/translate_package.egg-info/requires.txt +0 -0
- {translate_package-0.0.2 → translate_package-0.0.4}/translate_package.egg-info/top_level.txt +0 -0
{translate_package-0.0.2 → translate_package-0.0.4}/translate_package/models/machine_translation.py
RENAMED
|
@@ -48,7 +48,7 @@ class MachineTranslationTransformer(pl.LightningModule):
|
|
|
48
48
|
lora_alpha=32,
|
|
49
49
|
lora_dropout=0.05,
|
|
50
50
|
bias="none",
|
|
51
|
-
max_new_tokens=
|
|
51
|
+
max_new_tokens=90,
|
|
52
52
|
predict_with_generate=True,
|
|
53
53
|
num_beams=0,
|
|
54
54
|
use_peft=False,
|
|
@@ -56,7 +56,8 @@ class MachineTranslationTransformer(pl.LightningModule):
|
|
|
56
56
|
num_layers=6,
|
|
57
57
|
hidden_size=128,
|
|
58
58
|
dropout=0.1,
|
|
59
|
-
bidirectional=False
|
|
59
|
+
bidirectional=False,
|
|
60
|
+
length_penalty=1.2
|
|
60
61
|
):
|
|
61
62
|
|
|
62
63
|
super().__init__()
|
|
@@ -131,6 +132,8 @@ class MachineTranslationTransformer(pl.LightningModule):
|
|
|
131
132
|
|
|
132
133
|
self.num_beams = num_beams
|
|
133
134
|
|
|
135
|
+
self.length_penalty = length_penalty
|
|
136
|
+
|
|
134
137
|
self.model_generation = model_generation
|
|
135
138
|
|
|
136
139
|
self.predictions = {
|
|
@@ -263,17 +266,33 @@ class MachineTranslationTransformer(pl.LightningModule):
|
|
|
263
266
|
)
|
|
264
267
|
|
|
265
268
|
# generate predictions
|
|
266
|
-
|
|
267
|
-
|
|
268
|
-
|
|
269
|
-
|
|
270
|
-
|
|
271
|
-
|
|
272
|
-
|
|
273
|
-
|
|
274
|
-
|
|
275
|
-
|
|
276
|
-
|
|
269
|
+
if not self.model_generation in ["lstm"] and self.num_beams > 0:
|
|
270
|
+
|
|
271
|
+
predictions = self.model.generate(
|
|
272
|
+
input_ids=batch["input_ids"],
|
|
273
|
+
attention_mask=batch["attention_mask"],
|
|
274
|
+
max_new_tokens=self.max_new_tokens,
|
|
275
|
+
do_sample=True,
|
|
276
|
+
num_beams=self.num_beams,
|
|
277
|
+
length_penalty=self.length_penalty
|
|
278
|
+
)
|
|
279
|
+
|
|
280
|
+
elif not self.model_generation in ["lstm"]:
|
|
281
|
+
|
|
282
|
+
predictions = self.model.generate(
|
|
283
|
+
input_ids=batch["input_ids"],
|
|
284
|
+
attention_mask=batch["attention_mask"],
|
|
285
|
+
max_new_tokens=self.max_new_tokens,
|
|
286
|
+
do_sample=False
|
|
287
|
+
)
|
|
288
|
+
|
|
289
|
+
else:
|
|
290
|
+
|
|
291
|
+
predictions = self.model.generate(
|
|
292
|
+
input=batch["input_ids"],
|
|
293
|
+
max_new_tokens=self.max_new_tokens,
|
|
294
|
+
use_sampling=True
|
|
295
|
+
)
|
|
277
296
|
|
|
278
297
|
# decode the labels
|
|
279
298
|
predictions = self.tokenizer.batch_decode(predictions, skip_special_tokens=True)
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
{translate_package-0.0.2 → translate_package-0.0.4}/translate_package/data/data_preparation.py
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
{translate_package-0.0.2 → translate_package-0.0.4}/translate_package/models/gradient_observation.py
RENAMED
|
File without changes
|
|
File without changes
|
{translate_package-0.0.2 → translate_package-0.0.4}/translate_package/tokenization/__init__.py
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
{translate_package-0.0.2 → translate_package-0.0.4}/translate_package/tokenization/load_tokenizer.py
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
{translate_package-0.0.2 → translate_package-0.0.4}/translate_package.egg-info/dependency_links.txt
RENAMED
|
File without changes
|
|
File without changes
|
{translate_package-0.0.2 → translate_package-0.0.4}/translate_package.egg-info/top_level.txt
RENAMED
|
File without changes
|