PyPI - sdft-pytorch - Versions diffs - 0.0.1__tar.gz → 0.0.2__tar.gz - Mend

sdft-pytorch 0.0.1tar.gz → 0.0.2tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (13) hide show

{sdft_pytorch-0.0.1/sdft_pytorch.egg-info → sdft_pytorch-0.0.2}/PKG-INFO RENAMED Viewed

@@ -1,6 +1,6 @@
 Metadata-Version: 2.4
 Name: sdft-pytorch
-Version: 0.0.1
+Version: 0.0.2
 Summary: SDFT - Pytorch
 Author-email: Phil Wang <lucidrains@gmail.com>
 License: MIT

{sdft_pytorch-0.0.1 → sdft_pytorch-0.0.2}/pyproject.toml RENAMED Viewed

@@ -4,7 +4,7 @@ build-backend = "setuptools.build_meta"
 [project]
 name = "sdft-pytorch"
-version = "0.0.1"
+version = "0.0.2"
 description = "SDFT - Pytorch"
 readme = "README.md"
 requires-python = ">=3.10"

{sdft_pytorch-0.0.1 → sdft_pytorch-0.0.2}/sdft_pytorch/sdft_pytorch.py RENAMED Viewed

@@ -11,7 +11,11 @@ from torch import nn, cat, stack, is_tensor, tensor, Tensor
 from einops import rearrange
-from torch_einops_utils import pad_sequence
+from torch_einops_utils import (
+    pad_sequence,
+    safe_cat,
+    masked_mean
+)
 from ema_pytorch import EMA
@@ -71,6 +75,7 @@ class SDFT(Module):
         student_prompt_template = DEFAULT_STUDENT_PROMPT_TEMPLATE,
         teacher_update_rate = 0.01,
         teacher_prompt_template = DEFAULT_TEACHER_PROMPT_TEMPLATE,
+        eos_id = None, # if set, will mask out any losses after the first eos token id detected in a given sample
     ):
         super().__init__()
@@ -100,12 +105,18 @@ class SDFT(Module):
         assert get_variables_from_template(student_prompt_template) == {'question'}
         self.student_prompt_template = Template(student_prompt_template)
+        # end of string
+        self.eos_id = eos_id
     def forward(
         self,
         questions: list[str],
         answers: list[str],
         student_logit_sample_kwargs: dict = dict()
     ):
+        maybe_eos_id = self.eos_id
         encode = self.tokenizer_encode
         assert len(questions) == len(answers)
@@ -128,8 +139,8 @@ class SDFT(Module):
         # accumulate
-        student_response = []
-        token_kl_div_losses = []
+        student_responses = None
+        token_kl_div_losses = None
         for _ in range(self.student_max_response_len):
@@ -156,23 +167,34 @@ class SDFT(Module):
             ).sum(dim = -1)
-            token_kl_div_losses.append(token_kl_div)
+            token_kl_div_losses = safe_cat((token_kl_div_losses, token_kl_div), dim = 1)
             # sample
             sampled_action = self.discrete_readout.sample(student_token_logit, **student_logit_sample_kwargs)
-            student_response.append(sampled_action)
+            student_responses = safe_cat((student_responses, sampled_action), dim = 1)
+            # break if all eos
+            if exists(maybe_eos_id) and (student_responses == maybe_eos_id).any(dim = -1).all():
+                break
             # set student and teacher tokens to the next sampled token
             student_prompt_ids = sampled_action
             teacher_prompt_ids = sampled_action
-        # stack and return
+        # handle eos - keep losses up to and including the first eos token of each sample, mask out the rest
+        mask = None
+        if exists(maybe_eos_id):
+            mask = ((student_responses == maybe_eos_id).cumsum(dim = -1) == 0) # True strictly before the first eos (running eos count still zero)
+            mask = F.pad(mask, (1, -1), value = True) # shift right by one so the first eos position itself is also kept
-        student_response = cat(student_response, dim = 1)
-        token_kl_div_losses = cat(token_kl_div_losses, dim = 1)
+        # maybe masked mean for losses
-        loss = token_kl_div_losses.mean()
+        loss = masked_mean(token_kl_div_losses, mask)
-        return SDFTOutput(loss, student_response)
+        return SDFTOutput(loss, student_responses)

{sdft_pytorch-0.0.1 → sdft_pytorch-0.0.2/sdft_pytorch.egg-info}/PKG-INFO RENAMED Viewed

@@ -1,6 +1,6 @@
 Metadata-Version: 2.4
 Name: sdft-pytorch
-Version: 0.0.1
+Version: 0.0.2
 Summary: SDFT - Pytorch
 Author-email: Phil Wang <lucidrains@gmail.com>
 License: MIT

{sdft_pytorch-0.0.1 → sdft_pytorch-0.0.2}/tests/test_sdft.py RENAMED Viewed

@@ -1,7 +1,13 @@
+import pytest
+param = pytest.mark.parametrize
 import torch
 from sdft_pytorch.sdft_pytorch import SDFT
-def test_sdft():
+@param('eos_id', (None, 1))
+def test_sdft(
+    eos_id
+):
     from torch import tensor
     from x_transformers import TransformerWrapper, Decoder
@@ -24,6 +30,7 @@ def test_sdft():
     sdft_wrapper = SDFT(
         model,
         student_max_response_len = 128,
+        eos_id = eos_id,
         tokenizer_encode = tokenizer_encode,
     )