x-transformers 2.4.3__tar.gz → 2.4.5__tar.gz
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- {x_transformers-2.4.3 → x_transformers-2.4.5}/PKG-INFO +1 -1
- {x_transformers-2.4.3 → x_transformers-2.4.5}/pyproject.toml +1 -1
- {x_transformers-2.4.3 → x_transformers-2.4.5}/x_transformers/up_wrapper.py +1 -2
- {x_transformers-2.4.3 → x_transformers-2.4.5}/.github/FUNDING.yml +0 -0
- {x_transformers-2.4.3 → x_transformers-2.4.5}/.github/workflows/python-publish.yml +0 -0
- {x_transformers-2.4.3 → x_transformers-2.4.5}/.github/workflows/python-test.yaml +0 -0
- {x_transformers-2.4.3 → x_transformers-2.4.5}/.gitignore +0 -0
- {x_transformers-2.4.3 → x_transformers-2.4.5}/LICENSE +0 -0
- {x_transformers-2.4.3 → x_transformers-2.4.5}/README.md +0 -0
- {x_transformers-2.4.3 → x_transformers-2.4.5}/data/README.md +0 -0
- {x_transformers-2.4.3 → x_transformers-2.4.5}/data/enwik8.gz +0 -0
- {x_transformers-2.4.3 → x_transformers-2.4.5}/images/all-attention.png +0 -0
- {x_transformers-2.4.3 → x_transformers-2.4.5}/images/attention-on-attention.png +0 -0
- {x_transformers-2.4.3 → x_transformers-2.4.5}/images/cosine-sim-attention.png +0 -0
- {x_transformers-2.4.3 → x_transformers-2.4.5}/images/deepnorm.png +0 -0
- {x_transformers-2.4.3 → x_transformers-2.4.5}/images/dynamic-pos-bias-linear.png +0 -0
- {x_transformers-2.4.3 → x_transformers-2.4.5}/images/dynamic-pos-bias-log.png +0 -0
- {x_transformers-2.4.3 → x_transformers-2.4.5}/images/dynamic-pos-bias-sinusoidal.png +0 -0
- {x_transformers-2.4.3 → x_transformers-2.4.5}/images/dynamic-pos-bias.png +0 -0
- {x_transformers-2.4.3 → x_transformers-2.4.5}/images/enhanced-recurrence.png +0 -0
- {x_transformers-2.4.3 → x_transformers-2.4.5}/images/fcm.png +0 -0
- {x_transformers-2.4.3 → x_transformers-2.4.5}/images/ffglu.png +0 -0
- {x_transformers-2.4.3 → x_transformers-2.4.5}/images/flash-attention.png +0 -0
- {x_transformers-2.4.3 → x_transformers-2.4.5}/images/gate_values.png +0 -0
- {x_transformers-2.4.3 → x_transformers-2.4.5}/images/gating.png +0 -0
- {x_transformers-2.4.3 → x_transformers-2.4.5}/images/length-extrapolation-scale.png +0 -0
- {x_transformers-2.4.3 → x_transformers-2.4.5}/images/macaron-1.png +0 -0
- {x_transformers-2.4.3 → x_transformers-2.4.5}/images/macaron-2.png +0 -0
- {x_transformers-2.4.3 → x_transformers-2.4.5}/images/memory-transformer.png +0 -0
- {x_transformers-2.4.3 → x_transformers-2.4.5}/images/normformer.png +0 -0
- {x_transformers-2.4.3 → x_transformers-2.4.5}/images/pia.png +0 -0
- {x_transformers-2.4.3 → x_transformers-2.4.5}/images/qknorm-analysis.png +0 -0
- {x_transformers-2.4.3 → x_transformers-2.4.5}/images/resi_dual.png +0 -0
- {x_transformers-2.4.3 → x_transformers-2.4.5}/images/residual_attn.png +0 -0
- {x_transformers-2.4.3 → x_transformers-2.4.5}/images/rezero.png +0 -0
- {x_transformers-2.4.3 → x_transformers-2.4.5}/images/rotary.png +0 -0
- {x_transformers-2.4.3 → x_transformers-2.4.5}/images/sandwich-2.png +0 -0
- {x_transformers-2.4.3 → x_transformers-2.4.5}/images/sandwich.png +0 -0
- {x_transformers-2.4.3 → x_transformers-2.4.5}/images/sandwich_norm.png +0 -0
- {x_transformers-2.4.3 → x_transformers-2.4.5}/images/scalenorm.png +0 -0
- {x_transformers-2.4.3 → x_transformers-2.4.5}/images/talking-heads.png +0 -0
- {x_transformers-2.4.3 → x_transformers-2.4.5}/images/topk-attention.png +0 -0
- {x_transformers-2.4.3 → x_transformers-2.4.5}/images/xval.png +0 -0
- {x_transformers-2.4.3 → x_transformers-2.4.5}/tests/test_x_transformers.py +0 -0
- {x_transformers-2.4.3 → x_transformers-2.4.5}/train_belief_state.py +0 -0
- {x_transformers-2.4.3 → x_transformers-2.4.5}/train_copy.py +0 -0
- {x_transformers-2.4.3 → x_transformers-2.4.5}/train_entropy_tokenizer.py +0 -0
- {x_transformers-2.4.3 → x_transformers-2.4.5}/train_enwik8.py +0 -0
- {x_transformers-2.4.3 → x_transformers-2.4.5}/train_length_extrapolate.py +0 -0
- {x_transformers-2.4.3 → x_transformers-2.4.5}/train_parity.py +0 -0
- {x_transformers-2.4.3 → x_transformers-2.4.5}/x_transformers/__init__.py +0 -0
- {x_transformers-2.4.3 → x_transformers-2.4.5}/x_transformers/attend.py +0 -0
- {x_transformers-2.4.3 → x_transformers-2.4.5}/x_transformers/autoregressive_wrapper.py +0 -0
- {x_transformers-2.4.3 → x_transformers-2.4.5}/x_transformers/belief_state_wrapper.py +0 -0
- {x_transformers-2.4.3 → x_transformers-2.4.5}/x_transformers/continuous.py +0 -0
- {x_transformers-2.4.3 → x_transformers-2.4.5}/x_transformers/dpo.py +0 -0
- {x_transformers-2.4.3 → x_transformers-2.4.5}/x_transformers/entropy_based_tokenizer.py +0 -0
- {x_transformers-2.4.3 → x_transformers-2.4.5}/x_transformers/multi_input.py +0 -0
- {x_transformers-2.4.3 → x_transformers-2.4.5}/x_transformers/neo_mlp.py +0 -0
- {x_transformers-2.4.3 → x_transformers-2.4.5}/x_transformers/nonautoregressive_wrapper.py +0 -0
- {x_transformers-2.4.3 → x_transformers-2.4.5}/x_transformers/x_transformers.py +0 -0
- {x_transformers-2.4.3 → x_transformers-2.4.5}/x_transformers/xl_autoregressive_wrapper.py +0 -0
- {x_transformers-2.4.3 → x_transformers-2.4.5}/x_transformers/xval.py +0 -0
|
@@ -133,7 +133,7 @@ class UniversalPretrainWrapper(Module):
     def __init__(
         self,
         model: TransformerWrapper,
-        data_generator: SyntheticDataGenerator | None = None,
+        data_generator: SyntheticDataGenerator | Module | None = None,
         buffer_size = None,
         num_reset = 20,
         batch_size = 32,
@@ -222,7 +222,6 @@ class UniversalPretrainWrapper(Module):
         # place "enriched" random generated sequences back
 
         with torch.no_grad():
-            print(conditions.shape, generated.shape)
             conditions.copy_(generated)
 
         # sample yet again according to pseudocode
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|