PyPI - sae-lens - Versions diffs - 6.30.1__tar.gz → 6.31.0__tar.gz - Mend

sae-lens 6.30.1__tar.gz → 6.31.0__tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (52) hide show

{sae_lens-6.30.1 → sae_lens-6.31.0}/PKG-INFO RENAMED Viewed

@@ -1,6 +1,6 @@
 Metadata-Version: 2.4
 Name: sae-lens
-Version: 6.30.1
+Version: 6.31.0
 Summary: Training and Analyzing Sparse Autoencoders (SAEs)
 License: MIT
 License-File: LICENSE

{sae_lens-6.30.1 → sae_lens-6.31.0}/pyproject.toml RENAMED Viewed

@@ -1,6 +1,6 @@
 [tool.poetry]
 name = "sae-lens"
-version = "6.30.1"
+version = "6.31.0"
 description = "Training and Analyzing Sparse Autoencoders (SAEs)"
 authors = ["Joseph Bloom"]
 readme = "README.md"

{sae_lens-6.30.1 → sae_lens-6.31.0}/sae_lens/__init__.py RENAMED Viewed

@@ -1,5 +1,5 @@
 # ruff: noqa: E402
-__version__ = "6.30.1"
+__version__ = "6.31.0"
 import logging

{sae_lens-6.30.1 → sae_lens-6.31.0}/sae_lens/config.py RENAMED Viewed

@@ -82,6 +82,7 @@ class LoggingConfig:
     log_to_wandb: bool = True
     log_activations_store_to_wandb: bool = False
     log_optimizer_state_to_wandb: bool = False
+    log_weights_to_wandb: bool = True
     wandb_project: str = "sae_lens_training"
     wandb_id: str | None = None
     run_name: str | None = None
@@ -107,7 +108,8 @@ class LoggingConfig:
             type="model",
             metadata=dict(trainer.cfg.__dict__),
         )
-        model_artifact.add_file(str(weights_path))
+        if self.log_weights_to_wandb:
+            model_artifact.add_file(str(weights_path))
         model_artifact.add_file(str(cfg_path))
         wandb.log_artifact(model_artifact, aliases=wandb_aliases)
@@ -557,6 +559,12 @@ class CacheActivationsRunnerConfig:
                 context_size=self.context_size,
             )
+        if self.context_size > self.training_tokens:
+            raise ValueError(
+                f"context_size ({self.context_size}) is greater than training_tokens "
+                f"({self.training_tokens}). Please reduce context_size or increase training_tokens."
+            )
         if self.new_cached_activations_path is None:
             self.new_cached_activations_path = _default_cached_activations_path(  # type: ignore
                 self.dataset_path, self.model_name, self.hook_name, None

{sae_lens-6.30.1 → sae_lens-6.31.0}/sae_lens/evals.py RENAMED Viewed

@@ -335,7 +335,7 @@ def get_downstream_reconstruction_metrics(
     batch_iter = range(n_batches)
     if verbose:
-        batch_iter = tqdm(batch_iter, desc="Reconstruction Batches")
+        batch_iter = tqdm(batch_iter, desc="Reconstruction Batches", leave=False)
     for _ in batch_iter:
         batch_tokens = activation_store.get_batch_tokens(eval_batch_size_prompts)
@@ -430,7 +430,7 @@ def get_sparsity_and_variance_metrics(
     batch_iter = range(n_batches)
     if verbose:
-        batch_iter = tqdm(batch_iter, desc="Sparsity and Variance Batches")
+        batch_iter = tqdm(batch_iter, desc="Sparsity and Variance Batches", leave=False)
     for _ in batch_iter:
         batch_tokens = activation_store.get_batch_tokens(eval_batch_size_prompts)

{sae_lens-6.30.1 → sae_lens-6.31.0}/sae_lens/saes/temporal_sae.py RENAMED Viewed

@@ -4,7 +4,7 @@ TemporalSAE decomposes activations into:
 1. Predicted codes (from attention over context)
 2. Novel codes (sparse features of the residual)
-See: https://arxiv.org/abs/2410.04185
+See: https://arxiv.org/pdf/2511.01836
 """
 import math

{sae_lens-6.30.1 → sae_lens-6.31.0}/sae_lens/training/activation_scaler.py RENAMED Viewed

@@ -28,7 +28,9 @@ class ActivationScaler:
     ) -> float:
         norms_per_batch: list[float] = []
         for _ in tqdm(
-            range(n_batches_for_norm_estimate), desc="Estimating norm scaling factor"
+            range(n_batches_for_norm_estimate),
+            desc="Estimating norm scaling factor",
+            leave=False,
         ):
             acts = next(data_provider)
             norms_per_batch.append(acts.norm(dim=-1).mean().item())

{sae_lens-6.30.1 → sae_lens-6.31.0}/LICENSE RENAMED Viewed

File without changes

{sae_lens-6.30.1 → sae_lens-6.31.0}/README.md RENAMED Viewed

File without changes

{sae_lens-6.30.1 → sae_lens-6.31.0}/sae_lens/analysis/__init__.py RENAMED Viewed

File without changes

{sae_lens-6.30.1 → sae_lens-6.31.0}/sae_lens/analysis/hooked_sae_transformer.py RENAMED Viewed

File without changes

{sae_lens-6.30.1 → sae_lens-6.31.0}/sae_lens/analysis/neuronpedia_integration.py RENAMED Viewed

File without changes

{sae_lens-6.30.1 → sae_lens-6.31.0}/sae_lens/cache_activations_runner.py RENAMED Viewed

File without changes

{sae_lens-6.30.1 → sae_lens-6.31.0}/sae_lens/constants.py RENAMED Viewed

File without changes

{sae_lens-6.30.1 → sae_lens-6.31.0}/sae_lens/llm_sae_training_runner.py RENAMED Viewed

File without changes

{sae_lens-6.30.1 → sae_lens-6.31.0}/sae_lens/load_model.py RENAMED Viewed

File without changes

{sae_lens-6.30.1 → sae_lens-6.31.0}/sae_lens/loading/__init__.py RENAMED Viewed

File without changes

{sae_lens-6.30.1 → sae_lens-6.31.0}/sae_lens/loading/pretrained_sae_loaders.py RENAMED Viewed

File without changes

{sae_lens-6.30.1 → sae_lens-6.31.0}/sae_lens/loading/pretrained_saes_directory.py RENAMED Viewed

File without changes

{sae_lens-6.30.1 → sae_lens-6.31.0}/sae_lens/pretokenize_runner.py RENAMED Viewed

File without changes

{sae_lens-6.30.1 → sae_lens-6.31.0}/sae_lens/pretrained_saes.yaml RENAMED Viewed

File without changes

{sae_lens-6.30.1 → sae_lens-6.31.0}/sae_lens/registry.py RENAMED Viewed

File without changes

{sae_lens-6.30.1 → sae_lens-6.31.0}/sae_lens/saes/__init__.py RENAMED Viewed

File without changes

{sae_lens-6.30.1 → sae_lens-6.31.0}/sae_lens/saes/batchtopk_sae.py RENAMED Viewed

File without changes

{sae_lens-6.30.1 → sae_lens-6.31.0}/sae_lens/saes/gated_sae.py RENAMED Viewed

File without changes

{sae_lens-6.30.1 → sae_lens-6.31.0}/sae_lens/saes/jumprelu_sae.py RENAMED Viewed

File without changes

{sae_lens-6.30.1 → sae_lens-6.31.0}/sae_lens/saes/matching_pursuit_sae.py RENAMED Viewed

File without changes

{sae_lens-6.30.1 → sae_lens-6.31.0}/sae_lens/saes/matryoshka_batchtopk_sae.py RENAMED Viewed

File without changes

{sae_lens-6.30.1 → sae_lens-6.31.0}/sae_lens/saes/sae.py RENAMED Viewed

File without changes

{sae_lens-6.30.1 → sae_lens-6.31.0}/sae_lens/saes/standard_sae.py RENAMED Viewed

File without changes

{sae_lens-6.30.1 → sae_lens-6.31.0}/sae_lens/saes/topk_sae.py RENAMED Viewed

File without changes

{sae_lens-6.30.1 → sae_lens-6.31.0}/sae_lens/saes/transcoder.py RENAMED Viewed

File without changes

{sae_lens-6.30.1 → sae_lens-6.31.0}/sae_lens/synthetic/__init__.py RENAMED Viewed

File without changes

{sae_lens-6.30.1 → sae_lens-6.31.0}/sae_lens/synthetic/activation_generator.py RENAMED Viewed

File without changes

{sae_lens-6.30.1 → sae_lens-6.31.0}/sae_lens/synthetic/correlation.py RENAMED Viewed

File without changes

{sae_lens-6.30.1 → sae_lens-6.31.0}/sae_lens/synthetic/evals.py RENAMED Viewed

File without changes

{sae_lens-6.30.1 → sae_lens-6.31.0}/sae_lens/synthetic/feature_dictionary.py RENAMED Viewed

File without changes

{sae_lens-6.30.1 → sae_lens-6.31.0}/sae_lens/synthetic/firing_probabilities.py RENAMED Viewed

File without changes

{sae_lens-6.30.1 → sae_lens-6.31.0}/sae_lens/synthetic/hierarchy.py RENAMED Viewed

File without changes

{sae_lens-6.30.1 → sae_lens-6.31.0}/sae_lens/synthetic/initialization.py RENAMED Viewed

File without changes

{sae_lens-6.30.1 → sae_lens-6.31.0}/sae_lens/synthetic/plotting.py RENAMED Viewed

File without changes

{sae_lens-6.30.1 → sae_lens-6.31.0}/sae_lens/synthetic/training.py RENAMED Viewed

File without changes

{sae_lens-6.30.1 → sae_lens-6.31.0}/sae_lens/tokenization_and_batching.py RENAMED Viewed

File without changes

{sae_lens-6.30.1 → sae_lens-6.31.0}/sae_lens/training/__init__.py RENAMED Viewed

File without changes

{sae_lens-6.30.1 → sae_lens-6.31.0}/sae_lens/training/activations_store.py RENAMED Viewed

File without changes

{sae_lens-6.30.1 → sae_lens-6.31.0}/sae_lens/training/mixing_buffer.py RENAMED Viewed

File without changes

{sae_lens-6.30.1 → sae_lens-6.31.0}/sae_lens/training/optim.py RENAMED Viewed

File without changes

{sae_lens-6.30.1 → sae_lens-6.31.0}/sae_lens/training/sae_trainer.py RENAMED Viewed

File without changes

{sae_lens-6.30.1 → sae_lens-6.31.0}/sae_lens/training/types.py RENAMED Viewed

File without changes

{sae_lens-6.30.1 → sae_lens-6.31.0}/sae_lens/training/upload_saes_to_huggingface.py RENAMED Viewed

File without changes

{sae_lens-6.30.1 → sae_lens-6.31.0}/sae_lens/tutorial/tsea.py RENAMED Viewed

File without changes

{sae_lens-6.30.1 → sae_lens-6.31.0}/sae_lens/util.py RENAMED Viewed

File without changes

sae-lens 6.30.1__tar.gz → 6.31.0__tar.gz

sae-lens 6.30.1__tar.gz → 6.31.0__tar.gz