sae-lens 6.26.0__tar.gz → 6.26.1__tar.gz
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- {sae_lens-6.26.0 → sae_lens-6.26.1}/PKG-INFO +1 -1
- {sae_lens-6.26.0 → sae_lens-6.26.1}/pyproject.toml +2 -1
- {sae_lens-6.26.0 → sae_lens-6.26.1}/sae_lens/__init__.py +1 -1
- {sae_lens-6.26.0 → sae_lens-6.26.1}/sae_lens/pretrained_saes.yaml +144 -144
- {sae_lens-6.26.0 → sae_lens-6.26.1}/LICENSE +0 -0
- {sae_lens-6.26.0 → sae_lens-6.26.1}/README.md +0 -0
- {sae_lens-6.26.0 → sae_lens-6.26.1}/sae_lens/analysis/__init__.py +0 -0
- {sae_lens-6.26.0 → sae_lens-6.26.1}/sae_lens/analysis/hooked_sae_transformer.py +0 -0
- {sae_lens-6.26.0 → sae_lens-6.26.1}/sae_lens/analysis/neuronpedia_integration.py +0 -0
- {sae_lens-6.26.0 → sae_lens-6.26.1}/sae_lens/cache_activations_runner.py +0 -0
- {sae_lens-6.26.0 → sae_lens-6.26.1}/sae_lens/config.py +0 -0
- {sae_lens-6.26.0 → sae_lens-6.26.1}/sae_lens/constants.py +0 -0
- {sae_lens-6.26.0 → sae_lens-6.26.1}/sae_lens/evals.py +0 -0
- {sae_lens-6.26.0 → sae_lens-6.26.1}/sae_lens/llm_sae_training_runner.py +0 -0
- {sae_lens-6.26.0 → sae_lens-6.26.1}/sae_lens/load_model.py +0 -0
- {sae_lens-6.26.0 → sae_lens-6.26.1}/sae_lens/loading/__init__.py +0 -0
- {sae_lens-6.26.0 → sae_lens-6.26.1}/sae_lens/loading/pretrained_sae_loaders.py +0 -0
- {sae_lens-6.26.0 → sae_lens-6.26.1}/sae_lens/loading/pretrained_saes_directory.py +0 -0
- {sae_lens-6.26.0 → sae_lens-6.26.1}/sae_lens/pretokenize_runner.py +0 -0
- {sae_lens-6.26.0 → sae_lens-6.26.1}/sae_lens/registry.py +0 -0
- {sae_lens-6.26.0 → sae_lens-6.26.1}/sae_lens/saes/__init__.py +0 -0
- {sae_lens-6.26.0 → sae_lens-6.26.1}/sae_lens/saes/batchtopk_sae.py +0 -0
- {sae_lens-6.26.0 → sae_lens-6.26.1}/sae_lens/saes/gated_sae.py +0 -0
- {sae_lens-6.26.0 → sae_lens-6.26.1}/sae_lens/saes/jumprelu_sae.py +0 -0
- {sae_lens-6.26.0 → sae_lens-6.26.1}/sae_lens/saes/matching_pursuit_sae.py +0 -0
- {sae_lens-6.26.0 → sae_lens-6.26.1}/sae_lens/saes/matryoshka_batchtopk_sae.py +0 -0
- {sae_lens-6.26.0 → sae_lens-6.26.1}/sae_lens/saes/sae.py +0 -0
- {sae_lens-6.26.0 → sae_lens-6.26.1}/sae_lens/saes/standard_sae.py +0 -0
- {sae_lens-6.26.0 → sae_lens-6.26.1}/sae_lens/saes/temporal_sae.py +0 -0
- {sae_lens-6.26.0 → sae_lens-6.26.1}/sae_lens/saes/topk_sae.py +0 -0
- {sae_lens-6.26.0 → sae_lens-6.26.1}/sae_lens/saes/transcoder.py +0 -0
- {sae_lens-6.26.0 → sae_lens-6.26.1}/sae_lens/tokenization_and_batching.py +0 -0
- {sae_lens-6.26.0 → sae_lens-6.26.1}/sae_lens/training/__init__.py +0 -0
- {sae_lens-6.26.0 → sae_lens-6.26.1}/sae_lens/training/activation_scaler.py +0 -0
- {sae_lens-6.26.0 → sae_lens-6.26.1}/sae_lens/training/activations_store.py +0 -0
- {sae_lens-6.26.0 → sae_lens-6.26.1}/sae_lens/training/mixing_buffer.py +0 -0
- {sae_lens-6.26.0 → sae_lens-6.26.1}/sae_lens/training/optim.py +0 -0
- {sae_lens-6.26.0 → sae_lens-6.26.1}/sae_lens/training/sae_trainer.py +0 -0
- {sae_lens-6.26.0 → sae_lens-6.26.1}/sae_lens/training/types.py +0 -0
- {sae_lens-6.26.0 → sae_lens-6.26.1}/sae_lens/training/upload_saes_to_huggingface.py +0 -0
- {sae_lens-6.26.0 → sae_lens-6.26.1}/sae_lens/tutorial/tsea.py +0 -0
- {sae_lens-6.26.0 → sae_lens-6.26.1}/sae_lens/util.py +0 -0
|
@@ -1,6 +1,6 @@
|
|
|
1
1
|
[tool.poetry]
|
|
2
2
|
name = "sae-lens"
|
|
3
|
-
version = "6.26.0"
|
|
3
|
+
version = "6.26.1"
|
|
4
4
|
description = "Training and Analyzing Sparse Autoencoders (SAEs)"
|
|
5
5
|
authors = ["Joseph Bloom"]
|
|
6
6
|
readme = "README.md"
|
|
@@ -51,6 +51,7 @@ mkdocs-redirects = "^1.2.1"
|
|
|
51
51
|
mkdocs-section-index = "^0.3.9"
|
|
52
52
|
mkdocstrings = "^0.25.2"
|
|
53
53
|
mkdocstrings-python = "^1.10.9"
|
|
54
|
+
beautifulsoup4 = "^4.12.0"
|
|
54
55
|
tabulate = "^0.9.0"
|
|
55
56
|
ruff = "^0.7.4"
|
|
56
57
|
eai-sparsify = "^1.1.1"
|
|
@@ -9072,150 +9072,150 @@ gemma-scope-2-27b-it-transcoders-all:
|
|
|
9072
9072
|
- id: layer_5_width_262k_l0_small_affine
|
|
9073
9073
|
path: transcoder_all/layer_5_width_262k_l0_small_affine
|
|
9074
9074
|
l0: 12
|
|
9075
|
-
|
|
9076
|
-
|
|
9077
|
-
|
|
9078
|
-
|
|
9079
|
-
|
|
9080
|
-
|
|
9081
|
-
|
|
9082
|
-
|
|
9083
|
-
|
|
9084
|
-
|
|
9085
|
-
|
|
9086
|
-
|
|
9087
|
-
|
|
9088
|
-
|
|
9089
|
-
|
|
9090
|
-
|
|
9091
|
-
|
|
9092
|
-
|
|
9093
|
-
|
|
9094
|
-
|
|
9095
|
-
|
|
9096
|
-
|
|
9097
|
-
|
|
9098
|
-
|
|
9099
|
-
|
|
9100
|
-
|
|
9101
|
-
|
|
9102
|
-
|
|
9103
|
-
|
|
9104
|
-
|
|
9105
|
-
|
|
9106
|
-
|
|
9107
|
-
|
|
9108
|
-
|
|
9109
|
-
|
|
9110
|
-
|
|
9111
|
-
|
|
9112
|
-
|
|
9113
|
-
|
|
9114
|
-
|
|
9115
|
-
|
|
9116
|
-
|
|
9117
|
-
|
|
9118
|
-
|
|
9119
|
-
|
|
9120
|
-
|
|
9121
|
-
|
|
9122
|
-
|
|
9123
|
-
|
|
9124
|
-
|
|
9125
|
-
|
|
9126
|
-
|
|
9127
|
-
|
|
9128
|
-
|
|
9129
|
-
|
|
9130
|
-
|
|
9131
|
-
|
|
9132
|
-
|
|
9133
|
-
|
|
9134
|
-
|
|
9135
|
-
|
|
9136
|
-
|
|
9137
|
-
|
|
9138
|
-
|
|
9139
|
-
|
|
9140
|
-
|
|
9141
|
-
|
|
9142
|
-
|
|
9143
|
-
|
|
9144
|
-
|
|
9145
|
-
|
|
9146
|
-
|
|
9147
|
-
|
|
9148
|
-
|
|
9149
|
-
|
|
9150
|
-
|
|
9151
|
-
|
|
9152
|
-
|
|
9153
|
-
|
|
9154
|
-
|
|
9155
|
-
|
|
9156
|
-
|
|
9157
|
-
|
|
9158
|
-
|
|
9159
|
-
|
|
9160
|
-
|
|
9161
|
-
|
|
9162
|
-
|
|
9163
|
-
|
|
9164
|
-
|
|
9165
|
-
|
|
9166
|
-
|
|
9167
|
-
|
|
9168
|
-
|
|
9169
|
-
|
|
9170
|
-
|
|
9171
|
-
|
|
9172
|
-
|
|
9173
|
-
|
|
9174
|
-
|
|
9175
|
-
|
|
9176
|
-
|
|
9177
|
-
|
|
9178
|
-
|
|
9179
|
-
|
|
9180
|
-
|
|
9181
|
-
|
|
9182
|
-
|
|
9183
|
-
|
|
9184
|
-
|
|
9185
|
-
|
|
9186
|
-
|
|
9187
|
-
|
|
9188
|
-
|
|
9189
|
-
|
|
9190
|
-
|
|
9191
|
-
|
|
9192
|
-
|
|
9193
|
-
|
|
9194
|
-
|
|
9195
|
-
|
|
9196
|
-
|
|
9197
|
-
|
|
9198
|
-
|
|
9199
|
-
|
|
9200
|
-
|
|
9201
|
-
|
|
9202
|
-
|
|
9203
|
-
|
|
9204
|
-
|
|
9205
|
-
|
|
9206
|
-
|
|
9207
|
-
|
|
9208
|
-
|
|
9209
|
-
|
|
9210
|
-
|
|
9211
|
-
|
|
9212
|
-
|
|
9213
|
-
|
|
9214
|
-
|
|
9215
|
-
|
|
9216
|
-
|
|
9217
|
-
|
|
9218
|
-
|
|
9075
|
+
- id: layer_60_width_16k_l0_big
|
|
9076
|
+
path: transcoder_all/layer_60_width_16k_l0_big
|
|
9077
|
+
l0: 120
|
|
9078
|
+
- id: layer_60_width_16k_l0_big_affine
|
|
9079
|
+
path: transcoder_all/layer_60_width_16k_l0_big_affine
|
|
9080
|
+
l0: 120
|
|
9081
|
+
- id: layer_60_width_16k_l0_small
|
|
9082
|
+
path: transcoder_all/layer_60_width_16k_l0_small
|
|
9083
|
+
l0: 20
|
|
9084
|
+
- id: layer_60_width_16k_l0_small_affine
|
|
9085
|
+
path: transcoder_all/layer_60_width_16k_l0_small_affine
|
|
9086
|
+
l0: 20
|
|
9087
|
+
- id: layer_60_width_262k_l0_big
|
|
9088
|
+
path: transcoder_all/layer_60_width_262k_l0_big
|
|
9089
|
+
l0: 120
|
|
9090
|
+
- id: layer_60_width_262k_l0_big_affine
|
|
9091
|
+
path: transcoder_all/layer_60_width_262k_l0_big_affine
|
|
9092
|
+
l0: 120
|
|
9093
|
+
- id: layer_60_width_262k_l0_small
|
|
9094
|
+
path: transcoder_all/layer_60_width_262k_l0_small
|
|
9095
|
+
l0: 20
|
|
9096
|
+
- id: layer_60_width_262k_l0_small_affine
|
|
9097
|
+
path: transcoder_all/layer_60_width_262k_l0_small_affine
|
|
9098
|
+
l0: 20
|
|
9099
|
+
- id: layer_61_width_16k_l0_big
|
|
9100
|
+
path: transcoder_all/layer_61_width_16k_l0_big
|
|
9101
|
+
l0: 120
|
|
9102
|
+
- id: layer_61_width_16k_l0_big_affine
|
|
9103
|
+
path: transcoder_all/layer_61_width_16k_l0_big_affine
|
|
9104
|
+
l0: 120
|
|
9105
|
+
- id: layer_61_width_16k_l0_small
|
|
9106
|
+
path: transcoder_all/layer_61_width_16k_l0_small
|
|
9107
|
+
l0: 20
|
|
9108
|
+
- id: layer_61_width_16k_l0_small_affine
|
|
9109
|
+
path: transcoder_all/layer_61_width_16k_l0_small_affine
|
|
9110
|
+
l0: 20
|
|
9111
|
+
- id: layer_61_width_262k_l0_big
|
|
9112
|
+
path: transcoder_all/layer_61_width_262k_l0_big
|
|
9113
|
+
l0: 120
|
|
9114
|
+
- id: layer_61_width_262k_l0_big_affine
|
|
9115
|
+
path: transcoder_all/layer_61_width_262k_l0_big_affine
|
|
9116
|
+
l0: 120
|
|
9117
|
+
- id: layer_61_width_262k_l0_small
|
|
9118
|
+
path: transcoder_all/layer_61_width_262k_l0_small
|
|
9119
|
+
l0: 20
|
|
9120
|
+
- id: layer_61_width_262k_l0_small_affine
|
|
9121
|
+
path: transcoder_all/layer_61_width_262k_l0_small_affine
|
|
9122
|
+
l0: 20
|
|
9123
|
+
- id: layer_6_width_16k_l0_big
|
|
9124
|
+
path: transcoder_all/layer_6_width_16k_l0_big
|
|
9125
|
+
l0: 77
|
|
9126
|
+
- id: layer_6_width_16k_l0_big_affine
|
|
9127
|
+
path: transcoder_all/layer_6_width_16k_l0_big_affine
|
|
9128
|
+
l0: 77
|
|
9129
|
+
- id: layer_6_width_16k_l0_small
|
|
9130
|
+
path: transcoder_all/layer_6_width_16k_l0_small
|
|
9131
|
+
l0: 12
|
|
9132
|
+
- id: layer_6_width_16k_l0_small_affine
|
|
9133
|
+
path: transcoder_all/layer_6_width_16k_l0_small_affine
|
|
9134
|
+
l0: 12
|
|
9135
|
+
- id: layer_6_width_262k_l0_big
|
|
9136
|
+
path: transcoder_all/layer_6_width_262k_l0_big
|
|
9137
|
+
l0: 77
|
|
9138
|
+
- id: layer_6_width_262k_l0_big_affine
|
|
9139
|
+
path: transcoder_all/layer_6_width_262k_l0_big_affine
|
|
9140
|
+
l0: 77
|
|
9141
|
+
- id: layer_6_width_262k_l0_small
|
|
9142
|
+
path: transcoder_all/layer_6_width_262k_l0_small
|
|
9143
|
+
l0: 12
|
|
9144
|
+
- id: layer_6_width_262k_l0_small_affine
|
|
9145
|
+
path: transcoder_all/layer_6_width_262k_l0_small_affine
|
|
9146
|
+
l0: 12
|
|
9147
|
+
- id: layer_7_width_16k_l0_big
|
|
9148
|
+
path: transcoder_all/layer_7_width_16k_l0_big
|
|
9149
|
+
l0: 80
|
|
9150
|
+
- id: layer_7_width_16k_l0_big_affine
|
|
9151
|
+
path: transcoder_all/layer_7_width_16k_l0_big_affine
|
|
9152
|
+
l0: 80
|
|
9153
|
+
- id: layer_7_width_16k_l0_small
|
|
9154
|
+
path: transcoder_all/layer_7_width_16k_l0_small
|
|
9155
|
+
l0: 13
|
|
9156
|
+
- id: layer_7_width_16k_l0_small_affine
|
|
9157
|
+
path: transcoder_all/layer_7_width_16k_l0_small_affine
|
|
9158
|
+
l0: 13
|
|
9159
|
+
- id: layer_7_width_262k_l0_big
|
|
9160
|
+
path: transcoder_all/layer_7_width_262k_l0_big
|
|
9161
|
+
l0: 80
|
|
9162
|
+
- id: layer_7_width_262k_l0_big_affine
|
|
9163
|
+
path: transcoder_all/layer_7_width_262k_l0_big_affine
|
|
9164
|
+
l0: 80
|
|
9165
|
+
- id: layer_7_width_262k_l0_small
|
|
9166
|
+
path: transcoder_all/layer_7_width_262k_l0_small
|
|
9167
|
+
l0: 13
|
|
9168
|
+
- id: layer_7_width_262k_l0_small_affine
|
|
9169
|
+
path: transcoder_all/layer_7_width_262k_l0_small_affine
|
|
9170
|
+
l0: 13
|
|
9171
|
+
- id: layer_8_width_16k_l0_big
|
|
9172
|
+
path: transcoder_all/layer_8_width_16k_l0_big
|
|
9173
|
+
l0: 83
|
|
9174
|
+
- id: layer_8_width_16k_l0_big_affine
|
|
9175
|
+
path: transcoder_all/layer_8_width_16k_l0_big_affine
|
|
9176
|
+
l0: 83
|
|
9177
|
+
- id: layer_8_width_16k_l0_small
|
|
9178
|
+
path: transcoder_all/layer_8_width_16k_l0_small
|
|
9179
|
+
l0: 13
|
|
9180
|
+
- id: layer_8_width_16k_l0_small_affine
|
|
9181
|
+
path: transcoder_all/layer_8_width_16k_l0_small_affine
|
|
9182
|
+
l0: 13
|
|
9183
|
+
- id: layer_8_width_262k_l0_big
|
|
9184
|
+
path: transcoder_all/layer_8_width_262k_l0_big
|
|
9185
|
+
l0: 83
|
|
9186
|
+
- id: layer_8_width_262k_l0_big_affine
|
|
9187
|
+
path: transcoder_all/layer_8_width_262k_l0_big_affine
|
|
9188
|
+
l0: 83
|
|
9189
|
+
- id: layer_8_width_262k_l0_small
|
|
9190
|
+
path: transcoder_all/layer_8_width_262k_l0_small
|
|
9191
|
+
l0: 13
|
|
9192
|
+
- id: layer_8_width_262k_l0_small_affine
|
|
9193
|
+
path: transcoder_all/layer_8_width_262k_l0_small_affine
|
|
9194
|
+
l0: 13
|
|
9195
|
+
- id: layer_9_width_16k_l0_big
|
|
9196
|
+
path: transcoder_all/layer_9_width_16k_l0_big
|
|
9197
|
+
l0: 86
|
|
9198
|
+
- id: layer_9_width_16k_l0_big_affine
|
|
9199
|
+
path: transcoder_all/layer_9_width_16k_l0_big_affine
|
|
9200
|
+
l0: 86
|
|
9201
|
+
- id: layer_9_width_16k_l0_small
|
|
9202
|
+
path: transcoder_all/layer_9_width_16k_l0_small
|
|
9203
|
+
l0: 14
|
|
9204
|
+
- id: layer_9_width_16k_l0_small_affine
|
|
9205
|
+
path: transcoder_all/layer_9_width_16k_l0_small_affine
|
|
9206
|
+
l0: 14
|
|
9207
|
+
- id: layer_9_width_262k_l0_big
|
|
9208
|
+
path: transcoder_all/layer_9_width_262k_l0_big
|
|
9209
|
+
l0: 86
|
|
9210
|
+
- id: layer_9_width_262k_l0_big_affine
|
|
9211
|
+
path: transcoder_all/layer_9_width_262k_l0_big_affine
|
|
9212
|
+
l0: 86
|
|
9213
|
+
- id: layer_9_width_262k_l0_small
|
|
9214
|
+
path: transcoder_all/layer_9_width_262k_l0_small
|
|
9215
|
+
l0: 14
|
|
9216
|
+
- id: layer_9_width_262k_l0_small_affine
|
|
9217
|
+
path: transcoder_all/layer_9_width_262k_l0_small_affine
|
|
9218
|
+
l0: 14
|
|
9219
9219
|
gemma-scope-2-27b-it-transcoders:
|
|
9220
9220
|
conversion_func: gemma_3
|
|
9221
9221
|
model: google/gemma-3-27b-it
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|