sae-lens 6.12.1__py3-none-any.whl → 6.12.3__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- sae_lens/__init__.py +1 -1
- sae_lens/loading/pretrained_sae_loaders.py +6 -0
- sae_lens/saes/sae.py +1 -1
- {sae_lens-6.12.1.dist-info → sae_lens-6.12.3.dist-info}/METADATA +4 -2
- {sae_lens-6.12.1.dist-info → sae_lens-6.12.3.dist-info}/RECORD +7 -7
- {sae_lens-6.12.1.dist-info → sae_lens-6.12.3.dist-info}/WHEEL +1 -1
- {sae_lens-6.12.1.dist-info → sae_lens-6.12.3.dist-info/licenses}/LICENSE +0 -0
sae_lens/__init__.py
CHANGED
(+1 -1; hunk not shown in this extract)
sae_lens/loading/pretrained_sae_loaders.py
CHANGED
|
@@ -233,6 +233,12 @@ def handle_pre_6_0_config(cfg_dict: dict[str, Any]) -> dict[str, Any]:
|
|
|
233
233
|
"reshape_activations",
|
|
234
234
|
"hook_z" if "hook_z" in new_cfg.get("hook_name", "") else "none",
|
|
235
235
|
)
|
|
236
|
+
if (
|
|
237
|
+
new_cfg.get("activation_fn") == "topk"
|
|
238
|
+
and new_cfg.get("activation_fn_kwargs", {}).get("k") is not None
|
|
239
|
+
):
|
|
240
|
+
new_cfg["architecture"] = "topk"
|
|
241
|
+
new_cfg["k"] = new_cfg["activation_fn_kwargs"]["k"]
|
|
236
242
|
|
|
237
243
|
if "normalize_activations" in new_cfg and isinstance(
|
|
238
244
|
new_cfg["normalize_activations"], bool
|
sae_lens/saes/sae.py
CHANGED
|
@@ -245,7 +245,7 @@ class SAE(HookedRootModule, Generic[T_SAE_CONFIG], ABC):
|
|
|
245
245
|
|
|
246
246
|
self.cfg = cfg
|
|
247
247
|
|
|
248
|
-
if cfg.metadata and cfg.metadata:
|
|
248
|
+
if cfg.metadata and cfg.metadata.model_from_pretrained_kwargs:
|
|
249
249
|
warnings.warn(
|
|
250
250
|
"\nThis SAE has non-empty model_from_pretrained_kwargs. "
|
|
251
251
|
"\nFor optimal performance, load the model like so:\n"
|
|
{sae_lens-6.12.1.dist-info → sae_lens-6.12.3.dist-info}/METADATA
CHANGED
|
@@ -1,8 +1,9 @@
|
|
|
1
|
-
Metadata-Version: 2.
|
|
1
|
+
Metadata-Version: 2.4
|
|
2
2
|
Name: sae-lens
|
|
3
|
-
Version: 6.12.1
|
|
3
|
+
Version: 6.12.3
|
|
4
4
|
Summary: Training and Analyzing Sparse Autoencoders (SAEs)
|
|
5
5
|
License: MIT
|
|
6
|
+
License-File: LICENSE
|
|
6
7
|
Keywords: deep-learning,sparse-autoencoders,mechanistic-interpretability,PyTorch
|
|
7
8
|
Author: Joseph Bloom
|
|
8
9
|
Requires-Python: >=3.10,<4.0
|
|
@@ -12,6 +13,7 @@ Classifier: Programming Language :: Python :: 3.10
|
|
|
12
13
|
Classifier: Programming Language :: Python :: 3.11
|
|
13
14
|
Classifier: Programming Language :: Python :: 3.12
|
|
14
15
|
Classifier: Programming Language :: Python :: 3.13
|
|
16
|
+
Classifier: Programming Language :: Python :: 3.14
|
|
15
17
|
Classifier: Topic :: Scientific/Engineering :: Artificial Intelligence
|
|
16
18
|
Provides-Extra: mamba
|
|
17
19
|
Requires-Dist: babe (>=0.0.7,<0.0.8)
|
|
{sae_lens-6.12.1.dist-info → sae_lens-6.12.3.dist-info}/RECORD
CHANGED
|
@@ -1,4 +1,4 @@
|
|
|
1
|
-
sae_lens/__init__.py,sha256=
|
|
1
|
+
sae_lens/__init__.py,sha256=Y0IpvmIXo54khj-mXZsnluiwxvfrtxJFdxgwHuAmlAg,3589
|
|
2
2
|
sae_lens/analysis/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
|
3
3
|
sae_lens/analysis/hooked_sae_transformer.py,sha256=vRu6JseH1lZaEeILD5bEkQEQ1wYHHDcxD-f2olKmE9Y,14275
|
|
4
4
|
sae_lens/analysis/neuronpedia_integration.py,sha256=Gx1W7hUBEuMoasNcnOnZ1wmqbXDd1pSZ1nqKEya1HQc,4962
|
|
@@ -9,7 +9,7 @@ sae_lens/evals.py,sha256=4hanbyG8qZLItWqft94F4ZjUoytPVB7fw5s0P4Oi0VE,39504
|
|
|
9
9
|
sae_lens/llm_sae_training_runner.py,sha256=sJTcDX1bUJJ_jZLUT88-8KUYIAPeUGoXktX68PsBqw0,15137
|
|
10
10
|
sae_lens/load_model.py,sha256=C8AMykctj6H7tz_xRwB06-EXj6TfW64PtSJZR5Jxn1Y,8649
|
|
11
11
|
sae_lens/loading/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
|
12
|
-
sae_lens/loading/pretrained_sae_loaders.py,sha256=
|
|
12
|
+
sae_lens/loading/pretrained_sae_loaders.py,sha256=SM4aT8NM6ezYix5c2u7p72Fz2RfvTtf7gw5RdOSKXhc,49846
|
|
13
13
|
sae_lens/loading/pretrained_saes_directory.py,sha256=4Vn-Jex6SveD7EbxcSOBv8cx1gkPfUMLU1QOP-ww1ZE,3752
|
|
14
14
|
sae_lens/pretokenize_runner.py,sha256=w0f6SfZLAxbp5eAAKnet8RqUB_DKofZ9RGsoJwFnYbA,7058
|
|
15
15
|
sae_lens/pretrained_saes.yaml,sha256=6ca3geEB6NyhULUrmdtPDK8ea0YdpLp8_au78vIFC5w,602553
|
|
@@ -18,7 +18,7 @@ sae_lens/saes/__init__.py,sha256=jVwazK8Q6dW5J6_zFXPoNAuBvSxgziQ8eMOjGM3t-X8,147
|
|
|
18
18
|
sae_lens/saes/batchtopk_sae.py,sha256=GX_J0vH4vzeLqYxl0mkfsZQpFEoCEHMR4dIG8fz8N8w,3449
|
|
19
19
|
sae_lens/saes/gated_sae.py,sha256=qcmM9JwBA8aZR8z_IRHV1_gQX-q_63tKewWXRnhdXuo,8986
|
|
20
20
|
sae_lens/saes/jumprelu_sae.py,sha256=HHBF1sJ95lZvxwP5vwLSQFKdnJN2KKYK0WAEaLTrta0,13399
|
|
21
|
-
sae_lens/saes/sae.py,sha256=
|
|
21
|
+
sae_lens/saes/sae.py,sha256=McpF4pTh70r6SQUbHFm0YQ9X2c2qPULBUSd_YmnEk4Y,38284
|
|
22
22
|
sae_lens/saes/standard_sae.py,sha256=9UqYyYtQuThYxXKNaDjYcyowpOx2-7cShG-TeUP6JCQ,5940
|
|
23
23
|
sae_lens/saes/topk_sae.py,sha256=CXMBI6CFvI5829bOhoQ350VXR9d8uFHUDlULTIWHXoU,8686
|
|
24
24
|
sae_lens/saes/transcoder.py,sha256=BfLSbTYVNZh-ruGxseZiZJ_acEL6_7QyTdfqUr0lDOg,12156
|
|
@@ -33,7 +33,7 @@ sae_lens/training/types.py,sha256=qSjmGzXf3MLalygG0psnVjmhX_mpLmL47MQtZfe7qxg,81
|
|
|
33
33
|
sae_lens/training/upload_saes_to_huggingface.py,sha256=r_WzI1zLtGZ5TzAxuG3xa_8T09j3zXJrWd_vzPsPGkQ,4469
|
|
34
34
|
sae_lens/tutorial/tsea.py,sha256=fd1am_XXsf2KMbByDapJo-2qlxduKaa62Z2qcQZ3QKU,18145
|
|
35
35
|
sae_lens/util.py,sha256=lW7fBn_b8quvRYlen9PUmB7km60YhKyjmuelB1f6KzQ,2253
|
|
36
|
-
sae_lens-6.12.
|
|
37
|
-
sae_lens-6.12.
|
|
38
|
-
sae_lens-6.12.
|
|
39
|
-
sae_lens-6.12.
|
|
36
|
+
sae_lens-6.12.3.dist-info/METADATA,sha256=WIM_Eda9y85GQi6XlgW4R9grfqCdEdeEUfkCdymhC3E,5318
|
|
37
|
+
sae_lens-6.12.3.dist-info/WHEEL,sha256=zp0Cn7JsFoX2ATtOhtaFYIiE2rmFAD4OcMhtUki8W3U,88
|
|
38
|
+
sae_lens-6.12.3.dist-info/licenses/LICENSE,sha256=DW6e-hDosiu4CfW0-imI57sV1I5f9UEslpviNQcOAKs,1069
|
|
39
|
+
sae_lens-6.12.3.dist-info/RECORD,,
|
|
File without changes
|