sae-lens 6.29.1__tar.gz → 6.31.0__tar.gz
This diff compares the contents of two publicly available versions of a package, each of which has been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between those package versions as they appear in their respective public registries.
- {sae_lens-6.29.1 → sae_lens-6.31.0}/PKG-INFO +1 -1
- {sae_lens-6.29.1 → sae_lens-6.31.0}/pyproject.toml +1 -1
- {sae_lens-6.29.1 → sae_lens-6.31.0}/sae_lens/__init__.py +1 -1
- {sae_lens-6.29.1 → sae_lens-6.31.0}/sae_lens/config.py +9 -1
- {sae_lens-6.29.1 → sae_lens-6.31.0}/sae_lens/evals.py +2 -2
- {sae_lens-6.29.1 → sae_lens-6.31.0}/sae_lens/loading/pretrained_sae_loaders.py +9 -3
- {sae_lens-6.29.1 → sae_lens-6.31.0}/sae_lens/pretrained_saes.yaml +36 -0
- {sae_lens-6.29.1 → sae_lens-6.31.0}/sae_lens/saes/temporal_sae.py +1 -1
- {sae_lens-6.29.1 → sae_lens-6.31.0}/sae_lens/training/activation_scaler.py +3 -1
- {sae_lens-6.29.1 → sae_lens-6.31.0}/LICENSE +0 -0
- {sae_lens-6.29.1 → sae_lens-6.31.0}/README.md +0 -0
- {sae_lens-6.29.1 → sae_lens-6.31.0}/sae_lens/analysis/__init__.py +0 -0
- {sae_lens-6.29.1 → sae_lens-6.31.0}/sae_lens/analysis/hooked_sae_transformer.py +0 -0
- {sae_lens-6.29.1 → sae_lens-6.31.0}/sae_lens/analysis/neuronpedia_integration.py +0 -0
- {sae_lens-6.29.1 → sae_lens-6.31.0}/sae_lens/cache_activations_runner.py +0 -0
- {sae_lens-6.29.1 → sae_lens-6.31.0}/sae_lens/constants.py +0 -0
- {sae_lens-6.29.1 → sae_lens-6.31.0}/sae_lens/llm_sae_training_runner.py +0 -0
- {sae_lens-6.29.1 → sae_lens-6.31.0}/sae_lens/load_model.py +0 -0
- {sae_lens-6.29.1 → sae_lens-6.31.0}/sae_lens/loading/__init__.py +0 -0
- {sae_lens-6.29.1 → sae_lens-6.31.0}/sae_lens/loading/pretrained_saes_directory.py +0 -0
- {sae_lens-6.29.1 → sae_lens-6.31.0}/sae_lens/pretokenize_runner.py +0 -0
- {sae_lens-6.29.1 → sae_lens-6.31.0}/sae_lens/registry.py +0 -0
- {sae_lens-6.29.1 → sae_lens-6.31.0}/sae_lens/saes/__init__.py +0 -0
- {sae_lens-6.29.1 → sae_lens-6.31.0}/sae_lens/saes/batchtopk_sae.py +0 -0
- {sae_lens-6.29.1 → sae_lens-6.31.0}/sae_lens/saes/gated_sae.py +0 -0
- {sae_lens-6.29.1 → sae_lens-6.31.0}/sae_lens/saes/jumprelu_sae.py +0 -0
- {sae_lens-6.29.1 → sae_lens-6.31.0}/sae_lens/saes/matching_pursuit_sae.py +0 -0
- {sae_lens-6.29.1 → sae_lens-6.31.0}/sae_lens/saes/matryoshka_batchtopk_sae.py +0 -0
- {sae_lens-6.29.1 → sae_lens-6.31.0}/sae_lens/saes/sae.py +0 -0
- {sae_lens-6.29.1 → sae_lens-6.31.0}/sae_lens/saes/standard_sae.py +0 -0
- {sae_lens-6.29.1 → sae_lens-6.31.0}/sae_lens/saes/topk_sae.py +0 -0
- {sae_lens-6.29.1 → sae_lens-6.31.0}/sae_lens/saes/transcoder.py +0 -0
- {sae_lens-6.29.1 → sae_lens-6.31.0}/sae_lens/synthetic/__init__.py +0 -0
- {sae_lens-6.29.1 → sae_lens-6.31.0}/sae_lens/synthetic/activation_generator.py +0 -0
- {sae_lens-6.29.1 → sae_lens-6.31.0}/sae_lens/synthetic/correlation.py +0 -0
- {sae_lens-6.29.1 → sae_lens-6.31.0}/sae_lens/synthetic/evals.py +0 -0
- {sae_lens-6.29.1 → sae_lens-6.31.0}/sae_lens/synthetic/feature_dictionary.py +0 -0
- {sae_lens-6.29.1 → sae_lens-6.31.0}/sae_lens/synthetic/firing_probabilities.py +0 -0
- {sae_lens-6.29.1 → sae_lens-6.31.0}/sae_lens/synthetic/hierarchy.py +0 -0
- {sae_lens-6.29.1 → sae_lens-6.31.0}/sae_lens/synthetic/initialization.py +0 -0
- {sae_lens-6.29.1 → sae_lens-6.31.0}/sae_lens/synthetic/plotting.py +0 -0
- {sae_lens-6.29.1 → sae_lens-6.31.0}/sae_lens/synthetic/training.py +0 -0
- {sae_lens-6.29.1 → sae_lens-6.31.0}/sae_lens/tokenization_and_batching.py +0 -0
- {sae_lens-6.29.1 → sae_lens-6.31.0}/sae_lens/training/__init__.py +0 -0
- {sae_lens-6.29.1 → sae_lens-6.31.0}/sae_lens/training/activations_store.py +0 -0
- {sae_lens-6.29.1 → sae_lens-6.31.0}/sae_lens/training/mixing_buffer.py +0 -0
- {sae_lens-6.29.1 → sae_lens-6.31.0}/sae_lens/training/optim.py +0 -0
- {sae_lens-6.29.1 → sae_lens-6.31.0}/sae_lens/training/sae_trainer.py +0 -0
- {sae_lens-6.29.1 → sae_lens-6.31.0}/sae_lens/training/types.py +0 -0
- {sae_lens-6.29.1 → sae_lens-6.31.0}/sae_lens/training/upload_saes_to_huggingface.py +0 -0
- {sae_lens-6.29.1 → sae_lens-6.31.0}/sae_lens/tutorial/tsea.py +0 -0
- {sae_lens-6.29.1 → sae_lens-6.31.0}/sae_lens/util.py +0 -0
|
@@ -82,6 +82,7 @@ class LoggingConfig:
|
|
|
82
82
|
log_to_wandb: bool = True
|
|
83
83
|
log_activations_store_to_wandb: bool = False
|
|
84
84
|
log_optimizer_state_to_wandb: bool = False
|
|
85
|
+
log_weights_to_wandb: bool = True
|
|
85
86
|
wandb_project: str = "sae_lens_training"
|
|
86
87
|
wandb_id: str | None = None
|
|
87
88
|
run_name: str | None = None
|
|
@@ -107,7 +108,8 @@ class LoggingConfig:
|
|
|
107
108
|
type="model",
|
|
108
109
|
metadata=dict(trainer.cfg.__dict__),
|
|
109
110
|
)
|
|
110
|
-
|
|
111
|
+
if self.log_weights_to_wandb:
|
|
112
|
+
model_artifact.add_file(str(weights_path))
|
|
111
113
|
model_artifact.add_file(str(cfg_path))
|
|
112
114
|
wandb.log_artifact(model_artifact, aliases=wandb_aliases)
|
|
113
115
|
|
|
@@ -557,6 +559,12 @@ class CacheActivationsRunnerConfig:
|
|
|
557
559
|
context_size=self.context_size,
|
|
558
560
|
)
|
|
559
561
|
|
|
562
|
+
if self.context_size > self.training_tokens:
|
|
563
|
+
raise ValueError(
|
|
564
|
+
f"context_size ({self.context_size}) is greater than training_tokens "
|
|
565
|
+
f"({self.training_tokens}). Please reduce context_size or increase training_tokens."
|
|
566
|
+
)
|
|
567
|
+
|
|
560
568
|
if self.new_cached_activations_path is None:
|
|
561
569
|
self.new_cached_activations_path = _default_cached_activations_path( # type: ignore
|
|
562
570
|
self.dataset_path, self.model_name, self.hook_name, None
|
|
@@ -335,7 +335,7 @@ def get_downstream_reconstruction_metrics(
|
|
|
335
335
|
|
|
336
336
|
batch_iter = range(n_batches)
|
|
337
337
|
if verbose:
|
|
338
|
-
batch_iter = tqdm(batch_iter, desc="Reconstruction Batches")
|
|
338
|
+
batch_iter = tqdm(batch_iter, desc="Reconstruction Batches", leave=False)
|
|
339
339
|
|
|
340
340
|
for _ in batch_iter:
|
|
341
341
|
batch_tokens = activation_store.get_batch_tokens(eval_batch_size_prompts)
|
|
@@ -430,7 +430,7 @@ def get_sparsity_and_variance_metrics(
|
|
|
430
430
|
|
|
431
431
|
batch_iter = range(n_batches)
|
|
432
432
|
if verbose:
|
|
433
|
-
batch_iter = tqdm(batch_iter, desc="Sparsity and Variance Batches")
|
|
433
|
+
batch_iter = tqdm(batch_iter, desc="Sparsity and Variance Batches", leave=False)
|
|
434
434
|
|
|
435
435
|
for _ in batch_iter:
|
|
436
436
|
batch_tokens = activation_store.get_batch_tokens(eval_batch_size_prompts)
|
|
@@ -575,6 +575,8 @@ def _infer_gemma_3_raw_cfg_dict(repo_id: str, folder_name: str) -> dict[str, Any
|
|
|
575
575
|
"model_name": model_name,
|
|
576
576
|
"hf_hook_point_in": hf_hook_point_in,
|
|
577
577
|
}
|
|
578
|
+
if "transcoder" in folder_name or "clt" in folder_name:
|
|
579
|
+
cfg["affine_connection"] = "affine" in folder_name
|
|
578
580
|
if hf_hook_point_out is not None:
|
|
579
581
|
cfg["hf_hook_point_out"] = hf_hook_point_out
|
|
580
582
|
|
|
@@ -614,11 +616,11 @@ def get_gemma_3_config_from_hf(
|
|
|
614
616
|
if "resid_post" in folder_name:
|
|
615
617
|
hook_name = f"blocks.{layer}.hook_resid_post"
|
|
616
618
|
elif "attn_out" in folder_name:
|
|
617
|
-
hook_name = f"blocks.{layer}.
|
|
619
|
+
hook_name = f"blocks.{layer}.attn.hook_z"
|
|
618
620
|
elif "mlp_out" in folder_name:
|
|
619
621
|
hook_name = f"blocks.{layer}.hook_mlp_out"
|
|
620
622
|
elif "transcoder" in folder_name or "clt" in folder_name:
|
|
621
|
-
hook_name = f"blocks.{layer}.
|
|
623
|
+
hook_name = f"blocks.{layer}.hook_mlp_in"
|
|
622
624
|
hook_name_out = f"blocks.{layer}.hook_mlp_out"
|
|
623
625
|
else:
|
|
624
626
|
raise ValueError("Hook name not found in folder_name.")
|
|
@@ -643,7 +645,11 @@ def get_gemma_3_config_from_hf(
|
|
|
643
645
|
|
|
644
646
|
architecture = "jumprelu"
|
|
645
647
|
if "transcoder" in folder_name or "clt" in folder_name:
|
|
646
|
-
architecture =
|
|
648
|
+
architecture = (
|
|
649
|
+
"jumprelu_skip_transcoder"
|
|
650
|
+
if raw_cfg_dict.get("affine_connection", False)
|
|
651
|
+
else "jumprelu_transcoder"
|
|
652
|
+
)
|
|
647
653
|
d_out = shapes_dict["w_dec"][-1]
|
|
648
654
|
|
|
649
655
|
cfg = {
|
|
@@ -4148,6 +4148,7 @@ gemma-scope-2-4b-it-res:
|
|
|
4148
4148
|
- id: layer_17_width_16k_l0_medium
|
|
4149
4149
|
path: resid_post/layer_17_width_16k_l0_medium
|
|
4150
4150
|
l0: 60
|
|
4151
|
+
neuronpedia: gemma-3-4b-it/17-gemmascope-2-res-16k
|
|
4151
4152
|
- id: layer_17_width_16k_l0_small
|
|
4152
4153
|
path: resid_post/layer_17_width_16k_l0_small
|
|
4153
4154
|
l0: 20
|
|
@@ -4166,6 +4167,7 @@ gemma-scope-2-4b-it-res:
|
|
|
4166
4167
|
- id: layer_17_width_262k_l0_medium
|
|
4167
4168
|
path: resid_post/layer_17_width_262k_l0_medium
|
|
4168
4169
|
l0: 60
|
|
4170
|
+
neuronpedia: gemma-3-4b-it/17-gemmascope-2-res-262k
|
|
4169
4171
|
- id: layer_17_width_262k_l0_medium_seed_1
|
|
4170
4172
|
path: resid_post/layer_17_width_262k_l0_medium_seed_1
|
|
4171
4173
|
l0: 60
|
|
@@ -4178,6 +4180,7 @@ gemma-scope-2-4b-it-res:
|
|
|
4178
4180
|
- id: layer_17_width_65k_l0_medium
|
|
4179
4181
|
path: resid_post/layer_17_width_65k_l0_medium
|
|
4180
4182
|
l0: 60
|
|
4183
|
+
neuronpedia: gemma-3-4b-it/17-gemmascope-2-res-65k
|
|
4181
4184
|
- id: layer_17_width_65k_l0_small
|
|
4182
4185
|
path: resid_post/layer_17_width_65k_l0_small
|
|
4183
4186
|
l0: 20
|
|
@@ -4187,6 +4190,7 @@ gemma-scope-2-4b-it-res:
|
|
|
4187
4190
|
- id: layer_22_width_16k_l0_medium
|
|
4188
4191
|
path: resid_post/layer_22_width_16k_l0_medium
|
|
4189
4192
|
l0: 60
|
|
4193
|
+
neuronpedia: gemma-3-4b-it/22-gemmascope-2-res-16k
|
|
4190
4194
|
- id: layer_22_width_16k_l0_small
|
|
4191
4195
|
path: resid_post/layer_22_width_16k_l0_small
|
|
4192
4196
|
l0: 20
|
|
@@ -4205,6 +4209,7 @@ gemma-scope-2-4b-it-res:
|
|
|
4205
4209
|
- id: layer_22_width_262k_l0_medium
|
|
4206
4210
|
path: resid_post/layer_22_width_262k_l0_medium
|
|
4207
4211
|
l0: 60
|
|
4212
|
+
neuronpedia: gemma-3-4b-it/22-gemmascope-2-res-262k
|
|
4208
4213
|
- id: layer_22_width_262k_l0_medium_seed_1
|
|
4209
4214
|
path: resid_post/layer_22_width_262k_l0_medium_seed_1
|
|
4210
4215
|
l0: 60
|
|
@@ -4217,6 +4222,7 @@ gemma-scope-2-4b-it-res:
|
|
|
4217
4222
|
- id: layer_22_width_65k_l0_medium
|
|
4218
4223
|
path: resid_post/layer_22_width_65k_l0_medium
|
|
4219
4224
|
l0: 60
|
|
4225
|
+
neuronpedia: gemma-3-4b-it/22-gemmascope-2-res-65k
|
|
4220
4226
|
- id: layer_22_width_65k_l0_small
|
|
4221
4227
|
path: resid_post/layer_22_width_65k_l0_small
|
|
4222
4228
|
l0: 20
|
|
@@ -4226,6 +4232,7 @@ gemma-scope-2-4b-it-res:
|
|
|
4226
4232
|
- id: layer_29_width_16k_l0_medium
|
|
4227
4233
|
path: resid_post/layer_29_width_16k_l0_medium
|
|
4228
4234
|
l0: 60
|
|
4235
|
+
neuronpedia: gemma-3-4b-it/29-gemmascope-2-res-16k
|
|
4229
4236
|
- id: layer_29_width_16k_l0_small
|
|
4230
4237
|
path: resid_post/layer_29_width_16k_l0_small
|
|
4231
4238
|
l0: 20
|
|
@@ -4244,6 +4251,7 @@ gemma-scope-2-4b-it-res:
|
|
|
4244
4251
|
- id: layer_29_width_262k_l0_medium
|
|
4245
4252
|
path: resid_post/layer_29_width_262k_l0_medium
|
|
4246
4253
|
l0: 60
|
|
4254
|
+
neuronpedia: gemma-3-4b-it/29-gemmascope-2-res-262k
|
|
4247
4255
|
- id: layer_29_width_262k_l0_medium_seed_1
|
|
4248
4256
|
path: resid_post/layer_29_width_262k_l0_medium_seed_1
|
|
4249
4257
|
l0: 60
|
|
@@ -4256,6 +4264,7 @@ gemma-scope-2-4b-it-res:
|
|
|
4256
4264
|
- id: layer_29_width_65k_l0_medium
|
|
4257
4265
|
path: resid_post/layer_29_width_65k_l0_medium
|
|
4258
4266
|
l0: 60
|
|
4267
|
+
neuronpedia: gemma-3-4b-it/29-gemmascope-2-res-65k
|
|
4259
4268
|
- id: layer_29_width_65k_l0_small
|
|
4260
4269
|
path: resid_post/layer_29_width_65k_l0_small
|
|
4261
4270
|
l0: 20
|
|
@@ -4265,6 +4274,7 @@ gemma-scope-2-4b-it-res:
|
|
|
4265
4274
|
- id: layer_9_width_16k_l0_medium
|
|
4266
4275
|
path: resid_post/layer_9_width_16k_l0_medium
|
|
4267
4276
|
l0: 53
|
|
4277
|
+
neuronpedia: gemma-3-4b-it/9-gemmascope-2-res-16k
|
|
4268
4278
|
- id: layer_9_width_16k_l0_small
|
|
4269
4279
|
path: resid_post/layer_9_width_16k_l0_small
|
|
4270
4280
|
l0: 17
|
|
@@ -4283,6 +4293,7 @@ gemma-scope-2-4b-it-res:
|
|
|
4283
4293
|
- id: layer_9_width_262k_l0_medium
|
|
4284
4294
|
path: resid_post/layer_9_width_262k_l0_medium
|
|
4285
4295
|
l0: 53
|
|
4296
|
+
neuronpedia: gemma-3-4b-it/9-gemmascope-2-res-262k
|
|
4286
4297
|
- id: layer_9_width_262k_l0_medium_seed_1
|
|
4287
4298
|
path: resid_post/layer_9_width_262k_l0_medium_seed_1
|
|
4288
4299
|
l0: 53
|
|
@@ -4295,6 +4306,7 @@ gemma-scope-2-4b-it-res:
|
|
|
4295
4306
|
- id: layer_9_width_65k_l0_medium
|
|
4296
4307
|
path: resid_post/layer_9_width_65k_l0_medium
|
|
4297
4308
|
l0: 53
|
|
4309
|
+
neuronpedia: gemma-3-4b-it/9-gemmascope-2-res-65k
|
|
4298
4310
|
- id: layer_9_width_65k_l0_small
|
|
4299
4311
|
path: resid_post/layer_9_width_65k_l0_small
|
|
4300
4312
|
l0: 17
|
|
@@ -14491,6 +14503,7 @@ gemma-scope-2-270m-it-res:
|
|
|
14491
14503
|
- id: layer_12_width_16k_l0_medium
|
|
14492
14504
|
path: resid_post/layer_12_width_16k_l0_medium
|
|
14493
14505
|
l0: 60
|
|
14506
|
+
neuronpedia: gemma-3-270m-it/12-gemmascope-2-res-16k
|
|
14494
14507
|
- id: layer_12_width_16k_l0_small
|
|
14495
14508
|
path: resid_post/layer_12_width_16k_l0_small
|
|
14496
14509
|
l0: 20
|
|
@@ -14509,6 +14522,7 @@ gemma-scope-2-270m-it-res:
|
|
|
14509
14522
|
- id: layer_12_width_262k_l0_medium
|
|
14510
14523
|
path: resid_post/layer_12_width_262k_l0_medium
|
|
14511
14524
|
l0: 60
|
|
14525
|
+
neuronpedia: gemma-3-270m-it/12-gemmascope-2-res-262k
|
|
14512
14526
|
- id: layer_12_width_262k_l0_medium_seed_1
|
|
14513
14527
|
path: resid_post/layer_12_width_262k_l0_medium_seed_1
|
|
14514
14528
|
l0: 60
|
|
@@ -14521,6 +14535,7 @@ gemma-scope-2-270m-it-res:
|
|
|
14521
14535
|
- id: layer_12_width_65k_l0_medium
|
|
14522
14536
|
path: resid_post/layer_12_width_65k_l0_medium
|
|
14523
14537
|
l0: 60
|
|
14538
|
+
neuronpedia: gemma-3-270m-it/12-gemmascope-2-res-65k
|
|
14524
14539
|
- id: layer_12_width_65k_l0_small
|
|
14525
14540
|
path: resid_post/layer_12_width_65k_l0_small
|
|
14526
14541
|
l0: 20
|
|
@@ -14530,6 +14545,7 @@ gemma-scope-2-270m-it-res:
|
|
|
14530
14545
|
- id: layer_15_width_16k_l0_medium
|
|
14531
14546
|
path: resid_post/layer_15_width_16k_l0_medium
|
|
14532
14547
|
l0: 60
|
|
14548
|
+
neuronpedia: gemma-3-270m-it/15-gemmascope-2-res-16k
|
|
14533
14549
|
- id: layer_15_width_16k_l0_small
|
|
14534
14550
|
path: resid_post/layer_15_width_16k_l0_small
|
|
14535
14551
|
l0: 20
|
|
@@ -14548,6 +14564,7 @@ gemma-scope-2-270m-it-res:
|
|
|
14548
14564
|
- id: layer_15_width_262k_l0_medium
|
|
14549
14565
|
path: resid_post/layer_15_width_262k_l0_medium
|
|
14550
14566
|
l0: 60
|
|
14567
|
+
neuronpedia: gemma-3-270m-it/15-gemmascope-2-res-262k
|
|
14551
14568
|
- id: layer_15_width_262k_l0_medium_seed_1
|
|
14552
14569
|
path: resid_post/layer_15_width_262k_l0_medium_seed_1
|
|
14553
14570
|
l0: 60
|
|
@@ -14560,6 +14577,7 @@ gemma-scope-2-270m-it-res:
|
|
|
14560
14577
|
- id: layer_15_width_65k_l0_medium
|
|
14561
14578
|
path: resid_post/layer_15_width_65k_l0_medium
|
|
14562
14579
|
l0: 60
|
|
14580
|
+
neuronpedia: gemma-3-270m-it/15-gemmascope-2-res-65k
|
|
14563
14581
|
- id: layer_15_width_65k_l0_small
|
|
14564
14582
|
path: resid_post/layer_15_width_65k_l0_small
|
|
14565
14583
|
l0: 20
|
|
@@ -14569,6 +14587,7 @@ gemma-scope-2-270m-it-res:
|
|
|
14569
14587
|
- id: layer_5_width_16k_l0_medium
|
|
14570
14588
|
path: resid_post/layer_5_width_16k_l0_medium
|
|
14571
14589
|
l0: 55
|
|
14590
|
+
neuronpedia: gemma-3-270m-it/5-gemmascope-2-res-16k
|
|
14572
14591
|
- id: layer_5_width_16k_l0_small
|
|
14573
14592
|
path: resid_post/layer_5_width_16k_l0_small
|
|
14574
14593
|
l0: 18
|
|
@@ -14587,6 +14606,7 @@ gemma-scope-2-270m-it-res:
|
|
|
14587
14606
|
- id: layer_5_width_262k_l0_medium
|
|
14588
14607
|
path: resid_post/layer_5_width_262k_l0_medium
|
|
14589
14608
|
l0: 55
|
|
14609
|
+
neuronpedia: gemma-3-270m-it/5-gemmascope-2-res-262k
|
|
14590
14610
|
- id: layer_5_width_262k_l0_medium_seed_1
|
|
14591
14611
|
path: resid_post/layer_5_width_262k_l0_medium_seed_1
|
|
14592
14612
|
l0: 55
|
|
@@ -14599,6 +14619,7 @@ gemma-scope-2-270m-it-res:
|
|
|
14599
14619
|
- id: layer_5_width_65k_l0_medium
|
|
14600
14620
|
path: resid_post/layer_5_width_65k_l0_medium
|
|
14601
14621
|
l0: 55
|
|
14622
|
+
neuronpedia: gemma-3-270m-it/5-gemmascope-2-res-65k
|
|
14602
14623
|
- id: layer_5_width_65k_l0_small
|
|
14603
14624
|
path: resid_post/layer_5_width_65k_l0_small
|
|
14604
14625
|
l0: 18
|
|
@@ -14608,6 +14629,7 @@ gemma-scope-2-270m-it-res:
|
|
|
14608
14629
|
- id: layer_9_width_16k_l0_medium
|
|
14609
14630
|
path: resid_post/layer_9_width_16k_l0_medium
|
|
14610
14631
|
l0: 60
|
|
14632
|
+
neuronpedia: gemma-3-270m-it/9-gemmascope-2-res-16k
|
|
14611
14633
|
- id: layer_9_width_16k_l0_small
|
|
14612
14634
|
path: resid_post/layer_9_width_16k_l0_small
|
|
14613
14635
|
l0: 20
|
|
@@ -14626,6 +14648,7 @@ gemma-scope-2-270m-it-res:
|
|
|
14626
14648
|
- id: layer_9_width_262k_l0_medium
|
|
14627
14649
|
path: resid_post/layer_9_width_262k_l0_medium
|
|
14628
14650
|
l0: 60
|
|
14651
|
+
neuronpedia: gemma-3-270m-it/9-gemmascope-2-res-262k
|
|
14629
14652
|
- id: layer_9_width_262k_l0_medium_seed_1
|
|
14630
14653
|
path: resid_post/layer_9_width_262k_l0_medium_seed_1
|
|
14631
14654
|
l0: 60
|
|
@@ -14638,6 +14661,7 @@ gemma-scope-2-270m-it-res:
|
|
|
14638
14661
|
- id: layer_9_width_65k_l0_medium
|
|
14639
14662
|
path: resid_post/layer_9_width_65k_l0_medium
|
|
14640
14663
|
l0: 60
|
|
14664
|
+
neuronpedia: gemma-3-270m-it/9-gemmascope-2-res-65k
|
|
14641
14665
|
- id: layer_9_width_65k_l0_small
|
|
14642
14666
|
path: resid_post/layer_9_width_65k_l0_small
|
|
14643
14667
|
l0: 20
|
|
@@ -18727,6 +18751,7 @@ gemma-scope-2-1b-it-res:
|
|
|
18727
18751
|
- id: layer_13_width_16k_l0_medium
|
|
18728
18752
|
path: resid_post/layer_13_width_16k_l0_medium
|
|
18729
18753
|
l0: 60
|
|
18754
|
+
neuronpedia: gemma-3-1b-it/13-gemmascope-2-res-16k
|
|
18730
18755
|
- id: layer_13_width_16k_l0_small
|
|
18731
18756
|
path: resid_post/layer_13_width_16k_l0_small
|
|
18732
18757
|
l0: 20
|
|
@@ -18745,6 +18770,7 @@ gemma-scope-2-1b-it-res:
|
|
|
18745
18770
|
- id: layer_13_width_262k_l0_medium
|
|
18746
18771
|
path: resid_post/layer_13_width_262k_l0_medium
|
|
18747
18772
|
l0: 60
|
|
18773
|
+
neuronpedia: gemma-3-1b-it/13-gemmascope-2-res-262k
|
|
18748
18774
|
- id: layer_13_width_262k_l0_medium_seed_1
|
|
18749
18775
|
path: resid_post/layer_13_width_262k_l0_medium_seed_1
|
|
18750
18776
|
l0: 60
|
|
@@ -18757,6 +18783,7 @@ gemma-scope-2-1b-it-res:
|
|
|
18757
18783
|
- id: layer_13_width_65k_l0_medium
|
|
18758
18784
|
path: resid_post/layer_13_width_65k_l0_medium
|
|
18759
18785
|
l0: 60
|
|
18786
|
+
neuronpedia: gemma-3-1b-it/13-gemmascope-2-res-65k
|
|
18760
18787
|
- id: layer_13_width_65k_l0_small
|
|
18761
18788
|
path: resid_post/layer_13_width_65k_l0_small
|
|
18762
18789
|
l0: 20
|
|
@@ -18766,6 +18793,7 @@ gemma-scope-2-1b-it-res:
|
|
|
18766
18793
|
- id: layer_17_width_16k_l0_medium
|
|
18767
18794
|
path: resid_post/layer_17_width_16k_l0_medium
|
|
18768
18795
|
l0: 60
|
|
18796
|
+
neuronpedia: gemma-3-1b-it/17-gemmascope-2-res-16k
|
|
18769
18797
|
- id: layer_17_width_16k_l0_small
|
|
18770
18798
|
path: resid_post/layer_17_width_16k_l0_small
|
|
18771
18799
|
l0: 20
|
|
@@ -18784,6 +18812,7 @@ gemma-scope-2-1b-it-res:
|
|
|
18784
18812
|
- id: layer_17_width_262k_l0_medium
|
|
18785
18813
|
path: resid_post/layer_17_width_262k_l0_medium
|
|
18786
18814
|
l0: 60
|
|
18815
|
+
neuronpedia: gemma-3-1b-it/17-gemmascope-2-res-262k
|
|
18787
18816
|
- id: layer_17_width_262k_l0_medium_seed_1
|
|
18788
18817
|
path: resid_post/layer_17_width_262k_l0_medium_seed_1
|
|
18789
18818
|
l0: 60
|
|
@@ -18796,6 +18825,7 @@ gemma-scope-2-1b-it-res:
|
|
|
18796
18825
|
- id: layer_17_width_65k_l0_medium
|
|
18797
18826
|
path: resid_post/layer_17_width_65k_l0_medium
|
|
18798
18827
|
l0: 60
|
|
18828
|
+
neuronpedia: gemma-3-1b-it/17-gemmascope-2-res-65k
|
|
18799
18829
|
- id: layer_17_width_65k_l0_small
|
|
18800
18830
|
path: resid_post/layer_17_width_65k_l0_small
|
|
18801
18831
|
l0: 20
|
|
@@ -18805,6 +18835,7 @@ gemma-scope-2-1b-it-res:
|
|
|
18805
18835
|
- id: layer_22_width_16k_l0_medium
|
|
18806
18836
|
path: resid_post/layer_22_width_16k_l0_medium
|
|
18807
18837
|
l0: 60
|
|
18838
|
+
neuronpedia: gemma-3-1b-it/22-gemmascope-2-res-16k
|
|
18808
18839
|
- id: layer_22_width_16k_l0_small
|
|
18809
18840
|
path: resid_post/layer_22_width_16k_l0_small
|
|
18810
18841
|
l0: 20
|
|
@@ -18823,6 +18854,7 @@ gemma-scope-2-1b-it-res:
|
|
|
18823
18854
|
- id: layer_22_width_262k_l0_medium
|
|
18824
18855
|
path: resid_post/layer_22_width_262k_l0_medium
|
|
18825
18856
|
l0: 60
|
|
18857
|
+
neuronpedia: gemma-3-1b-it/22-gemmascope-2-res-262k
|
|
18826
18858
|
- id: layer_22_width_262k_l0_medium_seed_1
|
|
18827
18859
|
path: resid_post/layer_22_width_262k_l0_medium_seed_1
|
|
18828
18860
|
l0: 60
|
|
@@ -18835,6 +18867,7 @@ gemma-scope-2-1b-it-res:
|
|
|
18835
18867
|
- id: layer_22_width_65k_l0_medium
|
|
18836
18868
|
path: resid_post/layer_22_width_65k_l0_medium
|
|
18837
18869
|
l0: 60
|
|
18870
|
+
neuronpedia: gemma-3-1b-it/22-gemmascope-2-res-65k
|
|
18838
18871
|
- id: layer_22_width_65k_l0_small
|
|
18839
18872
|
path: resid_post/layer_22_width_65k_l0_small
|
|
18840
18873
|
l0: 20
|
|
@@ -18844,6 +18877,7 @@ gemma-scope-2-1b-it-res:
|
|
|
18844
18877
|
- id: layer_7_width_16k_l0_medium
|
|
18845
18878
|
path: resid_post/layer_7_width_16k_l0_medium
|
|
18846
18879
|
l0: 54
|
|
18880
|
+
neuronpedia: gemma-3-1b-it/7-gemmascope-2-res-16k
|
|
18847
18881
|
- id: layer_7_width_16k_l0_small
|
|
18848
18882
|
path: resid_post/layer_7_width_16k_l0_small
|
|
18849
18883
|
l0: 18
|
|
@@ -18862,6 +18896,7 @@ gemma-scope-2-1b-it-res:
|
|
|
18862
18896
|
- id: layer_7_width_262k_l0_medium
|
|
18863
18897
|
path: resid_post/layer_7_width_262k_l0_medium
|
|
18864
18898
|
l0: 54
|
|
18899
|
+
neuronpedia: gemma-3-1b-it/7-gemmascope-2-res-262k
|
|
18865
18900
|
- id: layer_7_width_262k_l0_medium_seed_1
|
|
18866
18901
|
path: resid_post/layer_7_width_262k_l0_medium_seed_1
|
|
18867
18902
|
l0: 54
|
|
@@ -18874,6 +18909,7 @@ gemma-scope-2-1b-it-res:
|
|
|
18874
18909
|
- id: layer_7_width_65k_l0_medium
|
|
18875
18910
|
path: resid_post/layer_7_width_65k_l0_medium
|
|
18876
18911
|
l0: 54
|
|
18912
|
+
neuronpedia: gemma-3-1b-it/7-gemmascope-2-res-65k
|
|
18877
18913
|
- id: layer_7_width_65k_l0_small
|
|
18878
18914
|
path: resid_post/layer_7_width_65k_l0_small
|
|
18879
18915
|
l0: 18
|
|
@@ -28,7 +28,9 @@ class ActivationScaler:
|
|
|
28
28
|
) -> float:
|
|
29
29
|
norms_per_batch: list[float] = []
|
|
30
30
|
for _ in tqdm(
|
|
31
|
-
range(n_batches_for_norm_estimate),
|
|
31
|
+
range(n_batches_for_norm_estimate),
|
|
32
|
+
desc="Estimating norm scaling factor",
|
|
33
|
+
leave=False,
|
|
32
34
|
):
|
|
33
35
|
acts = next(data_provider)
|
|
34
36
|
norms_per_batch.append(acts.norm(dim=-1).mean().item())
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|