neuronpedia committed on
Commit
b8f0a8f
1 Parent(s): 6f5a342

Upload 3 files

Browse files
8-res_fs49152-jb/cfg.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"model_name": "gpt2-small", "hook_point": "blocks.8.hook_resid_pre", "hook_point_layer": 8, "hook_point_head_index": null, "dataset_path": "Skylion007/openwebtext", "is_dataset_tokenized": false, "context_size": 128, "use_cached_activations": false, "cached_activations_path": "activations/Skylion007_openwebtext/gpt2-small/blocks.8.hook_resid_pre", "d_in": 768, "n_batches_in_buffer": 128, "total_training_tokens": 300000000, "store_batch_size": 32, "device": "mps", "seed": 42, "dtype": "torch.float32", "b_dec_init_method": "geometric_median", "expansion_factor": 64, "from_pretrained_path": null, "l1_coefficient": 8e-05, "lr": 0.0004, "lr_scheduler_name": null, "lr_warm_up_steps": 5000, "train_batch_size": 4096, "use_ghost_grads": true, "feature_sampling_window": 1000, "feature_sampling_method": null, "resample_batches": 1028, "feature_reinit_scale": 0.2, "dead_feature_window": 5000, "dead_feature_estimation_method": "no_fire", "dead_feature_threshold": 1e-08, "log_to_wandb": true, "wandb_project": "mats_sae_training_gpt2_feature_splitting_experiment", "wandb_entity": null, "wandb_log_frequency": 100, "n_checkpoints": 10, "checkpoint_path": "checkpoints/u4xlxwrh", "d_sae": 49152, "tokens_per_buffer": 67108864, "run_name": "49152-L1-8e-05-LR-0.0004-Tokens-3.000e+08"}
8-res_fs49152-jb/sae_weights.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1a350ad88c73be15c28ca552d4ef9425bc39dac71b2fe11c9943be4041aea3a1
3
+ size 302386584
8-res_fs49152-jb/sparsity.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7a57a8b877e10dae8bb43407191e6a531a82942a352bb94d2e3006cd4aff6c35
3
+ size 196688