Upload folder using huggingface_hub
Browse files
- config.json +1 -0
- layers.12/cfg.json +1 -0
- layers.12/sae.safetensors +3 -0
- layers.24/cfg.json +1 -0
- layers.24/sae.safetensors +3 -0
- lr_scheduler.pt +3 -0
- optimizer.pt +3 -0
- state.pt +3 -0
config.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"sae": {"expansion_factor": 16, "normalize_decoder": true, "num_latents": 0, "k": 64, "multi_topk": false}, "batch_size": 8, "grad_acc_steps": 1, "micro_acc_steps": 1, "lr": null, "lr_warmup_steps": 1000, "auxk_alpha": 0.0, "dead_feature_threshold": 10000000, "hookpoints": ["layers.12", "layers.24"], "layers": [12, 24], "layer_stride": 1, "distribute_modules": false, "save_every": 1000, "log_to_wandb": true, "run_name": null, "wandb_log_frequency": 1, "model": "Qwen/Qwen2.5-14B-Instruct", "dataset": "huypn16/MetaMath-SAE", "split": "train", "ctx_len": 1024, "hf_token": null, "load_in_8bit": false, "max_examples": null, "resume": false, "seed": 42, "data_preprocessing_num_proc": 24}
|
layers.12/cfg.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"expansion_factor": 16, "normalize_decoder": true, "num_latents": 0, "k": 64, "multi_topk": false, "d_in": 5120}
|
layers.12/sae.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7ad7c5fec65d7eb56ee9f212f53efc65dd2c7e464f0ed107ea0a7b1b467ba5cc
|
3 |
+
size 3355791704
|
layers.24/cfg.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"expansion_factor": 16, "normalize_decoder": true, "num_latents": 0, "k": 64, "multi_topk": false, "d_in": 5120}
|
layers.24/sae.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:23c9b7d0ffe5492c241d3cad7de526ff42ec9bf5b7585fc9987a317b8cf723a6
|
3 |
+
size 3355791704
|
lr_scheduler.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e747615ab3933914278413dde8e9c9b677d18d672e39e45e7e1bf49d3d2d3628
|
3 |
+
size 1076
|
optimizer.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:274927ec6b42aab1e8768317b2093c1e8df41f2ee5e5006226c1ecdecb058611
|
3 |
+
size 13423173106
|
state.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:dc5e136675c5d7874d5482347ec995bac4197d97821e38615e6966eaddd0c78d
|
3 |
+
size 1312076
|