jacobcd52
/

insecure_diffing

jacobcd52 committed on Mar 1, 2025

Commit

9fffbc0

verified ·

1 Parent(s): fbc92fc

Upload trainer_0/config.json with huggingface_hub

Files changed (1) hide show

trainer_0/config.json CHANGED Viewed

@@ -1,31 +1,29 @@
 {
     "trainer": {
-        "trainer_class": "TopKTrainer",
-        "dict_class": "AutoEncoderTopK",
-        "lr": 0.00010690449676496975,
-        "steps": 12,
-        "auxk_alpha": 0.03125,
         "warmup_steps": 0,
         "decay_start": null,
-        "threshold_beta": 0.999,
-        "threshold_start_step": 1000,
         "seed": null,
-        "activation_dim": 896,
-        "dict_size": 57344,
-        "k": 128,
         "device": "cuda:2",
-        "layer": 4,
         "lm_name": "blah",
-        "wandb_name": "AutoEncoderTopK",
         "submodule_name": null
     },
     "buffer": {
-        "n_models": 1,
         "d_submodule": 896,
         "io": "out",
-        "n_ctxs": 1024,
-        "ctx_len": 128,
-        "refresh_batch_size": 128,
         "out_batch_size": 8192,
         "device": "cuda:2",
         "rescale_acts": false

 {
     "trainer": {
+        "dict_class": "AutoEncoder",
+        "trainer_class": "StandardTrainerAprilUpdate",
+        "activation_dim": 1792,
+        "dict_size": 57344,
+        "lr": 1e-06,
+        "l1_penalty": 0.01,
         "warmup_steps": 0,
+        "sparsity_warmup_steps": 2000,
+        "steps": 61035,
         "decay_start": null,
         "seed": null,
         "device": "cuda:2",
+        "layer": 7,
         "lm_name": "blah",
+        "wandb_name": "StandardTrainerAprilUpdate",
         "submodule_name": null
     },
     "buffer": {
+        "n_models": 2,
         "d_submodule": 896,
         "io": "out",
+        "n_ctxs": 512,
+        "ctx_len": 256,
+        "refresh_batch_size": 512,
         "out_batch_size": 8192,
         "device": "cuda:2",
         "rescale_acts": false