Upload folder using huggingface_hub
Browse files
- gemma-2-2b_sweep_standard_ctx128_ef8_0824/resid_post_layer_11/trainer_0/config.json +2 -1
- gemma-2-2b_sweep_standard_ctx128_ef8_0824/resid_post_layer_11/trainer_1/config.json +2 -1
- gemma-2-2b_sweep_standard_ctx128_ef8_0824/resid_post_layer_11/trainer_2/config.json +2 -1
- gemma-2-2b_sweep_standard_ctx128_ef8_0824/resid_post_layer_11/trainer_3/config.json +2 -1
- gemma-2-2b_sweep_standard_ctx128_ef8_0824/resid_post_layer_11/trainer_4/config.json +2 -1
- gemma-2-2b_sweep_standard_ctx128_ef8_0824/resid_post_layer_11/trainer_5/config.json +2 -1
- gemma-2-2b_sweep_standard_ctx128_ef8_0824/resid_post_layer_15/trainer_0/config.json +2 -1
- gemma-2-2b_sweep_standard_ctx128_ef8_0824/resid_post_layer_15/trainer_1/config.json +2 -1
- gemma-2-2b_sweep_standard_ctx128_ef8_0824/resid_post_layer_15/trainer_2/config.json +2 -1
- gemma-2-2b_sweep_standard_ctx128_ef8_0824/resid_post_layer_15/trainer_3/config.json +2 -1
- gemma-2-2b_sweep_standard_ctx128_ef8_0824/resid_post_layer_15/trainer_4/config.json +2 -1
- gemma-2-2b_sweep_standard_ctx128_ef8_0824/resid_post_layer_15/trainer_5/config.json +2 -1
- gemma-2-2b_sweep_standard_ctx128_ef8_0824/resid_post_layer_19/trainer_0/config.json +2 -1
- gemma-2-2b_sweep_standard_ctx128_ef8_0824/resid_post_layer_19/trainer_1/config.json +2 -1
- gemma-2-2b_sweep_standard_ctx128_ef8_0824/resid_post_layer_19/trainer_2/config.json +2 -1
- gemma-2-2b_sweep_standard_ctx128_ef8_0824/resid_post_layer_19/trainer_3/config.json +2 -1
- gemma-2-2b_sweep_standard_ctx128_ef8_0824/resid_post_layer_19/trainer_4/config.json +2 -1
- gemma-2-2b_sweep_standard_ctx128_ef8_0824/resid_post_layer_19/trainer_5/config.json +2 -1
- gemma-2-2b_sweep_standard_ctx128_ef8_0824/resid_post_layer_3/trainer_0/config.json +2 -1
- gemma-2-2b_sweep_standard_ctx128_ef8_0824/resid_post_layer_3/trainer_1/config.json +2 -1
- gemma-2-2b_sweep_standard_ctx128_ef8_0824/resid_post_layer_3/trainer_2/config.json +2 -1
- gemma-2-2b_sweep_standard_ctx128_ef8_0824/resid_post_layer_3/trainer_3/config.json +2 -1
- gemma-2-2b_sweep_standard_ctx128_ef8_0824/resid_post_layer_3/trainer_4/config.json +2 -1
- gemma-2-2b_sweep_standard_ctx128_ef8_0824/resid_post_layer_3/trainer_5/config.json +2 -1
- gemma-2-2b_sweep_standard_ctx128_ef8_0824/resid_post_layer_7/trainer_0/config.json +2 -1
- gemma-2-2b_sweep_standard_ctx128_ef8_0824/resid_post_layer_7/trainer_1/config.json +2 -1
- gemma-2-2b_sweep_standard_ctx128_ef8_0824/resid_post_layer_7/trainer_2/config.json +2 -1
- gemma-2-2b_sweep_standard_ctx128_ef8_0824/resid_post_layer_7/trainer_3/config.json +2 -1
- gemma-2-2b_sweep_standard_ctx128_ef8_0824/resid_post_layer_7/trainer_4/config.json +2 -1
- gemma-2-2b_sweep_standard_ctx128_ef8_0824/resid_post_layer_7/trainer_5/config.json +2 -1
gemma-2-2b_sweep_standard_ctx128_ef8_0824/resid_post_layer_11/trainer_0/config.json
CHANGED
@@ -12,7 +12,8 @@
|
|
12 |
"layer": 11,
|
13 |
"lm_name": "google/gemma-2-2b",
|
14 |
"wandb_name": "StandardTrainer-google/gemma-2-2b-resid_post_layer_11",
|
15 |
-
"submodule_name": "resid_post_layer_11"
|
|
|
16 |
},
|
17 |
"buffer": {
|
18 |
"d_submodule": 2304,
|
|
|
12 |
"layer": 11,
|
13 |
"lm_name": "google/gemma-2-2b",
|
14 |
"wandb_name": "StandardTrainer-google/gemma-2-2b-resid_post_layer_11",
|
15 |
+
"submodule_name": "resid_post_layer_11",
|
16 |
+
"steps": "48828"
|
17 |
},
|
18 |
"buffer": {
|
19 |
"d_submodule": 2304,
|
gemma-2-2b_sweep_standard_ctx128_ef8_0824/resid_post_layer_11/trainer_1/config.json
CHANGED
@@ -12,7 +12,8 @@
|
|
12 |
"layer": 11,
|
13 |
"lm_name": "google/gemma-2-2b",
|
14 |
"wandb_name": "StandardTrainer-google/gemma-2-2b-resid_post_layer_11",
|
15 |
-
"submodule_name": "resid_post_layer_11"
|
|
|
16 |
},
|
17 |
"buffer": {
|
18 |
"d_submodule": 2304,
|
|
|
12 |
"layer": 11,
|
13 |
"lm_name": "google/gemma-2-2b",
|
14 |
"wandb_name": "StandardTrainer-google/gemma-2-2b-resid_post_layer_11",
|
15 |
+
"submodule_name": "resid_post_layer_11",
|
16 |
+
"steps": "48828"
|
17 |
},
|
18 |
"buffer": {
|
19 |
"d_submodule": 2304,
|
gemma-2-2b_sweep_standard_ctx128_ef8_0824/resid_post_layer_11/trainer_2/config.json
CHANGED
@@ -12,7 +12,8 @@
|
|
12 |
"layer": 11,
|
13 |
"lm_name": "google/gemma-2-2b",
|
14 |
"wandb_name": "StandardTrainer-google/gemma-2-2b-resid_post_layer_11",
|
15 |
-
"submodule_name": "resid_post_layer_11"
|
|
|
16 |
},
|
17 |
"buffer": {
|
18 |
"d_submodule": 2304,
|
|
|
12 |
"layer": 11,
|
13 |
"lm_name": "google/gemma-2-2b",
|
14 |
"wandb_name": "StandardTrainer-google/gemma-2-2b-resid_post_layer_11",
|
15 |
+
"submodule_name": "resid_post_layer_11",
|
16 |
+
"steps": "48828"
|
17 |
},
|
18 |
"buffer": {
|
19 |
"d_submodule": 2304,
|
gemma-2-2b_sweep_standard_ctx128_ef8_0824/resid_post_layer_11/trainer_3/config.json
CHANGED
@@ -12,7 +12,8 @@
|
|
12 |
"layer": 11,
|
13 |
"lm_name": "google/gemma-2-2b",
|
14 |
"wandb_name": "StandardTrainer-google/gemma-2-2b-resid_post_layer_11",
|
15 |
-
"submodule_name": "resid_post_layer_11"
|
|
|
16 |
},
|
17 |
"buffer": {
|
18 |
"d_submodule": 2304,
|
|
|
12 |
"layer": 11,
|
13 |
"lm_name": "google/gemma-2-2b",
|
14 |
"wandb_name": "StandardTrainer-google/gemma-2-2b-resid_post_layer_11",
|
15 |
+
"submodule_name": "resid_post_layer_11",
|
16 |
+
"steps": "48828"
|
17 |
},
|
18 |
"buffer": {
|
19 |
"d_submodule": 2304,
|
gemma-2-2b_sweep_standard_ctx128_ef8_0824/resid_post_layer_11/trainer_4/config.json
CHANGED
@@ -12,7 +12,8 @@
|
|
12 |
"layer": 11,
|
13 |
"lm_name": "google/gemma-2-2b",
|
14 |
"wandb_name": "StandardTrainer-google/gemma-2-2b-resid_post_layer_11",
|
15 |
-
"submodule_name": "resid_post_layer_11"
|
|
|
16 |
},
|
17 |
"buffer": {
|
18 |
"d_submodule": 2304,
|
|
|
12 |
"layer": 11,
|
13 |
"lm_name": "google/gemma-2-2b",
|
14 |
"wandb_name": "StandardTrainer-google/gemma-2-2b-resid_post_layer_11",
|
15 |
+
"submodule_name": "resid_post_layer_11",
|
16 |
+
"steps": "48828"
|
17 |
},
|
18 |
"buffer": {
|
19 |
"d_submodule": 2304,
|
gemma-2-2b_sweep_standard_ctx128_ef8_0824/resid_post_layer_11/trainer_5/config.json
CHANGED
@@ -12,7 +12,8 @@
|
|
12 |
"layer": 11,
|
13 |
"lm_name": "google/gemma-2-2b",
|
14 |
"wandb_name": "StandardTrainer-google/gemma-2-2b-resid_post_layer_11",
|
15 |
-
"submodule_name": "resid_post_layer_11"
|
|
|
16 |
},
|
17 |
"buffer": {
|
18 |
"d_submodule": 2304,
|
|
|
12 |
"layer": 11,
|
13 |
"lm_name": "google/gemma-2-2b",
|
14 |
"wandb_name": "StandardTrainer-google/gemma-2-2b-resid_post_layer_11",
|
15 |
+
"submodule_name": "resid_post_layer_11",
|
16 |
+
"steps": "48828"
|
17 |
},
|
18 |
"buffer": {
|
19 |
"d_submodule": 2304,
|
gemma-2-2b_sweep_standard_ctx128_ef8_0824/resid_post_layer_15/trainer_0/config.json
CHANGED
@@ -12,7 +12,8 @@
|
|
12 |
"layer": 15,
|
13 |
"lm_name": "google/gemma-2-2b",
|
14 |
"wandb_name": "StandardTrainer-google/gemma-2-2b-resid_post_layer_15",
|
15 |
-
"submodule_name": "resid_post_layer_15"
|
|
|
16 |
},
|
17 |
"buffer": {
|
18 |
"d_submodule": 2304,
|
|
|
12 |
"layer": 15,
|
13 |
"lm_name": "google/gemma-2-2b",
|
14 |
"wandb_name": "StandardTrainer-google/gemma-2-2b-resid_post_layer_15",
|
15 |
+
"submodule_name": "resid_post_layer_15",
|
16 |
+
"steps": "48828"
|
17 |
},
|
18 |
"buffer": {
|
19 |
"d_submodule": 2304,
|
gemma-2-2b_sweep_standard_ctx128_ef8_0824/resid_post_layer_15/trainer_1/config.json
CHANGED
@@ -12,7 +12,8 @@
|
|
12 |
"layer": 15,
|
13 |
"lm_name": "google/gemma-2-2b",
|
14 |
"wandb_name": "StandardTrainer-google/gemma-2-2b-resid_post_layer_15",
|
15 |
-
"submodule_name": "resid_post_layer_15"
|
|
|
16 |
},
|
17 |
"buffer": {
|
18 |
"d_submodule": 2304,
|
|
|
12 |
"layer": 15,
|
13 |
"lm_name": "google/gemma-2-2b",
|
14 |
"wandb_name": "StandardTrainer-google/gemma-2-2b-resid_post_layer_15",
|
15 |
+
"submodule_name": "resid_post_layer_15",
|
16 |
+
"steps": "48828"
|
17 |
},
|
18 |
"buffer": {
|
19 |
"d_submodule": 2304,
|
gemma-2-2b_sweep_standard_ctx128_ef8_0824/resid_post_layer_15/trainer_2/config.json
CHANGED
@@ -12,7 +12,8 @@
|
|
12 |
"layer": 15,
|
13 |
"lm_name": "google/gemma-2-2b",
|
14 |
"wandb_name": "StandardTrainer-google/gemma-2-2b-resid_post_layer_15",
|
15 |
-
"submodule_name": "resid_post_layer_15"
|
|
|
16 |
},
|
17 |
"buffer": {
|
18 |
"d_submodule": 2304,
|
|
|
12 |
"layer": 15,
|
13 |
"lm_name": "google/gemma-2-2b",
|
14 |
"wandb_name": "StandardTrainer-google/gemma-2-2b-resid_post_layer_15",
|
15 |
+
"submodule_name": "resid_post_layer_15",
|
16 |
+
"steps": "48828"
|
17 |
},
|
18 |
"buffer": {
|
19 |
"d_submodule": 2304,
|
gemma-2-2b_sweep_standard_ctx128_ef8_0824/resid_post_layer_15/trainer_3/config.json
CHANGED
@@ -12,7 +12,8 @@
|
|
12 |
"layer": 15,
|
13 |
"lm_name": "google/gemma-2-2b",
|
14 |
"wandb_name": "StandardTrainer-google/gemma-2-2b-resid_post_layer_15",
|
15 |
-
"submodule_name": "resid_post_layer_15"
|
|
|
16 |
},
|
17 |
"buffer": {
|
18 |
"d_submodule": 2304,
|
|
|
12 |
"layer": 15,
|
13 |
"lm_name": "google/gemma-2-2b",
|
14 |
"wandb_name": "StandardTrainer-google/gemma-2-2b-resid_post_layer_15",
|
15 |
+
"submodule_name": "resid_post_layer_15",
|
16 |
+
"steps": "48828"
|
17 |
},
|
18 |
"buffer": {
|
19 |
"d_submodule": 2304,
|
gemma-2-2b_sweep_standard_ctx128_ef8_0824/resid_post_layer_15/trainer_4/config.json
CHANGED
@@ -12,7 +12,8 @@
|
|
12 |
"layer": 15,
|
13 |
"lm_name": "google/gemma-2-2b",
|
14 |
"wandb_name": "StandardTrainer-google/gemma-2-2b-resid_post_layer_15",
|
15 |
-
"submodule_name": "resid_post_layer_15"
|
|
|
16 |
},
|
17 |
"buffer": {
|
18 |
"d_submodule": 2304,
|
|
|
12 |
"layer": 15,
|
13 |
"lm_name": "google/gemma-2-2b",
|
14 |
"wandb_name": "StandardTrainer-google/gemma-2-2b-resid_post_layer_15",
|
15 |
+
"submodule_name": "resid_post_layer_15",
|
16 |
+
"steps": "48828"
|
17 |
},
|
18 |
"buffer": {
|
19 |
"d_submodule": 2304,
|
gemma-2-2b_sweep_standard_ctx128_ef8_0824/resid_post_layer_15/trainer_5/config.json
CHANGED
@@ -12,7 +12,8 @@
|
|
12 |
"layer": 15,
|
13 |
"lm_name": "google/gemma-2-2b",
|
14 |
"wandb_name": "StandardTrainer-google/gemma-2-2b-resid_post_layer_15",
|
15 |
-
"submodule_name": "resid_post_layer_15"
|
|
|
16 |
},
|
17 |
"buffer": {
|
18 |
"d_submodule": 2304,
|
|
|
12 |
"layer": 15,
|
13 |
"lm_name": "google/gemma-2-2b",
|
14 |
"wandb_name": "StandardTrainer-google/gemma-2-2b-resid_post_layer_15",
|
15 |
+
"submodule_name": "resid_post_layer_15",
|
16 |
+
"steps": "48828"
|
17 |
},
|
18 |
"buffer": {
|
19 |
"d_submodule": 2304,
|
gemma-2-2b_sweep_standard_ctx128_ef8_0824/resid_post_layer_19/trainer_0/config.json
CHANGED
@@ -12,7 +12,8 @@
|
|
12 |
"layer": 19,
|
13 |
"lm_name": "google/gemma-2-2b",
|
14 |
"wandb_name": "StandardTrainer-google/gemma-2-2b-resid_post_layer_19",
|
15 |
-
"submodule_name": "resid_post_layer_19"
|
|
|
16 |
},
|
17 |
"buffer": {
|
18 |
"d_submodule": 2304,
|
|
|
12 |
"layer": 19,
|
13 |
"lm_name": "google/gemma-2-2b",
|
14 |
"wandb_name": "StandardTrainer-google/gemma-2-2b-resid_post_layer_19",
|
15 |
+
"submodule_name": "resid_post_layer_19",
|
16 |
+
"steps": "48828"
|
17 |
},
|
18 |
"buffer": {
|
19 |
"d_submodule": 2304,
|
gemma-2-2b_sweep_standard_ctx128_ef8_0824/resid_post_layer_19/trainer_1/config.json
CHANGED
@@ -12,7 +12,8 @@
|
|
12 |
"layer": 19,
|
13 |
"lm_name": "google/gemma-2-2b",
|
14 |
"wandb_name": "StandardTrainer-google/gemma-2-2b-resid_post_layer_19",
|
15 |
-
"submodule_name": "resid_post_layer_19"
|
|
|
16 |
},
|
17 |
"buffer": {
|
18 |
"d_submodule": 2304,
|
|
|
12 |
"layer": 19,
|
13 |
"lm_name": "google/gemma-2-2b",
|
14 |
"wandb_name": "StandardTrainer-google/gemma-2-2b-resid_post_layer_19",
|
15 |
+
"submodule_name": "resid_post_layer_19",
|
16 |
+
"steps": "48828"
|
17 |
},
|
18 |
"buffer": {
|
19 |
"d_submodule": 2304,
|
gemma-2-2b_sweep_standard_ctx128_ef8_0824/resid_post_layer_19/trainer_2/config.json
CHANGED
@@ -12,7 +12,8 @@
|
|
12 |
"layer": 19,
|
13 |
"lm_name": "google/gemma-2-2b",
|
14 |
"wandb_name": "StandardTrainer-google/gemma-2-2b-resid_post_layer_19",
|
15 |
-
"submodule_name": "resid_post_layer_19"
|
|
|
16 |
},
|
17 |
"buffer": {
|
18 |
"d_submodule": 2304,
|
|
|
12 |
"layer": 19,
|
13 |
"lm_name": "google/gemma-2-2b",
|
14 |
"wandb_name": "StandardTrainer-google/gemma-2-2b-resid_post_layer_19",
|
15 |
+
"submodule_name": "resid_post_layer_19",
|
16 |
+
"steps": "48828"
|
17 |
},
|
18 |
"buffer": {
|
19 |
"d_submodule": 2304,
|
gemma-2-2b_sweep_standard_ctx128_ef8_0824/resid_post_layer_19/trainer_3/config.json
CHANGED
@@ -12,7 +12,8 @@
|
|
12 |
"layer": 19,
|
13 |
"lm_name": "google/gemma-2-2b",
|
14 |
"wandb_name": "StandardTrainer-google/gemma-2-2b-resid_post_layer_19",
|
15 |
-
"submodule_name": "resid_post_layer_19"
|
|
|
16 |
},
|
17 |
"buffer": {
|
18 |
"d_submodule": 2304,
|
|
|
12 |
"layer": 19,
|
13 |
"lm_name": "google/gemma-2-2b",
|
14 |
"wandb_name": "StandardTrainer-google/gemma-2-2b-resid_post_layer_19",
|
15 |
+
"submodule_name": "resid_post_layer_19",
|
16 |
+
"steps": "48828"
|
17 |
},
|
18 |
"buffer": {
|
19 |
"d_submodule": 2304,
|
gemma-2-2b_sweep_standard_ctx128_ef8_0824/resid_post_layer_19/trainer_4/config.json
CHANGED
@@ -12,7 +12,8 @@
|
|
12 |
"layer": 19,
|
13 |
"lm_name": "google/gemma-2-2b",
|
14 |
"wandb_name": "StandardTrainer-google/gemma-2-2b-resid_post_layer_19",
|
15 |
-
"submodule_name": "resid_post_layer_19"
|
|
|
16 |
},
|
17 |
"buffer": {
|
18 |
"d_submodule": 2304,
|
|
|
12 |
"layer": 19,
|
13 |
"lm_name": "google/gemma-2-2b",
|
14 |
"wandb_name": "StandardTrainer-google/gemma-2-2b-resid_post_layer_19",
|
15 |
+
"submodule_name": "resid_post_layer_19",
|
16 |
+
"steps": "48828"
|
17 |
},
|
18 |
"buffer": {
|
19 |
"d_submodule": 2304,
|
gemma-2-2b_sweep_standard_ctx128_ef8_0824/resid_post_layer_19/trainer_5/config.json
CHANGED
@@ -12,7 +12,8 @@
|
|
12 |
"layer": 19,
|
13 |
"lm_name": "google/gemma-2-2b",
|
14 |
"wandb_name": "StandardTrainer-google/gemma-2-2b-resid_post_layer_19",
|
15 |
-
"submodule_name": "resid_post_layer_19"
|
|
|
16 |
},
|
17 |
"buffer": {
|
18 |
"d_submodule": 2304,
|
|
|
12 |
"layer": 19,
|
13 |
"lm_name": "google/gemma-2-2b",
|
14 |
"wandb_name": "StandardTrainer-google/gemma-2-2b-resid_post_layer_19",
|
15 |
+
"submodule_name": "resid_post_layer_19",
|
16 |
+
"steps": "48828"
|
17 |
},
|
18 |
"buffer": {
|
19 |
"d_submodule": 2304,
|
gemma-2-2b_sweep_standard_ctx128_ef8_0824/resid_post_layer_3/trainer_0/config.json
CHANGED
@@ -12,7 +12,8 @@
|
|
12 |
"layer": 3,
|
13 |
"lm_name": "google/gemma-2-2b",
|
14 |
"wandb_name": "StandardTrainer-google/gemma-2-2b-resid_post_layer_3",
|
15 |
-
"submodule_name": "resid_post_layer_3"
|
|
|
16 |
},
|
17 |
"buffer": {
|
18 |
"d_submodule": 2304,
|
|
|
12 |
"layer": 3,
|
13 |
"lm_name": "google/gemma-2-2b",
|
14 |
"wandb_name": "StandardTrainer-google/gemma-2-2b-resid_post_layer_3",
|
15 |
+
"submodule_name": "resid_post_layer_3",
|
16 |
+
"steps": "48828"
|
17 |
},
|
18 |
"buffer": {
|
19 |
"d_submodule": 2304,
|
gemma-2-2b_sweep_standard_ctx128_ef8_0824/resid_post_layer_3/trainer_1/config.json
CHANGED
@@ -12,7 +12,8 @@
|
|
12 |
"layer": 3,
|
13 |
"lm_name": "google/gemma-2-2b",
|
14 |
"wandb_name": "StandardTrainer-google/gemma-2-2b-resid_post_layer_3",
|
15 |
-
"submodule_name": "resid_post_layer_3"
|
|
|
16 |
},
|
17 |
"buffer": {
|
18 |
"d_submodule": 2304,
|
|
|
12 |
"layer": 3,
|
13 |
"lm_name": "google/gemma-2-2b",
|
14 |
"wandb_name": "StandardTrainer-google/gemma-2-2b-resid_post_layer_3",
|
15 |
+
"submodule_name": "resid_post_layer_3",
|
16 |
+
"steps": "48828"
|
17 |
},
|
18 |
"buffer": {
|
19 |
"d_submodule": 2304,
|
gemma-2-2b_sweep_standard_ctx128_ef8_0824/resid_post_layer_3/trainer_2/config.json
CHANGED
@@ -12,7 +12,8 @@
|
|
12 |
"layer": 3,
|
13 |
"lm_name": "google/gemma-2-2b",
|
14 |
"wandb_name": "StandardTrainer-google/gemma-2-2b-resid_post_layer_3",
|
15 |
-
"submodule_name": "resid_post_layer_3"
|
|
|
16 |
},
|
17 |
"buffer": {
|
18 |
"d_submodule": 2304,
|
|
|
12 |
"layer": 3,
|
13 |
"lm_name": "google/gemma-2-2b",
|
14 |
"wandb_name": "StandardTrainer-google/gemma-2-2b-resid_post_layer_3",
|
15 |
+
"submodule_name": "resid_post_layer_3",
|
16 |
+
"steps": "48828"
|
17 |
},
|
18 |
"buffer": {
|
19 |
"d_submodule": 2304,
|
gemma-2-2b_sweep_standard_ctx128_ef8_0824/resid_post_layer_3/trainer_3/config.json
CHANGED
@@ -12,7 +12,8 @@
|
|
12 |
"layer": 3,
|
13 |
"lm_name": "google/gemma-2-2b",
|
14 |
"wandb_name": "StandardTrainer-google/gemma-2-2b-resid_post_layer_3",
|
15 |
-
"submodule_name": "resid_post_layer_3"
|
|
|
16 |
},
|
17 |
"buffer": {
|
18 |
"d_submodule": 2304,
|
|
|
12 |
"layer": 3,
|
13 |
"lm_name": "google/gemma-2-2b",
|
14 |
"wandb_name": "StandardTrainer-google/gemma-2-2b-resid_post_layer_3",
|
15 |
+
"submodule_name": "resid_post_layer_3",
|
16 |
+
"steps": "48828"
|
17 |
},
|
18 |
"buffer": {
|
19 |
"d_submodule": 2304,
|
gemma-2-2b_sweep_standard_ctx128_ef8_0824/resid_post_layer_3/trainer_4/config.json
CHANGED
@@ -12,7 +12,8 @@
|
|
12 |
"layer": 3,
|
13 |
"lm_name": "google/gemma-2-2b",
|
14 |
"wandb_name": "StandardTrainer-google/gemma-2-2b-resid_post_layer_3",
|
15 |
-
"submodule_name": "resid_post_layer_3"
|
|
|
16 |
},
|
17 |
"buffer": {
|
18 |
"d_submodule": 2304,
|
|
|
12 |
"layer": 3,
|
13 |
"lm_name": "google/gemma-2-2b",
|
14 |
"wandb_name": "StandardTrainer-google/gemma-2-2b-resid_post_layer_3",
|
15 |
+
"submodule_name": "resid_post_layer_3",
|
16 |
+
"steps": "48828"
|
17 |
},
|
18 |
"buffer": {
|
19 |
"d_submodule": 2304,
|
gemma-2-2b_sweep_standard_ctx128_ef8_0824/resid_post_layer_3/trainer_5/config.json
CHANGED
@@ -12,7 +12,8 @@
|
|
12 |
"layer": 3,
|
13 |
"lm_name": "google/gemma-2-2b",
|
14 |
"wandb_name": "StandardTrainer-google/gemma-2-2b-resid_post_layer_3",
|
15 |
-
"submodule_name": "resid_post_layer_3"
|
|
|
16 |
},
|
17 |
"buffer": {
|
18 |
"d_submodule": 2304,
|
|
|
12 |
"layer": 3,
|
13 |
"lm_name": "google/gemma-2-2b",
|
14 |
"wandb_name": "StandardTrainer-google/gemma-2-2b-resid_post_layer_3",
|
15 |
+
"submodule_name": "resid_post_layer_3",
|
16 |
+
"steps": "48828"
|
17 |
},
|
18 |
"buffer": {
|
19 |
"d_submodule": 2304,
|
gemma-2-2b_sweep_standard_ctx128_ef8_0824/resid_post_layer_7/trainer_0/config.json
CHANGED
@@ -12,7 +12,8 @@
|
|
12 |
"layer": 7,
|
13 |
"lm_name": "google/gemma-2-2b",
|
14 |
"wandb_name": "StandardTrainer-google/gemma-2-2b-resid_post_layer_7",
|
15 |
-
"submodule_name": "resid_post_layer_7"
|
|
|
16 |
},
|
17 |
"buffer": {
|
18 |
"d_submodule": 2304,
|
|
|
12 |
"layer": 7,
|
13 |
"lm_name": "google/gemma-2-2b",
|
14 |
"wandb_name": "StandardTrainer-google/gemma-2-2b-resid_post_layer_7",
|
15 |
+
"submodule_name": "resid_post_layer_7",
|
16 |
+
"steps": "48828"
|
17 |
},
|
18 |
"buffer": {
|
19 |
"d_submodule": 2304,
|
gemma-2-2b_sweep_standard_ctx128_ef8_0824/resid_post_layer_7/trainer_1/config.json
CHANGED
@@ -12,7 +12,8 @@
|
|
12 |
"layer": 7,
|
13 |
"lm_name": "google/gemma-2-2b",
|
14 |
"wandb_name": "StandardTrainer-google/gemma-2-2b-resid_post_layer_7",
|
15 |
-
"submodule_name": "resid_post_layer_7"
|
|
|
16 |
},
|
17 |
"buffer": {
|
18 |
"d_submodule": 2304,
|
|
|
12 |
"layer": 7,
|
13 |
"lm_name": "google/gemma-2-2b",
|
14 |
"wandb_name": "StandardTrainer-google/gemma-2-2b-resid_post_layer_7",
|
15 |
+
"submodule_name": "resid_post_layer_7",
|
16 |
+
"steps": "48828"
|
17 |
},
|
18 |
"buffer": {
|
19 |
"d_submodule": 2304,
|
gemma-2-2b_sweep_standard_ctx128_ef8_0824/resid_post_layer_7/trainer_2/config.json
CHANGED
@@ -12,7 +12,8 @@
|
|
12 |
"layer": 7,
|
13 |
"lm_name": "google/gemma-2-2b",
|
14 |
"wandb_name": "StandardTrainer-google/gemma-2-2b-resid_post_layer_7",
|
15 |
-
"submodule_name": "resid_post_layer_7"
|
|
|
16 |
},
|
17 |
"buffer": {
|
18 |
"d_submodule": 2304,
|
|
|
12 |
"layer": 7,
|
13 |
"lm_name": "google/gemma-2-2b",
|
14 |
"wandb_name": "StandardTrainer-google/gemma-2-2b-resid_post_layer_7",
|
15 |
+
"submodule_name": "resid_post_layer_7",
|
16 |
+
"steps": "48828"
|
17 |
},
|
18 |
"buffer": {
|
19 |
"d_submodule": 2304,
|
gemma-2-2b_sweep_standard_ctx128_ef8_0824/resid_post_layer_7/trainer_3/config.json
CHANGED
@@ -12,7 +12,8 @@
|
|
12 |
"layer": 7,
|
13 |
"lm_name": "google/gemma-2-2b",
|
14 |
"wandb_name": "StandardTrainer-google/gemma-2-2b-resid_post_layer_7",
|
15 |
-
"submodule_name": "resid_post_layer_7"
|
|
|
16 |
},
|
17 |
"buffer": {
|
18 |
"d_submodule": 2304,
|
|
|
12 |
"layer": 7,
|
13 |
"lm_name": "google/gemma-2-2b",
|
14 |
"wandb_name": "StandardTrainer-google/gemma-2-2b-resid_post_layer_7",
|
15 |
+
"submodule_name": "resid_post_layer_7",
|
16 |
+
"steps": "48828"
|
17 |
},
|
18 |
"buffer": {
|
19 |
"d_submodule": 2304,
|
gemma-2-2b_sweep_standard_ctx128_ef8_0824/resid_post_layer_7/trainer_4/config.json
CHANGED
@@ -12,7 +12,8 @@
|
|
12 |
"layer": 7,
|
13 |
"lm_name": "google/gemma-2-2b",
|
14 |
"wandb_name": "StandardTrainer-google/gemma-2-2b-resid_post_layer_7",
|
15 |
-
"submodule_name": "resid_post_layer_7"
|
|
|
16 |
},
|
17 |
"buffer": {
|
18 |
"d_submodule": 2304,
|
|
|
12 |
"layer": 7,
|
13 |
"lm_name": "google/gemma-2-2b",
|
14 |
"wandb_name": "StandardTrainer-google/gemma-2-2b-resid_post_layer_7",
|
15 |
+
"submodule_name": "resid_post_layer_7",
|
16 |
+
"steps": "48828"
|
17 |
},
|
18 |
"buffer": {
|
19 |
"d_submodule": 2304,
|
gemma-2-2b_sweep_standard_ctx128_ef8_0824/resid_post_layer_7/trainer_5/config.json
CHANGED
@@ -12,7 +12,8 @@
|
|
12 |
"layer": 7,
|
13 |
"lm_name": "google/gemma-2-2b",
|
14 |
"wandb_name": "StandardTrainer-google/gemma-2-2b-resid_post_layer_7",
|
15 |
-
"submodule_name": "resid_post_layer_7"
|
|
|
16 |
},
|
17 |
"buffer": {
|
18 |
"d_submodule": 2304,
|
|
|
12 |
"layer": 7,
|
13 |
"lm_name": "google/gemma-2-2b",
|
14 |
"wandb_name": "StandardTrainer-google/gemma-2-2b-resid_post_layer_7",
|
15 |
+
"submodule_name": "resid_post_layer_7",
|
16 |
+
"steps": "48828"
|
17 |
},
|
18 |
"buffer": {
|
19 |
"d_submodule": 2304,
|