Auto Commit
Browse files- lambda_2_16k.pt +3 -0
- lambda_2_16k_cfg.json +1 -0
- lambda_2_64k.pt +3 -0
- lambda_2_64k_cfg.json +1 -0
- lambda_5_16k.pt +3 -0
- lambda_5_16k_cfg.json +1 -0
lambda_2_16k.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9a0fe05356a85bbc8744e5960a79eceed90fccabdc9726d38593ea4fc3dcc18b
|
3 |
+
size 1208063992
|
lambda_2_16k_cfg.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"seed": 49, "batch_size": 2048, "buffer_mult": 512, "lr": 2e-05, "num_tokens": 1073741824, "l1_coeff": 2, "beta1": 0.9, "beta2": 0.999, "dict_size": 16384, "seq_len": 1024, "enc_dtype": "fp32", "model_name": "gpt2-small", "site": "resid_post", "device": "cuda:0", "model_batch_size": 32, "log_every": 100, "save_every": 30000, "dec_init_norm": 0.005, "name": "gpt2-small_16384_resid_post"}
|
lambda_2_64k.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:25d08fe4595466ff8401e18cfaee095c7ee45ae977665e81619f7ea92992bce1
|
3 |
+
size 4832139312
|
lambda_2_64k_cfg.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"seed": 51, "batch_size": 2048, "buffer_mult": 512, "lr": 2e-05, "num_tokens": 400000000, "l1_coeff": 2, "beta1": 0.9, "beta2": 0.999, "dict_size": 65536, "seq_len": 1024, "enc_dtype": "fp32", "model_name": "gpt2-small", "site": "resid_post", "device": "cuda:0", "model_batch_size": 32, "log_every": 100, "save_every": 100000, "dec_init_norm": 0.005, "name": "gpt2-small_65536_resid_post"}
|
lambda_5_16k.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cc4b9213d50bd8cfca579bc06ffa7b1a6a06d41ea2370c6e3c5c279e50fabeff
|
3 |
+
size 1208063992
|
lambda_5_16k_cfg.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"seed": 49, "batch_size": 2048, "buffer_mult": 512, "lr": 2e-05, "num_tokens": 1073741824, "l1_coeff": 5, "beta1": 0.9, "beta2": 0.999, "dict_size": 16384, "seq_len": 1024, "enc_dtype": "fp32", "model_name": "gpt2-small", "site": "resid_post", "device": "cuda:0", "model_batch_size": 32, "log_every": 100, "save_every": 30000, "dec_init_norm": 0.005, "name": "gpt2-small_16384_resid_post"}
|