Upload folder using huggingface_hub
Browse files- checkpoints/torso[0].res_final_0.pt +3 -0
- checkpoints/torso[0].res_final_1024.pt +3 -0
- checkpoints/torso[0].res_final_1536.pt +3 -0
- checkpoints/torso[0].res_final_2048.pt +3 -0
- checkpoints/torso[0].res_final_512.pt +3 -0
- checkpoints/torso[1].attn_0.pt +3 -0
- checkpoints/torso[1].attn_1024.pt +3 -0
- checkpoints/torso[1].attn_1536.pt +3 -0
- checkpoints/torso[1].attn_2048.pt +3 -0
- checkpoints/torso[1].attn_512.pt +3 -0
- checkpoints/torso[1].res_final_0.pt +3 -0
- checkpoints/torso[1].res_final_1024.pt +3 -0
- checkpoints/torso[1].res_final_1536.pt +3 -0
- checkpoints/torso[1].res_final_2048.pt +3 -0
- checkpoints/torso[1].res_final_512.pt +3 -0
- checkpoints/torso[1].res_mlp_0.pt +3 -0
- checkpoints/torso[1].res_mlp_1024.pt +3 -0
- checkpoints/torso[1].res_mlp_1536.pt +3 -0
- checkpoints/torso[1].res_mlp_2048.pt +3 -0
- checkpoints/torso[1].res_mlp_512.pt +3 -0
- trainer_0/config.json +26 -0
- trainer_0/torso[0].res_final.pt +3 -0
- trainer_0/torso[1].attn.pt +3 -0
- trainer_0/torso[1].res_final.pt +3 -0
- trainer_0/torso[1].res_mlp.pt +3 -0
checkpoints/torso[0].res_final_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:97c6e916cbcd13b1865aa13704d9d6b6bc63ea69b284fd56b0b1eb2c23936be2
|
3 |
+
size 37778616
|
checkpoints/torso[0].res_final_1024.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:317dd681fb6666e82676c0fae726e1f25fea7ef6eed764d692e76e82f93a88c4
|
3 |
+
size 37778704
|
checkpoints/torso[0].res_final_1536.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cd50594a84c22cbcc2041de94b5177a82fe7058b1fc60c4ba3b178194e2ccd07
|
3 |
+
size 37778704
|
checkpoints/torso[0].res_final_2048.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3daa7c54a2abc478b8f8f115ba190ea96e9d3ceccbe77edfcc17611cabd6786b
|
3 |
+
size 37778704
|
checkpoints/torso[0].res_final_512.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:80c9b89d6f179aa22857a5fccaa3e3077a3baef71b20f09e7a4d6a05d1c32596
|
3 |
+
size 37778696
|
checkpoints/torso[1].attn_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f917464c3ce5df53bb10f1ccd084edd49f0ed66ebacea0d15a776cf90815e83c
|
3 |
+
size 37778576
|
checkpoints/torso[1].attn_1024.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:30614384b66e8e62b33618b1a40d2358722d9fef1388a212b253d0ccb6478812
|
3 |
+
size 37778600
|
checkpoints/torso[1].attn_1536.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f914a0356aa9dc13773a62973251145869611770ea9b06c8aa7b2531be2f4108
|
3 |
+
size 37778600
|
checkpoints/torso[1].attn_2048.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:08814ccb431906a4c4b51887c857e8e228e33563dc06da6d15bab92512097dd3
|
3 |
+
size 37778600
|
checkpoints/torso[1].attn_512.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3f5d528082161ae0027538ff0d218b7c1919e5b0faed7799e75457b128d148d6
|
3 |
+
size 37778592
|
checkpoints/torso[1].res_final_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8b5e834572edda79e57e9136fca9e4569c34517d91dd21ffc17a3158157fa98e
|
3 |
+
size 37778616
|
checkpoints/torso[1].res_final_1024.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:27ebae41aefd19d9d641ec91afcb50b88e5120103d5c8e83b64b48945ed6ae9b
|
3 |
+
size 37778704
|
checkpoints/torso[1].res_final_1536.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:292b8525853d7f12fd4e082d9fba99b981d88ac71c3b29372e066368b80f9450
|
3 |
+
size 37778704
|
checkpoints/torso[1].res_final_2048.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:acca2e57098dcf17eb134f3977b24a7f26f23e2cc337d8e2fd2869ba353f2c7f
|
3 |
+
size 37778704
|
checkpoints/torso[1].res_final_512.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4cb83a1119d313ae6355dda01038daba8bde8d8ba30f8f2da088cf2971faad0e
|
3 |
+
size 37778696
|
checkpoints/torso[1].res_mlp_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4cb903e0f743da72bee32af184e6a99805d72ef53124c0944ea5114a91a9c67a
|
3 |
+
size 37778600
|
checkpoints/torso[1].res_mlp_1024.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2769f2659064758fea8b6010ad6738f1bb06bd20d98936d449731018624e42c0
|
3 |
+
size 37778624
|
checkpoints/torso[1].res_mlp_1536.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:15923401ef3142e7315b974f991eb1caa9a16fa5f100ae7f1ccc4569cae8c5f0
|
3 |
+
size 37778624
|
checkpoints/torso[1].res_mlp_2048.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8dd08c010983a090333cc0e654934fbbca281ea0d1e7f4981542f0c563014ae6
|
3 |
+
size 37778624
|
checkpoints/torso[1].res_mlp_512.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1c723ac037924dfb9a7f11482119c8d03a6ba789f2542faf3eeadcf5ae7589d0
|
3 |
+
size 37778616
|
trainer_0/config.json
ADDED
@@ -0,0 +1,26 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"trainer": {
|
3 |
+
"trainer_class": "TrainerTopK",
|
4 |
+
"dict_class": "AutoEncoderTopK",
|
5 |
+
"lr": 0.00032659863237109043,
|
6 |
+
"steps": 30000,
|
7 |
+
"seed": null,
|
8 |
+
"activation_dim": 768,
|
9 |
+
"dict_size": 6144,
|
10 |
+
"k": 30,
|
11 |
+
"device": "cuda",
|
12 |
+
"layer": 1,
|
13 |
+
"lm_name": "TinyModel_2L_3E",
|
14 |
+
"wandb_name": "AutoEncoderTopK",
|
15 |
+
"submodule_name": null
|
16 |
+
},
|
17 |
+
"buffer": {
|
18 |
+
"d_submodule": 768,
|
19 |
+
"io": "out",
|
20 |
+
"n_ctxs": 128,
|
21 |
+
"ctx_len": 256,
|
22 |
+
"refresh_batch_size": 512,
|
23 |
+
"out_batch_size": 1024,
|
24 |
+
"device": "cuda"
|
25 |
+
}
|
26 |
+
}
|
trainer_0/torso[0].res_final.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2aed79529d3426e798dc33663775178e53c26b5154180f32042465d66ae6c766
|
3 |
+
size 37778600
|
trainer_0/torso[1].attn.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e12c625390e8db112d06a2746370e2314f6d4dda1f926861b7f8d0a315838ca7
|
3 |
+
size 37778560
|
trainer_0/torso[1].res_final.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1b390718550b3a0a63ba7ec28b8f776971fbe3396f4d6ae6abe528748f8ba005
|
3 |
+
size 37778600
|
trainer_0/torso[1].res_mlp.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:dd66710377024cd391477ccb23eb48ea433ccf6d8971a0666b2d98072fb421ad
|
3 |
+
size 37778584
|