NeelNanda commited on
Commit
6bcc245
1 Parent(s): 87219b0

Auto Commit

Browse files
Files changed (44) hide show
  1. 26.pt +3 -0
  2. 26_cfg.json +1 -0
  3. 27.pt +3 -0
  4. 27_cfg.json +1 -0
  5. 28.pt +3 -0
  6. 28_cfg.json +1 -0
  7. 29.pt +3 -0
  8. 29_cfg.json +1 -0
  9. 30.pt +3 -0
  10. 30_cfg.json +1 -0
  11. 31.pt +3 -0
  12. 31_cfg.json +1 -0
  13. 32.pt +3 -0
  14. 32_cfg.json +1 -0
  15. 33.pt +3 -0
  16. 33_cfg.json +1 -0
  17. 34.pt +3 -0
  18. 34_cfg.json +1 -0
  19. 35.pt +3 -0
  20. 35_cfg.json +1 -0
  21. 36.pt +3 -0
  22. 36_cfg.json +1 -0
  23. 37.pt +3 -0
  24. 37_cfg.json +1 -0
  25. 38.pt +3 -0
  26. 38_cfg.json +1 -0
  27. 39.pt +3 -0
  28. 39_cfg.json +1 -0
  29. 40.pt +3 -0
  30. 40_cfg.json +1 -0
  31. 41.pt +3 -0
  32. 41_cfg.json +1 -0
  33. 42.pt +3 -0
  34. 42_cfg.json +1 -0
  35. 43.pt +3 -0
  36. 43_cfg.json +1 -0
  37. 44.pt +3 -0
  38. 44_cfg.json +1 -0
  39. 45.pt +3 -0
  40. 45_cfg.json +1 -0
  41. 46.pt +3 -0
  42. 46_cfg.json +1 -0
  43. 47.pt +3 -0
  44. 47_cfg.json +1 -0
26.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3a15430d658f85c828bbc8b13935703be5e9b0bdf4aeda9e4bdca0086262a05c
3
+ size 268510529
26_cfg.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"seed": 54, "batch_size": 4096, "buffer_mult": 384, "lr": 0.0001, "num_tokens": 2000000000, "l1_coeff": 0.0003, "beta1": 0.9, "beta2": 0.99, "dict_mult": 8, "seq_len": 128, "d_mlp": 2048, "enc_dtype": "fp32", "remove_rare_dir": true, "model_batch_size": 512, "buffer_size": 1572864, "buffer_batches": 12288}
27.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e71a4f89a66a4b7c23c94e1693dd8f9e5e3dcd994e39aea54f5e60b65ad2ed3c
3
+ size 268510529
27_cfg.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"seed": 54, "batch_size": 4096, "buffer_mult": 384, "lr": 0.0001, "num_tokens": 2000000000, "l1_coeff": 0.0003, "beta1": 0.9, "beta2": 0.99, "dict_mult": 8, "seq_len": 128, "d_mlp": 2048, "enc_dtype": "fp32", "remove_rare_dir": true, "model_batch_size": 512, "buffer_size": 1572864, "buffer_batches": 12288}
28.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ac0377f18a4b6c5d66ef8b4d9922c5280a1d395f659295200148671ad0ee7253
3
+ size 268510529
28_cfg.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"seed": 54, "batch_size": 4096, "buffer_mult": 384, "lr": 0.0001, "num_tokens": 2000000000, "l1_coeff": 0.0003, "beta1": 0.9, "beta2": 0.99, "dict_mult": 8, "seq_len": 128, "d_mlp": 2048, "enc_dtype": "fp32", "remove_rare_dir": true, "model_batch_size": 512, "buffer_size": 1572864, "buffer_batches": 12288}
29.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1be40582e8b1afa58742846323c30cd2361e1b73c63da3f3495bb95e4faa87f9
3
+ size 268510529
29_cfg.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"seed": 54, "batch_size": 4096, "buffer_mult": 384, "lr": 0.0001, "num_tokens": 2000000000, "l1_coeff": 0.0003, "beta1": 0.9, "beta2": 0.99, "dict_mult": 8, "seq_len": 128, "d_mlp": 2048, "enc_dtype": "fp32", "remove_rare_dir": true, "model_batch_size": 512, "buffer_size": 1572864, "buffer_batches": 12288}
30.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:582ff82a7fc23db58c5b67bc3f7b3ceddf496cc91f9e208a79e8270379d2bb75
3
+ size 268510529
30_cfg.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"seed": 52, "batch_size": 4096, "buffer_mult": 384, "lr": 0.0001, "num_tokens": 2000000000, "l1_coeff": 0.0003, "beta1": 0.9, "beta2": 0.99, "dict_mult": 8, "seq_len": 128, "d_mlp": 2048, "enc_dtype": "fp32", "remove_rare_dir": true, "model_batch_size": 512, "buffer_size": 1572864, "buffer_batches": 12288}
31.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9716596386d8e01357ad4f672546f77f74635a33c44d8ff83ed97b92c5071526
3
+ size 268510529
31_cfg.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"seed": 55, "batch_size": 4096, "buffer_mult": 384, "lr": 0.0001, "num_tokens": 2000000000, "l1_coeff": 0.0003, "beta1": 0.9, "beta2": 0.99, "dict_mult": 8, "seq_len": 128, "d_mlp": 2048, "enc_dtype": "fp32", "remove_rare_dir": false, "model_batch_size": 512, "buffer_size": 1572864, "buffer_batches": 12288}
32.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c1b24bebcd0575ebf8129e4bf75fd1b22c78eee5dc3ccf2d6525bf40dfed655b
3
+ size 268510529
32_cfg.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"seed": 55, "batch_size": 4096, "buffer_mult": 384, "lr": 0.0001, "num_tokens": 2000000000, "l1_coeff": 0.0003, "beta1": 0.9, "beta2": 0.99, "dict_mult": 8, "seq_len": 128, "d_mlp": 2048, "enc_dtype": "fp32", "remove_rare_dir": false, "model_batch_size": 512, "buffer_size": 1572864, "buffer_batches": 12288}
33.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f5729f67d753baab362565d4919893b9370f7f3df61ba4e6bc46df460422473a
3
+ size 268510529
33_cfg.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"seed": 55, "batch_size": 4096, "buffer_mult": 384, "lr": 0.0001, "num_tokens": 2000000000, "l1_coeff": 0.0003, "beta1": 0.9, "beta2": 0.99, "dict_mult": 8, "seq_len": 128, "d_mlp": 2048, "enc_dtype": "fp32", "remove_rare_dir": false, "model_batch_size": 512, "buffer_size": 1572864, "buffer_batches": 12288}
34.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8b2c212c37ed2d7d0e79542d21392588756f4d5dd2318ad962b12b366f8be4c7
3
+ size 268510529
34_cfg.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"seed": 55, "batch_size": 4096, "buffer_mult": 384, "lr": 0.0001, "num_tokens": 2000000000, "l1_coeff": 0.0003, "beta1": 0.9, "beta2": 0.99, "dict_mult": 8, "seq_len": 128, "d_mlp": 2048, "enc_dtype": "fp32", "remove_rare_dir": false, "model_batch_size": 512, "buffer_size": 1572864, "buffer_batches": 12288}
35.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2286cdaad50e6786721239273b255a45754ed37c45b4f1f16640defbc27d8e3b
3
+ size 268510529
35_cfg.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"seed": 55, "batch_size": 4096, "buffer_mult": 384, "lr": 0.0001, "num_tokens": 2000000000, "l1_coeff": 0.0003, "beta1": 0.9, "beta2": 0.99, "dict_mult": 8, "seq_len": 128, "d_mlp": 2048, "enc_dtype": "fp32", "remove_rare_dir": false, "model_batch_size": 512, "buffer_size": 1572864, "buffer_batches": 12288}
36.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e0ee72407e569a6b30c70c4e618477a0aa10f44a3df4bf2ee59bd2d4fabfdcea
3
+ size 268510529
36_cfg.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"seed": 55, "batch_size": 4096, "buffer_mult": 384, "lr": 0.0001, "num_tokens": 2000000000, "l1_coeff": 0.0003, "beta1": 0.9, "beta2": 0.99, "dict_mult": 8, "seq_len": 128, "d_mlp": 2048, "enc_dtype": "fp32", "remove_rare_dir": false, "model_batch_size": 512, "buffer_size": 1572864, "buffer_batches": 12288}
37.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ef5847874fbe0b8bbb163605db29e40a13d775bdb57c99e46c29f7242e28d587
3
+ size 268510529
37_cfg.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"seed": 55, "batch_size": 4096, "buffer_mult": 384, "lr": 0.0001, "num_tokens": 2000000000, "l1_coeff": 0.0003, "beta1": 0.9, "beta2": 0.99, "dict_mult": 8, "seq_len": 128, "d_mlp": 2048, "enc_dtype": "fp32", "remove_rare_dir": false, "model_batch_size": 512, "buffer_size": 1572864, "buffer_batches": 12288}
38.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1bc9a27cf67da3ea2aa79ad69728425cec111e0b5d88ffa97b53b61a8abd72bf
3
+ size 268510529
38_cfg.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"seed": 55, "batch_size": 4096, "buffer_mult": 384, "lr": 0.0001, "num_tokens": 2000000000, "l1_coeff": 0.0003, "beta1": 0.9, "beta2": 0.99, "dict_mult": 8, "seq_len": 128, "d_mlp": 2048, "enc_dtype": "fp32", "remove_rare_dir": false, "model_batch_size": 512, "buffer_size": 1572864, "buffer_batches": 12288}
39.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c7d2d51a6be313d0004500df3316823393e3e2219e2cd56362af9d6545f94b00
3
+ size 268510529
39_cfg.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"seed": 55, "batch_size": 4096, "buffer_mult": 384, "lr": 0.0001, "num_tokens": 2000000000, "l1_coeff": 0.0003, "beta1": 0.9, "beta2": 0.99, "dict_mult": 8, "seq_len": 128, "d_mlp": 2048, "enc_dtype": "fp32", "remove_rare_dir": false, "model_batch_size": 512, "buffer_size": 1572864, "buffer_batches": 12288}
40.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:19304e5c419a46b2d32fa9ac3122164eb33ffcf45a91aa278c35dffb1a2079c1
3
+ size 268510529
40_cfg.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"seed": 55, "batch_size": 4096, "buffer_mult": 384, "lr": 0.0001, "num_tokens": 2000000000, "l1_coeff": 0.0003, "beta1": 0.9, "beta2": 0.99, "dict_mult": 8, "seq_len": 128, "d_mlp": 2048, "enc_dtype": "fp32", "remove_rare_dir": false, "model_batch_size": 512, "buffer_size": 1572864, "buffer_batches": 12288}
41.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2e3f311631023ab5669fca728425394eb4b41150b8be59f1e70f744774cdc533
3
+ size 268510529
41_cfg.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"seed": 55, "batch_size": 4096, "buffer_mult": 384, "lr": 0.0001, "num_tokens": 2000000000, "l1_coeff": 0.0003, "beta1": 0.9, "beta2": 0.99, "dict_mult": 8, "seq_len": 128, "d_mlp": 2048, "enc_dtype": "fp32", "remove_rare_dir": false, "model_batch_size": 512, "buffer_size": 1572864, "buffer_batches": 12288}
42.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3aa702ddfadd82423aea11e328d6f4b276b5ed431a0fefa8db40182efd3ac1d1
3
+ size 268510529
42_cfg.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"seed": 55, "batch_size": 4096, "buffer_mult": 384, "lr": 0.0001, "num_tokens": 2000000000, "l1_coeff": 0.0003, "beta1": 0.9, "beta2": 0.99, "dict_mult": 8, "seq_len": 128, "d_mlp": 2048, "enc_dtype": "fp32", "remove_rare_dir": false, "model_batch_size": 512, "buffer_size": 1572864, "buffer_batches": 12288}
43.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:98961532116608ec7eb5764a176bcb4e30693677c10c586f09719043c4c7be90
3
+ size 268510529
43_cfg.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"seed": 55, "batch_size": 4096, "buffer_mult": 384, "lr": 0.0001, "num_tokens": 2000000000, "l1_coeff": 0.0003, "beta1": 0.9, "beta2": 0.99, "dict_mult": 8, "seq_len": 128, "d_mlp": 2048, "enc_dtype": "fp32", "remove_rare_dir": false, "model_batch_size": 512, "buffer_size": 1572864, "buffer_batches": 12288}
44.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cad4fb29ec6f8eb70f9ecb7037c8dad50d2fdceaa4dd9473815ee411fafd0902
3
+ size 268510529
44_cfg.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"seed": 55, "batch_size": 4096, "buffer_mult": 384, "lr": 0.0001, "num_tokens": 2000000000, "l1_coeff": 0.0003, "beta1": 0.9, "beta2": 0.99, "dict_mult": 8, "seq_len": 128, "d_mlp": 2048, "enc_dtype": "fp32", "remove_rare_dir": false, "model_batch_size": 512, "buffer_size": 1572864, "buffer_batches": 12288}
45.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ea553092d14f6404ebee511161cb03e92188026ff34ba1b3d6653f8c48cfb1f7
3
+ size 268510529
45_cfg.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"seed": 55, "batch_size": 4096, "buffer_mult": 384, "lr": 0.0001, "num_tokens": 2000000000, "l1_coeff": 0.0003, "beta1": 0.9, "beta2": 0.99, "dict_mult": 8, "seq_len": 128, "d_mlp": 2048, "enc_dtype": "fp32", "remove_rare_dir": false, "model_batch_size": 512, "buffer_size": 1572864, "buffer_batches": 12288}
46.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f08d675863e1b63b573a44fd0b488d3944472e1207e10c6e1f94462c5d38a7da
3
+ size 268510529
46_cfg.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"seed": 55, "batch_size": 4096, "buffer_mult": 384, "lr": 0.0001, "num_tokens": 2000000000, "l1_coeff": 0.0003, "beta1": 0.9, "beta2": 0.99, "dict_mult": 8, "seq_len": 128, "d_mlp": 2048, "enc_dtype": "fp32", "remove_rare_dir": false, "model_batch_size": 512, "buffer_size": 1572864, "buffer_batches": 12288}
47.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:05fff1837dbc55b5bda590721418bb358ab330bee666763c7a09debf5e46c7cc
3
+ size 268510529
47_cfg.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"seed": 55, "batch_size": 4096, "buffer_mult": 384, "lr": 0.0001, "num_tokens": 2000000000, "l1_coeff": 0.0003, "beta1": 0.9, "beta2": 0.99, "dict_mult": 8, "seq_len": 128, "d_mlp": 2048, "enc_dtype": "fp32", "remove_rare_dir": false, "model_batch_size": 512, "buffer_size": 1572864, "buffer_batches": 12288}