Add files using large-upload tool
Browse files- dataset=rw/hparams=base_warmup=short_decay=kaplan/params=22M_maxstep=8662/flop_1.00e+17_step_1414.pt +2 -2
- dataset=rw/hparams=base_warmup=short_decay=kaplan/params=22M_maxstep=8662/flop_1.25e+16_step_177.pt +2 -2
- dataset=rw/hparams=base_warmup=short_decay=kaplan/params=22M_maxstep=8662/flop_2.00e+17_step_2828.pt +2 -2
- dataset=rw/hparams=base_warmup=short_decay=kaplan/params=22M_maxstep=8662/flop_2.50e+16_step_354.pt +2 -2
- dataset=rw/hparams=base_warmup=short_decay=kaplan/params=22M_maxstep=8662/flop_3.18e+15_step_45.pt +2 -2
- dataset=rw/hparams=base_warmup=short_decay=kaplan/params=22M_maxstep=8662/flop_4.00e+17_step_5655.pt +2 -2
- dataset=rw/hparams=base_warmup=short_decay=kaplan/params=22M_maxstep=8662/flop_5.00e+16_step_707.pt +2 -2
- dataset=rw/hparams=base_warmup=short_decay=kaplan/params=22M_maxstep=8662/flop_6.30e+15_step_89.pt +2 -2
- dataset=rw/hparams=base_warmup=short_decay=kaplan/params=84M_maxstep=32665/flop_1.00e+17_step_375.pt +2 -2
- dataset=rw/hparams=base_warmup=short_decay=kaplan/params=84M_maxstep=32665/flop_1.60e+18_step_5999.pt +2 -2
- dataset=rw/hparams=base_warmup=short_decay=kaplan/params=84M_maxstep=32665/flop_2.00e+17_step_750.pt +2 -2
- dataset=rw/hparams=base_warmup=short_decay=kaplan/params=84M_maxstep=32665/flop_2.51e+16_step_94.pt +2 -2
- dataset=rw/hparams=base_warmup=short_decay=kaplan/params=84M_maxstep=32665/flop_3.20e+18_step_11998.pt +2 -2
- dataset=rw/hparams=base_warmup=short_decay=kaplan/params=84M_maxstep=32665/flop_4.00e+17_step_1500.pt +2 -2
- dataset=rw/hparams=base_warmup=short_decay=kaplan/params=84M_maxstep=32665/flop_5.01e+16_step_188.pt +2 -2
- dataset=rw/hparams=base_warmup=short_decay=kaplan/params=84M_maxstep=32665/flop_6.40e+18_step_23996.pt +2 -2
- dataset=rw/hparams=base_warmup=short_decay=kaplan/params=84M_maxstep=32665/flop_8.00e+17_step_3000.pt +2 -2
- dataset=rw/hparams=base_warmup=short_decay=kaplan/params=901M_maxstep=9170/flop_1.28e+19_step_4513.pt +2 -2
- dataset=rw/hparams=base_warmup=short_decay=kaplan/params=901M_maxstep=9170/flop_1.60e+18_step_565.pt +2 -2
- dataset=rw/hparams=base_warmup=short_decay=kaplan/params=901M_maxstep=9170/flop_2.01e+17_step_71.pt +2 -2
- dataset=rw/hparams=base_warmup=short_decay=kaplan/params=901M_maxstep=9170/flop_3.20e+18_step_1129.pt +2 -2
- dataset=rw/hparams=tuned_warmup=long_decay=const/params=15M_maxstep=69220/flop_2.00e+17_step_23716.pt +2 -2
- dataset=rw/hparams=tuned_warmup=long_decay=const/params=15M_maxstep=69220/flop_3.13e+15_step_371.pt +2 -2
- dataset=rw/hparams=tuned_warmup=long_decay=const/params=15M_maxstep=69220/flop_4.00e+17_step_47432.pt +2 -2
- dataset=rw/hparams=tuned_warmup=long_decay=const/params=15M_maxstep=69220/flop_6.26e+15_step_742.pt +2 -2
dataset=rw/hparams=base_warmup=short_decay=kaplan/params=22M_maxstep=8662/flop_1.00e+17_step_1414.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3a14bdba0980834e107969ec3fb3918d879a6c0a6e08642893afe5f54837973f
|
3 |
+
size 148162057
|
dataset=rw/hparams=base_warmup=short_decay=kaplan/params=22M_maxstep=8662/flop_1.25e+16_step_177.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:38ecc6d79cd11949e6bb71ae3477644cfd1ed5a5455fe234828d71c6b740e124
|
3 |
+
size 148161947
|
dataset=rw/hparams=base_warmup=short_decay=kaplan/params=22M_maxstep=8662/flop_2.00e+17_step_2828.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b1ba51d34874934f2ae65dae9edbd4745079d865474e51d74aface016fdc9bdd
|
3 |
+
size 148162057
|
dataset=rw/hparams=base_warmup=short_decay=kaplan/params=22M_maxstep=8662/flop_2.50e+16_step_354.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:af85b2dcd2f720e64d55dad2994ee188f214890e11c4d997a5ec14e87d9c0f67
|
3 |
+
size 148161947
|
dataset=rw/hparams=base_warmup=short_decay=kaplan/params=22M_maxstep=8662/flop_3.18e+15_step_45.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:baacecefe6adbb3004c98ae6d96da6392db67628d917cc6cfb0f43b00bbd9d96
|
3 |
+
size 148161773
|
dataset=rw/hparams=base_warmup=short_decay=kaplan/params=22M_maxstep=8662/flop_4.00e+17_step_5655.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5c9e7194906687d8e680ebfdd03c64b4af6ba5c0ca039aaf2cdd9a3587d0da29
|
3 |
+
size 148162057
|
dataset=rw/hparams=base_warmup=short_decay=kaplan/params=22M_maxstep=8662/flop_5.00e+16_step_707.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:324092ae5f4bd16af5284e016b54423fb947fecdb9095ddd431a93637ee7853f
|
3 |
+
size 148161947
|
dataset=rw/hparams=base_warmup=short_decay=kaplan/params=22M_maxstep=8662/flop_6.30e+15_step_89.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:630c0a9357857d298975443c4a9bade5d1a46cd1bbdc4f0bc36889bfad89597f
|
3 |
+
size 148161773
|
dataset=rw/hparams=base_warmup=short_decay=kaplan/params=84M_maxstep=32665/flop_1.00e+17_step_375.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9c7430ff5cea89d15179a77d8e682a31ebe3b9d8f0f6d520834afe1b3053dce2
|
3 |
+
size 455677969
|
dataset=rw/hparams=base_warmup=short_decay=kaplan/params=84M_maxstep=32665/flop_1.60e+18_step_5999.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7dc51d76dba6609991adadb6d6d4e4a8714175d50ffc0da58e2a88981b566a0f
|
3 |
+
size 455678157
|
dataset=rw/hparams=base_warmup=short_decay=kaplan/params=84M_maxstep=32665/flop_2.00e+17_step_750.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d22631320b31e6e561f9c648e89a6bc33d3c4103ab3b0f0250822716c184d7c4
|
3 |
+
size 455677969
|
dataset=rw/hparams=base_warmup=short_decay=kaplan/params=84M_maxstep=32665/flop_2.51e+16_step_94.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:439bb448e487e70f3399589a24e0bdd0a030bdde2546740e120a751e51b8abeb
|
3 |
+
size 455677717
|
dataset=rw/hparams=base_warmup=short_decay=kaplan/params=84M_maxstep=32665/flop_3.20e+18_step_11998.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:422ed27030573ec3035e2c3fc281b94c9b10de5771ac8240ad2b69352000bd93
|
3 |
+
size 455678345
|
dataset=rw/hparams=base_warmup=short_decay=kaplan/params=84M_maxstep=32665/flop_4.00e+17_step_1500.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:dc01890e6eaface9811916c31d6fcbc57e89c19b75b10094abe71ee2085ae8dc
|
3 |
+
size 455678157
|
dataset=rw/hparams=base_warmup=short_decay=kaplan/params=84M_maxstep=32665/flop_5.01e+16_step_188.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4598da2662394d86db40422a3ad2329719025475fc58f7175502ceeab9455b77
|
3 |
+
size 455677969
|
dataset=rw/hparams=base_warmup=short_decay=kaplan/params=84M_maxstep=32665/flop_6.40e+18_step_23996.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6ea2e2618a2d445658b466b9cd8ee2d6b316d0811646f595c916d79897819640
|
3 |
+
size 455678345
|
dataset=rw/hparams=base_warmup=short_decay=kaplan/params=84M_maxstep=32665/flop_8.00e+17_step_3000.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e0c0a54264829e63ad12dbedce8097dd6b532dfc3cc83c5f89f14fbbe0ec9d9c
|
3 |
+
size 455678157
|
dataset=rw/hparams=base_warmup=short_decay=kaplan/params=901M_maxstep=9170/flop_1.28e+19_step_4513.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e2935e37a33637c71ec7e967ab814b135fc7288ea29fe3e8a7f4772b01bbe004
|
3 |
+
size 3911926829
|
dataset=rw/hparams=base_warmup=short_decay=kaplan/params=901M_maxstep=9170/flop_1.60e+18_step_565.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ed868624c760749d76e6efe503bc1c355b4e4756f2d1fc941a916e96061652ef
|
3 |
+
size 3911925921
|
dataset=rw/hparams=base_warmup=short_decay=kaplan/params=901M_maxstep=9170/flop_2.01e+17_step_71.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:525825f5a7bfec80e16b0030020e3a06e904d683a8d21b95050af2589e7ee6a2
|
3 |
+
size 3911924053
|
dataset=rw/hparams=base_warmup=short_decay=kaplan/params=901M_maxstep=9170/flop_3.20e+18_step_1129.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:782111aa1415795fa8ce5410e6dbabdc269221c327b81bf7f8be90b982cad323
|
3 |
+
size 3911926829
|
dataset=rw/hparams=tuned_warmup=long_decay=const/params=15M_maxstep=69220/flop_2.00e+17_step_23716.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d52d23542bf6f7e0564d5d8e5a2edbe8d51ff2d88690563b6d289d78c10a8a0f
|
3 |
+
size 107652547
|
dataset=rw/hparams=tuned_warmup=long_decay=const/params=15M_maxstep=69220/flop_3.13e+15_step_371.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7f934ff3c1d5c49c77bc6694ef631f1590fccac479e54e2dfc6cbc6e1592936a
|
3 |
+
size 107651995
|
dataset=rw/hparams=tuned_warmup=long_decay=const/params=15M_maxstep=69220/flop_4.00e+17_step_47432.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:34d67cbe28056d96dc5206f785bdcdd8d4d628832f5b08225d53a11bcce5a326
|
3 |
+
size 107652547
|
dataset=rw/hparams=tuned_warmup=long_decay=const/params=15M_maxstep=69220/flop_6.26e+15_step_742.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6ad8cc9381292008b9e774d8205f816ea3548817a1c07be534725980a9d7d912
|
3 |
+
size 107651995
|