Upload folder using huggingface_hub
Browse files- config.json +14 -0
- nGPT_best.pt +3 -0
- nGPT_checkpoint_0.pt +3 -0
- nGPT_checkpoint_50000.pt +3 -0
- nGPT_checkpoint_latest.pt +3 -0
- nGPT_final.pt +3 -0
- training.log +0 -0
config.json
ADDED
@@ -0,0 +1,14 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"num_batches": 100000,
|
3 |
+
"batch_size": 4,
|
4 |
+
"grad_accum_every": 4,
|
5 |
+
"learning_rate": 0.001,
|
6 |
+
"validate_every": 100,
|
7 |
+
"prime_length": 128,
|
8 |
+
"generate_every": 500,
|
9 |
+
"generate_length": 512,
|
10 |
+
"seq_len": 512,
|
11 |
+
"use_amp": true,
|
12 |
+
"use_parametrize": true,
|
13 |
+
"device": "cuda:0"
|
14 |
+
}
|
nGPT_best.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:028dee2daed30c5f44902d8b537f4de7c16455469556620b25d997e40f6c0cbe
|
3 |
+
size 304068666
|
nGPT_checkpoint_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:35caf7bb402298f4926804b35743c42c93372cfab485f197bc5de4f73856aada
|
3 |
+
size 304071842
|
nGPT_checkpoint_50000.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2431af8a4c9bb9a8a7bc505430b715a17ae8f14c46ee94b6bc9eb7066fa79f85
|
3 |
+
size 304073430
|
nGPT_checkpoint_latest.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5f71b1c0e3d92158f719a40d26e8775ebfd35988f7c84d7bfcc758dfe9ea7726
|
3 |
+
size 304073891
|
nGPT_final.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:68f01173ad320bb63d74d9dc92dfbca6ae1bca629433f31eb921ab850cb3f75c
|
3 |
+
size 101368482
|
training.log
ADDED
The diff for this file is too large to render.
See raw diff
|
|