againeureka committed on
Commit
df79964
1 Parent(s): ccf8543

Training in progress, epoch 1

Browse files
all_results.json CHANGED
@@ -1,13 +1,13 @@
1
  {
2
- "epoch": 5.0,
3
- "eval_accuracy": 0.6806201550387597,
4
- "eval_f1": 0.6840902663045194,
5
- "eval_loss": 0.9185293316841125,
6
- "eval_precision": 0.6816018176108884,
7
- "eval_recall": 0.6891996507429815,
8
- "eval_runtime": 1.3071,
9
- "eval_samples_per_second": 1480.362,
10
- "eval_steps_per_second": 92.57,
11
  "total_flos": 754719218037696.0,
12
  "train_loss": 1.1282823350694444,
13
  "train_runtime": 131.3823,
 
1
  {
2
+ "epoch": 20.0,
3
+ "eval_accuracy": 0.7198966408268734,
4
+ "eval_f1": 0.7338769816146858,
5
+ "eval_loss": 0.7918534278869629,
6
+ "eval_precision": 0.7640706423838897,
7
+ "eval_recall": 0.729299205718119,
8
+ "eval_runtime": 1.3335,
9
+ "eval_samples_per_second": 1451.123,
10
+ "eval_steps_per_second": 90.742,
11
  "total_flos": 754719218037696.0,
12
  "train_loss": 1.1282823350694444,
13
  "train_runtime": 131.3823,
config.json CHANGED
@@ -46,5 +46,5 @@
46
  "transformers_version": "4.28.1",
47
  "type_vocab_size": 1,
48
  "use_cache": true,
49
- "vocab_size": 32000
50
  }
 
46
  "transformers_version": "4.28.1",
47
  "type_vocab_size": 1,
48
  "use_cache": true,
49
+ "vocab_size": 64000
50
  }
eval_results.json CHANGED
@@ -1,11 +1,11 @@
1
  {
2
- "epoch": 5.0,
3
- "eval_accuracy": 0.6806201550387597,
4
- "eval_f1": 0.6840902663045194,
5
- "eval_loss": 0.9185293316841125,
6
- "eval_precision": 0.6816018176108884,
7
- "eval_recall": 0.6891996507429815,
8
- "eval_runtime": 1.3071,
9
- "eval_samples_per_second": 1480.362,
10
- "eval_steps_per_second": 92.57
11
  }
 
1
  {
2
+ "epoch": 20.0,
3
+ "eval_accuracy": 0.7198966408268734,
4
+ "eval_f1": 0.7338769816146858,
5
+ "eval_loss": 0.7918534278869629,
6
+ "eval_precision": 0.7640706423838897,
7
+ "eval_recall": 0.729299205718119,
8
+ "eval_runtime": 1.3335,
9
+ "eval_samples_per_second": 1451.123,
10
+ "eval_steps_per_second": 90.742
11
  }
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9f5ad5e594666af0628df2bb14984ddd11e2ed23adf234529b98597fc6907de1
3
- size 442570421
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:abdc64afa8c66a3779e32859c0132fcd2622bdd226626e0e718f975e4ef391c5
3
+ size 540874421
tokenizer.json CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:fc88a803ad3114200710eeef2106ecff7b5ac010352201b52b17aa62e2fffb9b
3
- size 1183633
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b3a056aae61d5414af2cb841a485ca0bc4196ee7565d3f16ddf008c222af30e0
3
+ size 2571002
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:015ae39930c9e6a6683ff3a993d73d30657f746bb41ff7906468b63cf8d766ec
3
  size 3579
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c13e86d83e428fb00aebe6068e791e3fb5fc91ab508f5bbf1089e140f2ac8760
3
  size 3579
vocab.txt CHANGED
The diff for this file is too large to render. See raw diff