huranokuma commited on
Commit
f15f7ba
1 Parent(s): d8524b1

End of training

Browse files
all_results.json CHANGED
@@ -1,15 +1,15 @@
1
  {
2
  "epoch": 2.0,
3
- "eval_accuracy": 0.7105720509450737,
4
- "eval_loss": 1.2192070484161377,
5
- "eval_runtime": 4409.7065,
6
  "eval_samples": 134942,
7
- "eval_samples_per_second": 30.601,
8
- "eval_steps_per_second": 7.65,
9
- "perplexity": 3.384502922346475,
10
- "train_loss": 1.4528967095198742,
11
- "train_runtime": 23861.4316,
12
  "train_samples": 134942,
13
- "train_samples_per_second": 11.31,
14
- "train_steps_per_second": 1.131
15
  }
 
1
  {
2
  "epoch": 2.0,
3
+ "eval_accuracy": 0.7436041304518132,
4
+ "eval_loss": 1.0827183723449707,
5
+ "eval_runtime": 4164.5239,
6
  "eval_samples": 134942,
7
+ "eval_samples_per_second": 32.403,
8
+ "eval_steps_per_second": 3.24,
9
+ "perplexity": 2.9526951763129543,
10
+ "train_loss": 0.05643905973204775,
11
+ "train_runtime": 943.9109,
12
  "train_samples": 134942,
13
+ "train_samples_per_second": 285.921,
14
+ "train_steps_per_second": 28.594
15
  }
eval_results.json CHANGED
@@ -1,10 +1,10 @@
1
  {
2
- "epoch": 3.0,
3
- "eval_accuracy": 0.7105720509450737,
4
- "eval_loss": 1.2192070484161377,
5
- "eval_runtime": 4409.7065,
6
  "eval_samples": 134942,
7
- "eval_samples_per_second": 30.601,
8
- "eval_steps_per_second": 7.65,
9
- "perplexity": 3.384502922346475
10
  }
 
1
  {
2
+ "epoch": 2.0,
3
+ "eval_accuracy": 0.7436041304518132,
4
+ "eval_loss": 1.0827183723449707,
5
+ "eval_runtime": 4164.5239,
6
  "eval_samples": 134942,
7
+ "eval_samples_per_second": 32.403,
8
+ "eval_steps_per_second": 3.24,
9
+ "perplexity": 2.9526951763129543
10
  }
runs/Aug19_01-34-35_ac5e0a9e9d4e/events.out.tfevents.1660878687.ac5e0a9e9d4e.2306.2 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f4272eecad0977928c92af9b3050ac1093aae3e57871407df9ac975512f8a30a
3
+ size 369
train_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "epoch": 2.0,
3
- "train_loss": 1.4528967095198742,
4
- "train_runtime": 23861.4316,
5
  "train_samples": 134942,
6
- "train_samples_per_second": 11.31,
7
- "train_steps_per_second": 1.131
8
  }
 
1
  {
2
  "epoch": 2.0,
3
+ "train_loss": 0.05643905973204775,
4
+ "train_runtime": 943.9109,
5
  "train_samples": 134942,
6
+ "train_samples_per_second": 285.921,
7
+ "train_steps_per_second": 28.594
8
  }
trainer_state.json CHANGED
@@ -329,10 +329,10 @@
329
  "epoch": 2.0,
330
  "step": 26990,
331
  "total_flos": 2.5064145824199475e+17,
332
- "train_loss": 1.4528967095198742,
333
- "train_runtime": 23861.4316,
334
- "train_samples_per_second": 11.31,
335
- "train_steps_per_second": 1.131
336
  }
337
  ],
338
  "max_steps": 26990,
 
329
  "epoch": 2.0,
330
  "step": 26990,
331
  "total_flos": 2.5064145824199475e+17,
332
+ "train_loss": 0.05643905973204775,
333
+ "train_runtime": 943.9109,
334
+ "train_samples_per_second": 285.921,
335
+ "train_steps_per_second": 28.594
336
  }
337
  ],
338
  "max_steps": 26990,