SushantGautam commited on
Commit
7eed6ef
1 Parent(s): 393d294

End of training

Browse files
all_results.json CHANGED
@@ -1,28 +1,28 @@
1
  {
2
- "epoch": 3.0,
3
- "eval_gen_len": 236.2392,
4
- "eval_loss": 1.5022238492965698,
5
- "eval_rouge1": 50.8664,
6
- "eval_rouge2": 26.5857,
7
- "eval_rougeL": 31.1338,
8
- "eval_rougeLsum": 48.4801,
9
- "eval_runtime": 1527.8305,
10
  "eval_samples": 1568,
11
- "eval_samples_per_second": 1.026,
12
- "eval_steps_per_second": 0.043,
13
- "predict_gen_len": 236.2392,
14
- "predict_loss": 1.5022238492965698,
15
- "predict_rouge1": 50.8664,
16
- "predict_rouge2": 26.5857,
17
- "predict_rougeL": 31.1338,
18
- "predict_rougeLsum": 48.4801,
19
- "predict_runtime": 1525.7443,
20
  "predict_samples": 1568,
21
- "predict_samples_per_second": 1.028,
22
- "predict_steps_per_second": 0.043,
23
- "train_loss": 1.6923205314095087,
24
- "train_runtime": 822.2959,
25
  "train_samples": 6271,
26
- "train_samples_per_second": 22.879,
27
- "train_steps_per_second": 0.956
28
  }
 
1
  {
2
+ "epoch": 10.0,
3
+ "eval_gen_len": 248.1199,
4
+ "eval_loss": 1.275891661643982,
5
+ "eval_rouge1": 52.3608,
6
+ "eval_rouge2": 27.6526,
7
+ "eval_rougeL": 31.8509,
8
+ "eval_rougeLsum": 49.9086,
9
+ "eval_runtime": 1504.8405,
10
  "eval_samples": 1568,
11
+ "eval_samples_per_second": 1.042,
12
+ "eval_steps_per_second": 0.029,
13
+ "predict_gen_len": 248.1199,
14
+ "predict_loss": 1.275891661643982,
15
+ "predict_rouge1": 52.3608,
16
+ "predict_rouge2": 27.6526,
17
+ "predict_rougeL": 31.8509,
18
+ "predict_rougeLsum": 49.9086,
19
+ "predict_runtime": 1513.1914,
20
  "predict_samples": 1568,
21
+ "predict_samples_per_second": 1.036,
22
+ "predict_steps_per_second": 0.029,
23
+ "train_loss": 1.389875247819083,
24
+ "train_runtime": 2378.4813,
25
  "train_samples": 6271,
26
+ "train_samples_per_second": 26.366,
27
+ "train_steps_per_second": 0.736
28
  }
eval_results.json CHANGED
@@ -1,13 +1,13 @@
1
  {
2
- "epoch": 3.0,
3
- "eval_gen_len": 236.2392,
4
- "eval_loss": 1.5022238492965698,
5
- "eval_rouge1": 50.8664,
6
- "eval_rouge2": 26.5857,
7
- "eval_rougeL": 31.1338,
8
- "eval_rougeLsum": 48.4801,
9
- "eval_runtime": 1527.8305,
10
  "eval_samples": 1568,
11
- "eval_samples_per_second": 1.026,
12
- "eval_steps_per_second": 0.043
13
  }
 
1
  {
2
+ "epoch": 10.0,
3
+ "eval_gen_len": 248.1199,
4
+ "eval_loss": 1.275891661643982,
5
+ "eval_rouge1": 52.3608,
6
+ "eval_rouge2": 27.6526,
7
+ "eval_rougeL": 31.8509,
8
+ "eval_rougeLsum": 49.9086,
9
+ "eval_runtime": 1504.8405,
10
  "eval_samples": 1568,
11
+ "eval_samples_per_second": 1.042,
12
+ "eval_steps_per_second": 0.029
13
  }
generated_predictions.txt CHANGED
The diff for this file is too large to render. See raw diff
 
predict_results.json CHANGED
@@ -1,12 +1,12 @@
1
  {
2
- "predict_gen_len": 236.2392,
3
- "predict_loss": 1.5022238492965698,
4
- "predict_rouge1": 50.8664,
5
- "predict_rouge2": 26.5857,
6
- "predict_rougeL": 31.1338,
7
- "predict_rougeLsum": 48.4801,
8
- "predict_runtime": 1525.7443,
9
  "predict_samples": 1568,
10
- "predict_samples_per_second": 1.028,
11
- "predict_steps_per_second": 0.043
12
  }
 
1
  {
2
+ "predict_gen_len": 248.1199,
3
+ "predict_loss": 1.275891661643982,
4
+ "predict_rouge1": 52.3608,
5
+ "predict_rouge2": 27.6526,
6
+ "predict_rougeL": 31.8509,
7
+ "predict_rougeLsum": 49.9086,
8
+ "predict_runtime": 1513.1914,
9
  "predict_samples": 1568,
10
+ "predict_samples_per_second": 1.036,
11
+ "predict_steps_per_second": 0.029
12
  }
train_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
- "epoch": 3.0,
3
- "train_loss": 1.6923205314095087,
4
- "train_runtime": 822.2959,
5
  "train_samples": 6271,
6
- "train_samples_per_second": 22.879,
7
- "train_steps_per_second": 0.956
8
  }
 
1
  {
2
+ "epoch": 10.0,
3
+ "train_loss": 1.389875247819083,
4
+ "train_runtime": 2378.4813,
5
  "train_samples": 6271,
6
+ "train_samples_per_second": 26.366,
7
+ "train_steps_per_second": 0.736
8
  }
trainer_state.json CHANGED
The diff for this file is too large to render. See raw diff