SushantGautam committed on
Commit
c0f9085
·
1 Parent(s): f6b04a3

End of training

Browse files
all_results.json CHANGED
@@ -1,28 +1,28 @@
1
  {
2
  "epoch": 3.0,
3
- "eval_gen_len": 210.0806,
4
- "eval_loss": 1.6125962734222412,
5
- "eval_rouge1": 47.06,
6
- "eval_rouge2": 24.4723,
7
- "eval_rougeL": 29.7398,
8
- "eval_rougeLsum": 44.8711,
9
- "eval_runtime": 793.256,
10
- "eval_samples": 757,
11
- "eval_samples_per_second": 0.954,
12
- "eval_steps_per_second": 0.16,
13
- "predict_gen_len": 210.0806,
14
- "predict_loss": 1.6125962734222412,
15
- "predict_rouge1": 47.06,
16
- "predict_rouge2": 24.4723,
17
- "predict_rougeL": 29.7398,
18
- "predict_rougeLsum": 44.8711,
19
- "predict_runtime": 796.6823,
20
- "predict_samples": 757,
21
- "predict_samples_per_second": 0.95,
22
- "predict_steps_per_second": 0.159,
23
- "train_loss": 1.690134874428853,
24
- "train_runtime": 978.58,
25
- "train_samples": 3028,
26
- "train_samples_per_second": 9.283,
27
- "train_steps_per_second": 1.548
28
  }
 
1
  {
2
  "epoch": 3.0,
3
+ "eval_gen_len": 245.1964,
4
+ "eval_loss": 1.4946045875549316,
5
+ "eval_rouge1": 53.216,
6
+ "eval_rouge2": 27.3466,
7
+ "eval_rougeL": 32.1459,
8
+ "eval_rougeLsum": 50.6437,
9
+ "eval_runtime": 1546.4204,
10
+ "eval_samples": 1568,
11
+ "eval_samples_per_second": 1.014,
12
+ "eval_steps_per_second": 0.043,
13
+ "predict_gen_len": 245.1964,
14
+ "predict_loss": 1.4946045875549316,
15
+ "predict_rouge1": 53.216,
16
+ "predict_rouge2": 27.3466,
17
+ "predict_rougeL": 32.1459,
18
+ "predict_rougeLsum": 50.6437,
19
+ "predict_runtime": 1584.3545,
20
+ "predict_samples": 1568,
21
+ "predict_samples_per_second": 0.99,
22
+ "predict_steps_per_second": 0.042,
23
+ "train_loss": 1.6920310260382014,
24
+ "train_runtime": 827.5296,
25
+ "train_samples": 6271,
26
+ "train_samples_per_second": 22.734,
27
+ "train_steps_per_second": 0.95
28
  }
eval_results.json CHANGED
@@ -1,13 +1,13 @@
1
  {
2
  "epoch": 3.0,
3
- "eval_gen_len": 210.0806,
4
- "eval_loss": 1.6125962734222412,
5
- "eval_rouge1": 47.06,
6
- "eval_rouge2": 24.4723,
7
- "eval_rougeL": 29.7398,
8
- "eval_rougeLsum": 44.8711,
9
- "eval_runtime": 793.256,
10
- "eval_samples": 757,
11
- "eval_samples_per_second": 0.954,
12
- "eval_steps_per_second": 0.16
13
  }
 
1
  {
2
  "epoch": 3.0,
3
+ "eval_gen_len": 245.1964,
4
+ "eval_loss": 1.4946045875549316,
5
+ "eval_rouge1": 53.216,
6
+ "eval_rouge2": 27.3466,
7
+ "eval_rougeL": 32.1459,
8
+ "eval_rougeLsum": 50.6437,
9
+ "eval_runtime": 1546.4204,
10
+ "eval_samples": 1568,
11
+ "eval_samples_per_second": 1.014,
12
+ "eval_steps_per_second": 0.043
13
  }
generated_predictions.txt CHANGED
The diff for this file is too large to render. See raw diff
 
predict_results.json CHANGED
@@ -1,12 +1,12 @@
1
  {
2
- "predict_gen_len": 210.0806,
3
- "predict_loss": 1.6125962734222412,
4
- "predict_rouge1": 47.06,
5
- "predict_rouge2": 24.4723,
6
- "predict_rougeL": 29.7398,
7
- "predict_rougeLsum": 44.8711,
8
- "predict_runtime": 796.6823,
9
- "predict_samples": 757,
10
- "predict_samples_per_second": 0.95,
11
- "predict_steps_per_second": 0.159
12
  }
 
1
  {
2
+ "predict_gen_len": 245.1964,
3
+ "predict_loss": 1.4946045875549316,
4
+ "predict_rouge1": 53.216,
5
+ "predict_rouge2": 27.3466,
6
+ "predict_rougeL": 32.1459,
7
+ "predict_rougeLsum": 50.6437,
8
+ "predict_runtime": 1584.3545,
9
+ "predict_samples": 1568,
10
+ "predict_samples_per_second": 0.99,
11
+ "predict_steps_per_second": 0.042
12
  }
train_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "epoch": 3.0,
3
- "train_loss": 1.690134874428853,
4
- "train_runtime": 978.58,
5
- "train_samples": 3028,
6
- "train_samples_per_second": 9.283,
7
- "train_steps_per_second": 1.548
8
  }
 
1
  {
2
  "epoch": 3.0,
3
+ "train_loss": 1.6920310260382014,
4
+ "train_runtime": 827.5296,
5
+ "train_samples": 6271,
6
+ "train_samples_per_second": 22.734,
7
+ "train_steps_per_second": 0.95
8
  }
trainer_state.json CHANGED
The diff for this file is too large to render. See raw diff