Jeska committed on
Commit
8cec9d7
1 Parent(s): 12e4c56

End of training

Browse files
all_results.json CHANGED
@@ -2,13 +2,13 @@
2
  "epoch": 3.0,
3
  "eval_accuracy": 1.0,
4
  "eval_loss": 0.6986985802650452,
5
- "eval_runtime": 0.0261,
6
  "eval_samples": 5,
7
- "eval_samples_per_second": 191.241,
8
- "eval_steps_per_second": 38.248,
9
  "train_loss": 2.285688607541627,
10
- "train_runtime": 404.3347,
11
  "train_samples": 11651,
12
- "train_samples_per_second": 86.446,
13
- "train_steps_per_second": 10.81
14
  }
 
2
  "epoch": 3.0,
3
  "eval_accuracy": 1.0,
4
  "eval_loss": 0.6986985802650452,
5
+ "eval_runtime": 0.0217,
6
  "eval_samples": 5,
7
+ "eval_samples_per_second": 230.317,
8
+ "eval_steps_per_second": 46.063,
9
  "train_loss": 2.285688607541627,
10
+ "train_runtime": 426.5716,
11
  "train_samples": 11651,
12
+ "train_samples_per_second": 81.939,
13
+ "train_steps_per_second": 10.247
14
  }
eval_results.json CHANGED
@@ -2,8 +2,8 @@
2
  "epoch": 3.0,
3
  "eval_accuracy": 1.0,
4
  "eval_loss": 0.6986985802650452,
5
- "eval_runtime": 0.0261,
6
  "eval_samples": 5,
7
- "eval_samples_per_second": 191.241,
8
- "eval_steps_per_second": 38.248
9
  }
 
2
  "epoch": 3.0,
3
  "eval_accuracy": 1.0,
4
  "eval_loss": 0.6986985802650452,
5
+ "eval_runtime": 0.0217,
6
  "eval_samples": 5,
7
+ "eval_samples_per_second": 230.317,
8
+ "eval_steps_per_second": 46.063
9
  }
train_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "epoch": 3.0,
3
  "train_loss": 2.285688607541627,
4
- "train_runtime": 404.3347,
5
  "train_samples": 11651,
6
- "train_samples_per_second": 86.446,
7
- "train_steps_per_second": 10.81
8
  }
 
1
  {
2
  "epoch": 3.0,
3
  "train_loss": 2.285688607541627,
4
+ "train_runtime": 426.5716,
5
  "train_samples": 11651,
6
+ "train_samples_per_second": 81.939,
7
+ "train_steps_per_second": 10.247
8
  }
trainer_state.json CHANGED
@@ -23,9 +23,9 @@
23
  "epoch": 1.0,
24
  "eval_accuracy": 0.6000000238418579,
25
  "eval_loss": 2.099963903427124,
26
- "eval_runtime": 0.0837,
27
- "eval_samples_per_second": 59.702,
28
- "eval_steps_per_second": 11.94,
29
  "step": 1457
30
  },
31
  {
@@ -50,9 +50,9 @@
50
  "epoch": 2.0,
51
  "eval_accuracy": 1.0,
52
  "eval_loss": 0.9956113696098328,
53
- "eval_runtime": 0.0198,
54
- "eval_samples_per_second": 252.666,
55
- "eval_steps_per_second": 50.533,
56
  "step": 2914
57
  },
58
  {
@@ -78,8 +78,8 @@
78
  "eval_accuracy": 1.0,
79
  "eval_loss": 0.6986985802650452,
80
  "eval_runtime": 0.0153,
81
- "eval_samples_per_second": 326.486,
82
- "eval_steps_per_second": 65.297,
83
  "step": 4371
84
  },
85
  {
@@ -87,9 +87,9 @@
87
  "step": 4371,
88
  "total_flos": 1151412634864512.0,
89
  "train_loss": 2.285688607541627,
90
- "train_runtime": 404.3347,
91
- "train_samples_per_second": 86.446,
92
- "train_steps_per_second": 10.81
93
  }
94
  ],
95
  "max_steps": 4371,
 
23
  "epoch": 1.0,
24
  "eval_accuracy": 0.6000000238418579,
25
  "eval_loss": 2.099963903427124,
26
+ "eval_runtime": 0.0157,
27
+ "eval_samples_per_second": 319.046,
28
+ "eval_steps_per_second": 63.809,
29
  "step": 1457
30
  },
31
  {
 
50
  "epoch": 2.0,
51
  "eval_accuracy": 1.0,
52
  "eval_loss": 0.9956113696098328,
53
+ "eval_runtime": 0.0195,
54
+ "eval_samples_per_second": 256.73,
55
+ "eval_steps_per_second": 51.346,
56
  "step": 2914
57
  },
58
  {
 
78
  "eval_accuracy": 1.0,
79
  "eval_loss": 0.6986985802650452,
80
  "eval_runtime": 0.0153,
81
+ "eval_samples_per_second": 326.232,
82
+ "eval_steps_per_second": 65.246,
83
  "step": 4371
84
  },
85
  {
 
87
  "step": 4371,
88
  "total_flos": 1151412634864512.0,
89
  "train_loss": 2.285688607541627,
90
+ "train_runtime": 426.5716,
91
+ "train_samples_per_second": 81.939,
92
+ "train_steps_per_second": 10.247
93
  }
94
  ],
95
  "max_steps": 4371,