polejowska committed on
Commit
2e5b2fc
·
1 Parent(s): 3d74990

End of training

Browse files
runs/Feb28_16-54-08_7c779bfb7013/events.out.tfevents.1677603252.7c779bfb7013.343.6 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0fc70b496e42516c3c30d1322213233c7c4981543b816a9963e194286ff2c928
3
- size 6672
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d555a2b0f42e6420c3fbdf504df6f3f94388acb4213d83946408ba7ca3d3a42b
3
+ size 7026
trainer_state.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 15.0,
5
- "global_step": 1410,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
@@ -218,18 +218,88 @@
218
  "step": 1410
219
  },
220
  {
221
- "epoch": 15.0,
222
- "step": 1410,
223
- "total_flos": 5.3762898528e+18,
224
- "train_loss": 1.3009196721070202,
225
- "train_runtime": 1911.8077,
226
- "train_samples_per_second": 5.884,
227
- "train_steps_per_second": 0.738
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
228
  }
229
  ],
230
- "max_steps": 1410,
231
- "num_train_epochs": 15,
232
- "total_flos": 5.3762898528e+18,
233
  "trial_name": null,
234
  "trial_params": null
235
  }
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 20.0,
5
+ "global_step": 1880,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
 
218
  "step": 1410
219
  },
220
  {
221
+ "epoch": 16.0,
222
+ "learning_rate": 2e-05,
223
+ "loss": 2.3134,
224
+ "step": 1504
225
+ },
226
+ {
227
+ "epoch": 16.0,
228
+ "eval_loss": 1.7698218822479248,
229
+ "eval_runtime": 34.7625,
230
+ "eval_samples_per_second": 5.753,
231
+ "eval_steps_per_second": 0.719,
232
+ "step": 1504
233
+ },
234
+ {
235
+ "epoch": 17.0,
236
+ "learning_rate": 1.5e-05,
237
+ "loss": 2.3423,
238
+ "step": 1598
239
+ },
240
+ {
241
+ "epoch": 17.0,
242
+ "eval_loss": 1.7581219673156738,
243
+ "eval_runtime": 35.8583,
244
+ "eval_samples_per_second": 5.578,
245
+ "eval_steps_per_second": 0.697,
246
+ "step": 1598
247
+ },
248
+ {
249
+ "epoch": 18.0,
250
+ "learning_rate": 1e-05,
251
+ "loss": 2.3536,
252
+ "step": 1692
253
+ },
254
+ {
255
+ "epoch": 18.0,
256
+ "eval_loss": 1.7658276557922363,
257
+ "eval_runtime": 35.6301,
258
+ "eval_samples_per_second": 5.613,
259
+ "eval_steps_per_second": 0.702,
260
+ "step": 1692
261
+ },
262
+ {
263
+ "epoch": 19.0,
264
+ "learning_rate": 5e-06,
265
+ "loss": 2.2957,
266
+ "step": 1786
267
+ },
268
+ {
269
+ "epoch": 19.0,
270
+ "eval_loss": 1.7328851222991943,
271
+ "eval_runtime": 36.2644,
272
+ "eval_samples_per_second": 5.515,
273
+ "eval_steps_per_second": 0.689,
274
+ "step": 1786
275
+ },
276
+ {
277
+ "epoch": 20.0,
278
+ "learning_rate": 0.0,
279
+ "loss": 2.274,
280
+ "step": 1880
281
+ },
282
+ {
283
+ "epoch": 20.0,
284
+ "eval_loss": 1.7334604263305664,
285
+ "eval_runtime": 34.2732,
286
+ "eval_samples_per_second": 5.835,
287
+ "eval_steps_per_second": 0.729,
288
+ "step": 1880
289
+ },
290
+ {
291
+ "epoch": 20.0,
292
+ "step": 1880,
293
+ "total_flos": 7.1683864704e+18,
294
+ "train_loss": 0.5789503787426238,
295
+ "train_runtime": 1191.4496,
296
+ "train_samples_per_second": 12.59,
297
+ "train_steps_per_second": 1.578
298
  }
299
  ],
300
+ "max_steps": 1880,
301
+ "num_train_epochs": 20,
302
+ "total_flos": 7.1683864704e+18,
303
  "trial_name": null,
304
  "trial_params": null
305
  }