marinone94 committed on
Commit
6afffc7
•
1 Parent(s): 3bca5eb

Training in progress, step 1000

Browse files
{checkpoint-700 → checkpoint-1000}/config.json RENAMED
File without changes
{checkpoint-700 → checkpoint-1000}/optimizer.pt RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2734597abb10a2a590cf139e66decfdf1bc18e26d32aa5f4749a68f74109f763
3
  size 2490337809
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:95fabf5e2139b58b89a0a9dc4a0dd7eab2d7fb1e0bf2132c5d106a85eafec112
3
  size 2490337809
{checkpoint-700 → checkpoint-1000}/preprocessor_config.json RENAMED
File without changes
{checkpoint-700 → checkpoint-1000}/pytorch_model.bin RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:866e0246bd78706b1bfb6c07818d34662e459927e54718460f8a950f5fc33ae8
3
  size 1262063089
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8dccfbc86aa27461d23f7422a406db1866d4a1ca82d159e2b5e3bcbdbc5a4a7a
3
  size 1262063089
{checkpoint-700 → checkpoint-1000}/rng_state.pth RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:21798b4aee64ae056ff3e0e6a64832942beff047fe94bbbddb9d06dcf74d9125
3
  size 14567
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0d345fee08e052171f81f97e38f40e29d1f10781ff7f283285eab3f13efe48ad
3
  size 14567
{checkpoint-700 → checkpoint-1000}/scaler.pt RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7fb213daf5cce18a5f92167ca14da9df084d907f2b9796efc4666630f312b58c
3
  size 559
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f810fc7b695697c440d8985f6042b4ba23a9e1027604c265718b518ca29f1b2b
3
  size 559
{checkpoint-700 → checkpoint-1000}/scheduler.pt RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:fcdecc30328ffcc8e9b8e7d7b6cfb5d7c85a8e3d5e777d680eff74cf60f2dc24
3
  size 623
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e1b9ce074e953ed3bd3e9fe29e7e413ec9c091cd274300ea3bee0f296265516c
3
  size 623
{checkpoint-700 → checkpoint-1000}/trainer_state.json RENAMED
@@ -1,8 +1,8 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 7.688524590163935,
5
- "global_step": 700,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
@@ -279,11 +279,128 @@
279
  "eval_steps_per_second": 0.785,
280
  "eval_wer": 1.0,
281
  "step": 700
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
282
  }
283
  ],
284
  "max_steps": 4550,
285
  "num_train_epochs": 50,
286
- "total_flos": 1.0835835827730653e+19,
287
  "trial_name": null,
288
  "trial_params": null
289
  }
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 10.98360655737705,
5
+ "global_step": 1000,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
 
279
  "eval_steps_per_second": 0.785,
280
  "eval_wer": 1.0,
281
  "step": 700
282
+ },
283
+ {
284
+ "epoch": 7.91,
285
+ "learning_rate": 8.999999999999999e-05,
286
+ "loss": 2.9639,
287
+ "step": 720
288
+ },
289
+ {
290
+ "epoch": 8.13,
291
+ "learning_rate": 9.25e-05,
292
+ "loss": 3.0215,
293
+ "step": 740
294
+ },
295
+ {
296
+ "epoch": 8.35,
297
+ "learning_rate": 9.5e-05,
298
+ "loss": 2.9454,
299
+ "step": 760
300
+ },
301
+ {
302
+ "epoch": 8.57,
303
+ "learning_rate": 9.750000000000001e-05,
304
+ "loss": 2.9239,
305
+ "step": 780
306
+ },
307
+ {
308
+ "epoch": 8.79,
309
+ "learning_rate": 0.0001,
310
+ "loss": 2.8756,
311
+ "step": 800
312
+ },
313
+ {
314
+ "epoch": 8.79,
315
+ "eval_loss": 2.7302000522613525,
316
+ "eval_runtime": 191.8065,
317
+ "eval_samples_per_second": 25.249,
318
+ "eval_steps_per_second": 0.792,
319
+ "eval_wer": 1.0,
320
+ "step": 800
321
+ },
322
+ {
323
+ "epoch": 9.01,
324
+ "learning_rate": 0.0001025,
325
+ "loss": 2.8933,
326
+ "step": 820
327
+ },
328
+ {
329
+ "epoch": 9.23,
330
+ "learning_rate": 0.000105,
331
+ "loss": 2.7318,
332
+ "step": 840
333
+ },
334
+ {
335
+ "epoch": 9.45,
336
+ "learning_rate": 0.0001075,
337
+ "loss": 2.5941,
338
+ "step": 860
339
+ },
340
+ {
341
+ "epoch": 9.67,
342
+ "learning_rate": 0.00011,
343
+ "loss": 2.4441,
344
+ "step": 880
345
+ },
346
+ {
347
+ "epoch": 9.89,
348
+ "learning_rate": 0.00011250000000000001,
349
+ "loss": 2.2931,
350
+ "step": 900
351
+ },
352
+ {
353
+ "epoch": 9.89,
354
+ "eval_loss": 1.5057899951934814,
355
+ "eval_runtime": 196.4368,
356
+ "eval_samples_per_second": 24.654,
357
+ "eval_steps_per_second": 0.774,
358
+ "eval_wer": 0.9775759296054499,
359
+ "step": 900
360
+ },
361
+ {
362
+ "epoch": 10.11,
363
+ "learning_rate": 0.000115,
364
+ "loss": 2.1999,
365
+ "step": 920
366
+ },
367
+ {
368
+ "epoch": 10.33,
369
+ "learning_rate": 0.0001175,
370
+ "loss": 2.0574,
371
+ "step": 940
372
+ },
373
+ {
374
+ "epoch": 10.55,
375
+ "learning_rate": 0.00012,
376
+ "loss": 1.9672,
377
+ "step": 960
378
+ },
379
+ {
380
+ "epoch": 10.77,
381
+ "learning_rate": 0.0001225,
382
+ "loss": 1.9015,
383
+ "step": 980
384
+ },
385
+ {
386
+ "epoch": 10.98,
387
+ "learning_rate": 0.000125,
388
+ "loss": 1.8427,
389
+ "step": 1000
390
+ },
391
+ {
392
+ "epoch": 10.98,
393
+ "eval_loss": 0.9154536724090576,
394
+ "eval_runtime": 203.1168,
395
+ "eval_samples_per_second": 23.843,
396
+ "eval_steps_per_second": 0.748,
397
+ "eval_wer": 0.7832245245529378,
398
+ "step": 1000
399
  }
400
  ],
401
  "max_steps": 4550,
402
  "num_train_epochs": 50,
403
+ "total_flos": 1.5461756183168242e+19,
404
  "trial_name": null,
405
  "trial_params": null
406
  }
{checkpoint-700 → checkpoint-1000}/training_args.bin RENAMED
File without changes
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:704e6898ee156f5080bd3c12729eab90778262ef46c752641e041495f274ba56
3
  size 1262063089
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8dccfbc86aa27461d23f7422a406db1866d4a1ca82d159e2b5e3bcbdbc5a4a7a
3
  size 1262063089