lyan62 committed on
Commit
8e02c70
1 Parent(s): 8d41083

Training in progress, step 35000

Browse files
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9dfb8ee546a393cbd088a1267e0528b64ac1f6edc55a139ae628e0fae50bc81f
3
  size 402587859
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a6a5a7674dbb8d58ec4d7b340f1e19ce8cd6e355cf21b578954983287a8734b6
3
  size 402587859
last-checkpoint/pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:552e7d2fc0351ff5002d604566f010c93ce9e53db2a7a86ba323848706c62524
3
  size 201355195
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2677cfed78ccae5496a895d92941064711c7091014942cb86f552eaa9b73b86b
3
  size 201355195
last-checkpoint/rng_state_0.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b5cf95a496e0d0c153b9cfd4e8a1f7162ed59c2414c99c7838d29cd8f942ca48
3
  size 14503
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a2084cf08b52c1263f45bb8b8d4f65131103615cabf4896bf98de710a4ca1760
3
  size 14503
last-checkpoint/rng_state_1.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f9035eb22871e934ea2071d3c37031d3b68bc4ca9c57bb37af510e052600d5a2
3
  size 14503
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:668b3257e9fcad50addd96ee800eedbd732b610a370bd832008ee3ea4b26fb8e
3
  size 14503
last-checkpoint/rng_state_2.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f37c6f1bf46d4683c647937edd88a5957adcf809e2ade87bcd816e5a9ad05c40
3
  size 14503
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e83414b6fee779cf5d18e0d6de9bcb0d6baea757a03c57176cc09bb4cd38cf3d
3
  size 14503
last-checkpoint/rng_state_3.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:70c5619b7d22e67fa4d8ad8e5aac6be8872972633f6b700f4285106349937d54
3
  size 14503
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b0a9889c36f8cea70cf9f3a51e8e629fdb3421f3d44d2e389fe9d24a271ed606
3
  size 14503
last-checkpoint/scaler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f7facac06cf47f02915a64f3844ee1569b5a7479cd81db3f11a1da1896148a4d
3
  size 559
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:946d977aec6ac3e6d969a438e59b6cba069f78c02c4d887419131bdbe7403a10
3
  size 559
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5b2ecce13783d3eb66c2381b219fe80ea60a6817507cb21aea863465c4774335
3
  size 623
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a0991d8986307506ff20d1a384de1955fdf6c7f066139da3ee7c2fdbb8b4f5ce
3
  size 623
last-checkpoint/trainer_state.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 0.5106339520514719,
5
- "global_step": 30000,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
@@ -366,6 +366,66 @@
366
  "learning_rate": 0.00014876101394745023,
367
  "loss": 0.3747,
368
  "step": 30000
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
369
  }
370
  ],
371
  "max_steps": 500000,
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 0.5957396107267172,
5
+ "global_step": 35000,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
 
366
  "learning_rate": 0.00014876101394745023,
367
  "loss": 0.3747,
368
  "step": 30000
369
+ },
370
+ {
371
+ "epoch": 0.52,
372
+ "learning_rate": 0.00014871948232026222,
373
+ "loss": 0.3741,
374
+ "step": 30500
375
+ },
376
+ {
377
+ "epoch": 0.53,
378
+ "learning_rate": 0.00014867727245952692,
379
+ "loss": 0.3739,
380
+ "step": 31000
381
+ },
382
+ {
383
+ "epoch": 0.54,
384
+ "learning_rate": 0.00014863447123337502,
385
+ "loss": 0.3736,
386
+ "step": 31500
387
+ },
388
+ {
389
+ "epoch": 0.54,
390
+ "learning_rate": 0.00014859090751637814,
391
+ "loss": 0.3733,
392
+ "step": 32000
393
+ },
394
+ {
395
+ "epoch": 0.55,
396
+ "learning_rate": 0.00014854666683481534,
397
+ "loss": 0.3728,
398
+ "step": 32500
399
+ },
400
+ {
401
+ "epoch": 0.56,
402
+ "learning_rate": 0.0001485017496253243,
403
+ "loss": 0.3725,
404
+ "step": 33000
405
+ },
406
+ {
407
+ "epoch": 0.57,
408
+ "learning_rate": 0.00014845624819224238,
409
+ "loss": 0.3722,
410
+ "step": 33500
411
+ },
412
+ {
413
+ "epoch": 0.58,
414
+ "learning_rate": 0.00014840998061432743,
415
+ "loss": 0.3719,
416
+ "step": 34000
417
+ },
418
+ {
419
+ "epoch": 0.59,
420
+ "learning_rate": 0.00014836313241655734,
421
+ "loss": 0.3717,
422
+ "step": 34500
423
+ },
424
+ {
425
+ "epoch": 0.6,
426
+ "learning_rate": 0.00014831551629313194,
427
+ "loss": 0.3711,
428
+ "step": 35000
429
  }
430
  ],
431
  "max_steps": 500000,
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:552e7d2fc0351ff5002d604566f010c93ce9e53db2a7a86ba323848706c62524
3
  size 201355195
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2677cfed78ccae5496a895d92941064711c7091014942cb86f552eaa9b73b86b
3
  size 201355195