rootxhacker commited on
Commit
66b8895
·
verified ·
1 Parent(s): b91c7ff

Training in progress, step 20500, checkpoint

Browse files
last-checkpoint/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:37a2fe2b7cf5d7145d364d49968edb54efe43efd98eba6806289d74f7e529ae8
3
  size 36730224
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f82c93836bc692e34902f10bc204524481cd7a576e6d3e28b3bb7e2d682f323f
3
  size 36730224
last-checkpoint/ar_diffusion_info.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f7d0dd97707c0f0f3c8a12fdba68ea5ed4110d1f028231a6ea1054c90fb8603f
3
  size 1544
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6e8703e2ac4edb79cf8f1764c40656f93e9be69ded66eb4cce14bbce6431a5e0
3
  size 1544
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:59e604c620209e5ccc9d2a6df440d8eb819dc89b0c5554c52e42549c656e3250
3
  size 73588346
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:411bf70b4f8c28dcde0ada0a6ab13ec881cbbf19e85c2796efaba99e8b13583e
3
  size 73588346
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b205d8106465470d82a9f668e113b1a4c937f3fe768b385e78f85eb171e49cc2
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5dbffb5b9d940a96eb51dbe7a35860718ecfeca99437ad8b1b71dbafaefdd573
3
  size 14244
last-checkpoint/scaler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:eee3ef0a596a0ef37ef802555af22f2c3a4f5d3b4c13d00ed6df2466a73dd8ed
3
  size 988
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:384ba37c8844299a29c3c998811c9d47320ed4f7666069a4fb9a63d0dddfe44f
3
  size 988
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:83d15c547e182574b42460e3490faaf5cb37f299e2d2acbd532f1ef35e0b3aee
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c62f9fce1be162dfb9c17d3cf04dc0505b42c85ac9a955fe99836e3dd2e88351
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,10 +1,10 @@
1
  {
2
- "best_global_step": 18750,
3
- "best_metric": 1.4757392406463623,
4
  "best_model_checkpoint": "./ar-diffusion-checkpoints-fixed/checkpoint-15500",
5
- "epoch": 1.5383432043688947,
6
  "eval_steps": 250,
7
- "global_step": 20000,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
@@ -3448,6 +3448,92 @@
3448
  "eval_samples_per_second": 55.752,
3449
  "eval_steps_per_second": 13.938,
3450
  "step": 20000
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
3451
  }
3452
  ],
3453
  "logging_steps": 50,
 
1
  {
2
+ "best_global_step": 20250,
3
+ "best_metric": 1.4724150896072388,
4
  "best_model_checkpoint": "./ar-diffusion-checkpoints-fixed/checkpoint-15500",
5
+ "epoch": 1.576801784478117,
6
  "eval_steps": 250,
7
+ "global_step": 20500,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
 
3448
  "eval_samples_per_second": 55.752,
3449
  "eval_steps_per_second": 13.938,
3450
  "step": 20000
3451
+ },
3452
+ {
3453
+ "epoch": 1.542189062379817,
3454
+ "grad_norm": 1.7058050632476807,
3455
+ "learning_rate": 9.850660987455523e-05,
3456
+ "loss": 1.4646,
3457
+ "step": 20050
3458
+ },
3459
+ {
3460
+ "epoch": 1.5460349203907393,
3461
+ "grad_norm": 2.2624917030334473,
3462
+ "learning_rate": 9.824688985273876e-05,
3463
+ "loss": 1.4586,
3464
+ "step": 20100
3465
+ },
3466
+ {
3467
+ "epoch": 1.5498807784016613,
3468
+ "grad_norm": 2.216883420944214,
3469
+ "learning_rate": 9.798716983092227e-05,
3470
+ "loss": 1.4376,
3471
+ "step": 20150
3472
+ },
3473
+ {
3474
+ "epoch": 1.5537266364125837,
3475
+ "grad_norm": 1.9749584197998047,
3476
+ "learning_rate": 9.772744980910578e-05,
3477
+ "loss": 1.47,
3478
+ "step": 20200
3479
+ },
3480
+ {
3481
+ "epoch": 1.5575724944235059,
3482
+ "grad_norm": 2.185480833053589,
3483
+ "learning_rate": 9.746772978728931e-05,
3484
+ "loss": 1.39,
3485
+ "step": 20250
3486
+ },
3487
+ {
3488
+ "epoch": 1.5575724944235059,
3489
+ "eval_loss": 1.4724150896072388,
3490
+ "eval_runtime": 17.8191,
3491
+ "eval_samples_per_second": 56.12,
3492
+ "eval_steps_per_second": 14.03,
3493
+ "step": 20250
3494
+ },
3495
+ {
3496
+ "epoch": 1.561418352434428,
3497
+ "grad_norm": 1.5810290575027466,
3498
+ "learning_rate": 9.720800976547284e-05,
3499
+ "loss": 1.4267,
3500
+ "step": 20300
3501
+ },
3502
+ {
3503
+ "epoch": 1.5652642104453505,
3504
+ "grad_norm": 2.0329344272613525,
3505
+ "learning_rate": 9.694828974365633e-05,
3506
+ "loss": 1.5066,
3507
+ "step": 20350
3508
+ },
3509
+ {
3510
+ "epoch": 1.5691100684562724,
3511
+ "grad_norm": 2.7335126399993896,
3512
+ "learning_rate": 9.668856972183986e-05,
3513
+ "loss": 1.4749,
3514
+ "step": 20400
3515
+ },
3516
+ {
3517
+ "epoch": 1.5729559264671948,
3518
+ "grad_norm": 1.0576220750808716,
3519
+ "learning_rate": 9.642884970002339e-05,
3520
+ "loss": 1.4318,
3521
+ "step": 20450
3522
+ },
3523
+ {
3524
+ "epoch": 1.576801784478117,
3525
+ "grad_norm": 0.6857870817184448,
3526
+ "learning_rate": 9.616912967820689e-05,
3527
+ "loss": 1.3567,
3528
+ "step": 20500
3529
+ },
3530
+ {
3531
+ "epoch": 1.576801784478117,
3532
+ "eval_loss": 1.479669213294983,
3533
+ "eval_runtime": 17.8378,
3534
+ "eval_samples_per_second": 56.061,
3535
+ "eval_steps_per_second": 14.015,
3536
+ "step": 20500
3537
  }
3538
  ],
3539
  "logging_steps": 50,