rootxhacker commited on
Commit
a83ee2d
·
verified ·
1 Parent(s): ad5678e

Training in progress, step 22000, checkpoint

Browse files
last-checkpoint/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:66cda148dcae03c8b6ee9a988c41356b8fb7dd85bc794057def1a0a106239b14
3
  size 36730224
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7d7b8f572c134e72c7026e2e9ad914d2679628dec1b66f03f49c50f611744778
3
  size 36730224
last-checkpoint/ar_diffusion_info.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7a7ccadc0fc62d6e734efb6eac59f8de15c8962f84260b3fa84659524029cca9
3
  size 1544
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:70ce7eba6d133886c57e789ae1ced0054a79c486c5c2f9581bd59cf429b1f437
3
  size 1544
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4cde556e6d84497b700bedd313afb1db4fbdff84a922d3df94365577a9ffe5cb
3
  size 73588346
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8d3bd2c73ee827d2b8927a44cbea930a6ab308656fbc61ae1272b12f9654d264
3
  size 73588346
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:24cdd6f45f9ebce887e06d548bf949bd18ccf52b17999d18752823b6dd7dc03a
3
- size 14308
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:625da12a62ce1ec712e7ea0b4fc06eed36ff20b9634198d1bc6029989e807f8d
3
+ size 14244
last-checkpoint/scaler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:76d7482aa4f2ea8d9ee623a2338b27a160c64d9b3e6847f775500f74a89d839e
3
  size 988
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8788cf54002af30b32604c9f2a6a5a9fa6c726ebc719ce2f7ca555b2dcfdfac8
3
  size 988
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ba5e991474e4af796236702d23dc20d105ef404660d6c7d1c95fb199aa1ce3be
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:854a60bf19d6e0989bdf3b974086f8fa81da02ef244adb541905035064ca56fc
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,10 +1,10 @@
1
  {
2
- "best_global_step": 21000,
3
- "best_metric": 1.4690666198730469,
4
  "best_model_checkpoint": "./ar-diffusion-checkpoints-fixed/checkpoint-21000",
5
- "epoch": 1.6537189446965619,
6
  "eval_steps": 250,
7
- "global_step": 21500,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
@@ -3706,6 +3706,92 @@
3706
  "eval_samples_per_second": 56.129,
3707
  "eval_steps_per_second": 14.032,
3708
  "step": 21500
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
3709
  }
3710
  ],
3711
  "logging_steps": 50,
 
1
  {
2
+ "best_global_step": 21750,
3
+ "best_metric": 1.4662117958068848,
4
  "best_model_checkpoint": "./ar-diffusion-checkpoints-fixed/checkpoint-21000",
5
+ "epoch": 1.6921775248057842,
6
  "eval_steps": 250,
7
+ "global_step": 22000,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
 
3706
  "eval_samples_per_second": 56.129,
3707
  "eval_steps_per_second": 14.032,
3708
  "step": 21500
3709
+ },
3710
+ {
3711
+ "epoch": 1.657564802707484,
3712
+ "grad_norm": 1.3839844465255737,
3713
+ "learning_rate": 9.072020362049712e-05,
3714
+ "loss": 1.522,
3715
+ "step": 21550
3716
+ },
3717
+ {
3718
+ "epoch": 1.6614106607184063,
3719
+ "grad_norm": 1.187853455543518,
3720
+ "learning_rate": 9.046048359868063e-05,
3721
+ "loss": 1.4469,
3722
+ "step": 21600
3723
+ },
3724
+ {
3725
+ "epoch": 1.6652565187293287,
3726
+ "grad_norm": 2.8398866653442383,
3727
+ "learning_rate": 9.020076357686414e-05,
3728
+ "loss": 1.4875,
3729
+ "step": 21650
3730
+ },
3731
+ {
3732
+ "epoch": 1.6691023767402506,
3733
+ "grad_norm": 1.801963448524475,
3734
+ "learning_rate": 8.994104355504767e-05,
3735
+ "loss": 1.3892,
3736
+ "step": 21700
3737
+ },
3738
+ {
3739
+ "epoch": 1.672948234751173,
3740
+ "grad_norm": 1.7727116346359253,
3741
+ "learning_rate": 8.968132353323118e-05,
3742
+ "loss": 1.3886,
3743
+ "step": 21750
3744
+ },
3745
+ {
3746
+ "epoch": 1.672948234751173,
3747
+ "eval_loss": 1.4662117958068848,
3748
+ "eval_runtime": 17.7809,
3749
+ "eval_samples_per_second": 56.24,
3750
+ "eval_steps_per_second": 14.06,
3751
+ "step": 21750
3752
+ },
3753
+ {
3754
+ "epoch": 1.6767940927620952,
3755
+ "grad_norm": 1.7052053213119507,
3756
+ "learning_rate": 8.94216035114147e-05,
3757
+ "loss": 1.4483,
3758
+ "step": 21800
3759
+ },
3760
+ {
3761
+ "epoch": 1.6806399507730174,
3762
+ "grad_norm": 1.9812465906143188,
3763
+ "learning_rate": 8.916188348959822e-05,
3764
+ "loss": 1.4325,
3765
+ "step": 21850
3766
+ },
3767
+ {
3768
+ "epoch": 1.6844858087839398,
3769
+ "grad_norm": 1.2499721050262451,
3770
+ "learning_rate": 8.890216346778173e-05,
3771
+ "loss": 1.5246,
3772
+ "step": 21900
3773
+ },
3774
+ {
3775
+ "epoch": 1.6883316667948618,
3776
+ "grad_norm": 1.2503259181976318,
3777
+ "learning_rate": 8.864244344596525e-05,
3778
+ "loss": 1.4661,
3779
+ "step": 21950
3780
+ },
3781
+ {
3782
+ "epoch": 1.6921775248057842,
3783
+ "grad_norm": 2.201223134994507,
3784
+ "learning_rate": 8.838272342414877e-05,
3785
+ "loss": 1.5103,
3786
+ "step": 22000
3787
+ },
3788
+ {
3789
+ "epoch": 1.6921775248057842,
3790
+ "eval_loss": 1.470120906829834,
3791
+ "eval_runtime": 17.7715,
3792
+ "eval_samples_per_second": 56.27,
3793
+ "eval_steps_per_second": 14.067,
3794
+ "step": 22000
3795
  }
3796
  ],
3797
  "logging_steps": 50,