rootxhacker commited on
Commit
efab289
·
verified ·
1 Parent(s): 7a1ef69

Training in progress, step 33000, checkpoint

Browse files
last-checkpoint/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d47a059c4465cb96ca8cf7f1905ca26df8afde99f0c2208111a3832ed682273e
3
  size 36730224
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7a1f3a37b9195f9fe5315c1a417cc9c4c1837b6b4960ab692b3988674668e641
3
  size 36730224
last-checkpoint/ar_diffusion_info.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:789a7c970269f3838d005c341e4869fd88818ad8ae5141deea1681f158455f61
3
  size 1544
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3523599b620af8d4d35f82aaf704dae1a9541799dcba2ac70510840b2a4877a5
3
  size 1544
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:01682574d44e97467301d5779733da7210577aa9e9ec38e6d369a4e1bb9c71a7
3
  size 73588346
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b004e01986e4ffc28df93cce958d9d9b3e3c05bd2e39ed3961cf317990155cfc
3
  size 73588346
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e10cec93434f8ec9066e53d88256d0df13c4dfad53975c2a473bada794e39de4
3
- size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0849d6e61493156c95f17fe6b7e25f79c73daada8cac211ebd8c78fd56fdbe07
3
+ size 14180
last-checkpoint/scaler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:fe23086b61822081f0f874226d60c752bbd88420dba9100921fe74a8fe8db57f
3
  size 988
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:99769539adfb817adf246fb69dd78f4ed98ef4d44e4b95e77847af02938c82df
3
  size 988
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:16e4c0e7d997f50c97bce12877fd963ff1e035235b3d794e37197e971fb5ab23
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2ba7f7caed94fa0fdab770ae562d792042367a76a376e41d1e68e45e9207a740
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -2,9 +2,9 @@
2
  "best_global_step": 30000,
3
  "best_metric": 0.9945911169052124,
4
  "best_model_checkpoint": "./ar-diffusion-checkpoints-fixed/checkpoint-30000",
5
- "epoch": 2.4998077070994538,
6
  "eval_steps": 250,
7
- "global_step": 32500,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
@@ -5598,6 +5598,92 @@
5598
  "eval_samples_per_second": 57.674,
5599
  "eval_steps_per_second": 14.418,
5600
  "step": 32500
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
5601
  }
5602
  ],
5603
  "logging_steps": 50,
 
2
  "best_global_step": 30000,
3
  "best_metric": 0.9945911169052124,
4
  "best_model_checkpoint": "./ar-diffusion-checkpoints-fixed/checkpoint-30000",
5
+ "epoch": 2.5382662872086765,
6
  "eval_steps": 250,
7
+ "global_step": 33000,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
 
5598
  "eval_samples_per_second": 57.674,
5599
  "eval_steps_per_second": 14.418,
5600
  "step": 32500
5601
+ },
5602
+ {
5603
+ "epoch": 2.503653565110376,
5604
+ "grad_norm": 0.867513120174408,
5605
+ "learning_rate": 3.359738202218009e-05,
5606
+ "loss": 0.994,
5607
+ "step": 32550
5608
+ },
5609
+ {
5610
+ "epoch": 2.507499423121298,
5611
+ "grad_norm": 1.7425885200500488,
5612
+ "learning_rate": 3.3337662000363615e-05,
5613
+ "loss": 1.0068,
5614
+ "step": 32600
5615
+ },
5616
+ {
5617
+ "epoch": 2.5113452811322206,
5618
+ "grad_norm": 0.9053608775138855,
5619
+ "learning_rate": 3.307794197854713e-05,
5620
+ "loss": 0.9704,
5621
+ "step": 32650
5622
+ },
5623
+ {
5624
+ "epoch": 2.515191139143143,
5625
+ "grad_norm": 1.0533051490783691,
5626
+ "learning_rate": 3.281822195673064e-05,
5627
+ "loss": 0.9506,
5628
+ "step": 32700
5629
+ },
5630
+ {
5631
+ "epoch": 2.519036997154065,
5632
+ "grad_norm": 1.2495230436325073,
5633
+ "learning_rate": 3.255850193491417e-05,
5634
+ "loss": 0.9936,
5635
+ "step": 32750
5636
+ },
5637
+ {
5638
+ "epoch": 2.519036997154065,
5639
+ "eval_loss": 0.9990929961204529,
5640
+ "eval_runtime": 17.239,
5641
+ "eval_samples_per_second": 58.008,
5642
+ "eval_steps_per_second": 14.502,
5643
+ "step": 32750
5644
+ },
5645
+ {
5646
+ "epoch": 2.5228828551649873,
5647
+ "grad_norm": 0.8339760303497314,
5648
+ "learning_rate": 3.229878191309768e-05,
5649
+ "loss": 1.0008,
5650
+ "step": 32800
5651
+ },
5652
+ {
5653
+ "epoch": 2.5267287131759097,
5654
+ "grad_norm": 1.2839399576187134,
5655
+ "learning_rate": 3.20390618912812e-05,
5656
+ "loss": 1.0109,
5657
+ "step": 32850
5658
+ },
5659
+ {
5660
+ "epoch": 2.5305745711868317,
5661
+ "grad_norm": 1.2146100997924805,
5662
+ "learning_rate": 3.177934186946472e-05,
5663
+ "loss": 0.9834,
5664
+ "step": 32900
5665
+ },
5666
+ {
5667
+ "epoch": 2.534420429197754,
5668
+ "grad_norm": 0.7952923774719238,
5669
+ "learning_rate": 3.151962184764823e-05,
5670
+ "loss": 1.0013,
5671
+ "step": 32950
5672
+ },
5673
+ {
5674
+ "epoch": 2.5382662872086765,
5675
+ "grad_norm": 1.67001211643219,
5676
+ "learning_rate": 3.125990182583176e-05,
5677
+ "loss": 0.9797,
5678
+ "step": 33000
5679
+ },
5680
+ {
5681
+ "epoch": 2.5382662872086765,
5682
+ "eval_loss": 1.001037359237671,
5683
+ "eval_runtime": 17.347,
5684
+ "eval_samples_per_second": 57.647,
5685
+ "eval_steps_per_second": 14.412,
5686
+ "step": 33000
5687
  }
5688
  ],
5689
  "logging_steps": 50,