rootxhacker commited on
Commit
2bc3e98
·
verified ·
1 Parent(s): af8c3c8

Training in progress, step 34500, checkpoint

Browse files
last-checkpoint/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:183bead4ca9a0d8a9ad0402f8298de3e2bfdf1c6bc3c98f0a8a4be0ee1e31d4d
3
  size 36730224
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:53c2dc91061b5eda8052d1184b1536e107f67954828f13fc73c5f566d9eec7e7
3
  size 36730224
last-checkpoint/ar_diffusion_info.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6b47889f113a05e0ff3862fe30181a9dc731902d20018b65b9702f60ad52946b
3
  size 1544
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fd069bd3f52dbe1e9e9aa12f2a80d00bcd8aecaa208ac2ee4066c63760aef004
3
  size 1544
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e318b97ed9819790ac140e0dd6c53dca0b92f84a57cf1dedca58f5c9fdf217c4
3
  size 73588346
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5f6e144665188da17e67d918c6abe6a3a0b2a9a0712038ae5ff60cbb2015b996
3
  size 73588346
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3a8f7000d6d396338bd8027a37093a36e3ad9a9fa3dd5e939b7cf2fd1b06a270
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e2aa00c75821a3bd67f749b822eac4f44391e9055a1d2f4b3c96ab88dfd278a9
3
  size 14244
last-checkpoint/scaler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d185966dc7e40240f30d39f221c00702b5a813416a3b53099b3469fe07e391c8
3
  size 988
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7fe927b439a1a453ba57ba9d3a3e3ce57ef03a538257a3403279d996da7cbd98
3
  size 988
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2206e3ea9caa91bbe357a176c4a03573c2b47177cf241fe9772382f8b2e0ca8f
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b632fa657d89cf9d024b864a979b41e9d4484feec7658b4550443a85b8f54ac3
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -2,9 +2,9 @@
2
  "best_global_step": 34000,
3
  "best_metric": 0.987713634967804,
4
  "best_model_checkpoint": "./ar-diffusion-checkpoints-fixed/checkpoint-34000",
5
- "epoch": 2.615183447427121,
6
  "eval_steps": 250,
7
- "global_step": 34000,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
@@ -5856,6 +5856,92 @@
5856
  "eval_samples_per_second": 57.993,
5857
  "eval_steps_per_second": 14.498,
5858
  "step": 34000
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
5859
  }
5860
  ],
5861
  "logging_steps": 50,
 
2
  "best_global_step": 34000,
3
  "best_metric": 0.987713634967804,
4
  "best_model_checkpoint": "./ar-diffusion-checkpoints-fixed/checkpoint-34000",
5
+ "epoch": 2.6536420275363435,
6
  "eval_steps": 250,
7
+ "global_step": 34500,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
 
5856
  "eval_samples_per_second": 57.993,
5857
  "eval_steps_per_second": 14.498,
5858
  "step": 34000
5859
+ },
5860
+ {
5861
+ "epoch": 2.619029305438043,
5862
+ "grad_norm": 0.5307362079620361,
5863
+ "learning_rate": 2.580578136768564e-05,
5864
+ "loss": 1.0031,
5865
+ "step": 34050
5866
+ },
5867
+ {
5868
+ "epoch": 2.6228751634489655,
5869
+ "grad_norm": 1.1112557649612427,
5870
+ "learning_rate": 2.5546061345869156e-05,
5871
+ "loss": 0.9928,
5872
+ "step": 34100
5873
+ },
5874
+ {
5875
+ "epoch": 2.626721021459888,
5876
+ "grad_norm": 0.646759569644928,
5877
+ "learning_rate": 2.5286341324052672e-05,
5878
+ "loss": 1.0173,
5879
+ "step": 34150
5880
+ },
5881
+ {
5882
+ "epoch": 2.63056687947081,
5883
+ "grad_norm": 1.0114878416061401,
5884
+ "learning_rate": 2.502662130223619e-05,
5885
+ "loss": 0.9765,
5886
+ "step": 34200
5887
+ },
5888
+ {
5889
+ "epoch": 2.6344127374817323,
5890
+ "grad_norm": 0.8782021403312683,
5891
+ "learning_rate": 2.4766901280419708e-05,
5892
+ "loss": 0.9926,
5893
+ "step": 34250
5894
+ },
5895
+ {
5896
+ "epoch": 2.6344127374817323,
5897
+ "eval_loss": 0.9932020306587219,
5898
+ "eval_runtime": 17.1921,
5899
+ "eval_samples_per_second": 58.166,
5900
+ "eval_steps_per_second": 14.542,
5901
+ "step": 34250
5902
+ },
5903
+ {
5904
+ "epoch": 2.6382585954926543,
5905
+ "grad_norm": 1.0792268514633179,
5906
+ "learning_rate": 2.4507181258603227e-05,
5907
+ "loss": 1.0541,
5908
+ "step": 34300
5909
+ },
5910
+ {
5911
+ "epoch": 2.6421044535035767,
5912
+ "grad_norm": 0.9647793173789978,
5913
+ "learning_rate": 2.4247461236786744e-05,
5914
+ "loss": 0.9779,
5915
+ "step": 34350
5916
+ },
5917
+ {
5918
+ "epoch": 2.6459503115144987,
5919
+ "grad_norm": 1.0052498579025269,
5920
+ "learning_rate": 2.3987741214970263e-05,
5921
+ "loss": 0.9798,
5922
+ "step": 34400
5923
+ },
5924
+ {
5925
+ "epoch": 2.649796169525421,
5926
+ "grad_norm": 0.8122023344039917,
5927
+ "learning_rate": 2.3728021193153783e-05,
5928
+ "loss": 1.0205,
5929
+ "step": 34450
5930
+ },
5931
+ {
5932
+ "epoch": 2.6536420275363435,
5933
+ "grad_norm": 1.452087163925171,
5934
+ "learning_rate": 2.3468301171337302e-05,
5935
+ "loss": 0.9745,
5936
+ "step": 34500
5937
+ },
5938
+ {
5939
+ "epoch": 2.6536420275363435,
5940
+ "eval_loss": 0.9959968328475952,
5941
+ "eval_runtime": 17.2025,
5942
+ "eval_samples_per_second": 58.131,
5943
+ "eval_steps_per_second": 14.533,
5944
+ "step": 34500
5945
  }
5946
  ],
5947
  "logging_steps": 50,