rootxhacker commited on
Commit
4016107
·
verified ·
1 Parent(s): 5a4df68

Training in progress, step 30500, checkpoint

Browse files
last-checkpoint/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:069e8aec2bc91b01e99f7b79f39b1217a37ea88d9f6f4132f8acee4f393c01b1
3
  size 36730224
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:99d93c7c60c932d10ad33d1552af0aac71474f293137a45805a4a2ce763ee9d3
3
  size 36730224
last-checkpoint/ar_diffusion_info.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:05de4cdebfe1224dfd9ad2f7aac9780ebf9102b682b1460f83379a4262dee74b
3
  size 1544
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:35dbfc13847779b0a35938e8b0f588714c0a9135f44df01b3743c87ca265465a
3
  size 1544
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:585e32212caa9f4214a347406425426d068333176e31042b8c5c439f5b429d00
3
  size 73588346
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d6542d07369db36fde40d38be458a1a754a1635e655b17a3c1ef863154ef95d8
3
  size 73588346
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:65c2f44365d34d95613ad949972f890d6a6afc2c6e9d4d4d8c47a473b1c2b039
3
- size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d84d85985e40eaca2f8aecd8e39909983ecc43ecb61e48fd72ba84ffc8de605b
3
+ size 14180
last-checkpoint/scaler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:195e35eaf32578f671662018e8b669b6388d8b5ac81f855c1c95157d655e6122
3
  size 988
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:425d397e4698665694b259ae6a1b829b317ed54337dd9e06f3cd56fd2ec805f8
3
  size 988
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7f8616cef5b8dab506166471a2c46c7770aee1e224f56ecc6b4d1b9b5b17b94e
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:840262f69bbf64219997ced1350b5b0f0a6ada0892f4ec21d8f526e52fcbb247
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -2,9 +2,9 @@
2
  "best_global_step": 30000,
3
  "best_metric": 0.9945911169052124,
4
  "best_model_checkpoint": "./ar-diffusion-checkpoints-fixed/checkpoint-30000",
5
- "epoch": 2.307514806553342,
6
  "eval_steps": 250,
7
- "global_step": 30000,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
@@ -5168,6 +5168,92 @@
5168
  "eval_samples_per_second": 57.971,
5169
  "eval_steps_per_second": 14.493,
5170
  "step": 30000
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
5171
  }
5172
  ],
5173
  "logging_steps": 50,
 
2
  "best_global_step": 30000,
3
  "best_metric": 0.9945911169052124,
4
  "best_model_checkpoint": "./ar-diffusion-checkpoints-fixed/checkpoint-30000",
5
+ "epoch": 2.3459733866625645,
6
  "eval_steps": 250,
7
+ "global_step": 30500,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
 
5168
  "eval_samples_per_second": 57.971,
5169
  "eval_steps_per_second": 14.493,
5170
  "step": 30000
5171
+ },
5172
+ {
5173
+ "epoch": 2.311360664564264,
5174
+ "grad_norm": 1.3450604677200317,
5175
+ "learning_rate": 4.657818871256786e-05,
5176
+ "loss": 0.973,
5177
+ "step": 30050
5178
+ },
5179
+ {
5180
+ "epoch": 2.3152065225751866,
5181
+ "grad_norm": 1.1462957859039307,
5182
+ "learning_rate": 4.631846869075137e-05,
5183
+ "loss": 0.9789,
5184
+ "step": 30100
5185
+ },
5186
+ {
5187
+ "epoch": 2.3190523805861085,
5188
+ "grad_norm": 1.0691301822662354,
5189
+ "learning_rate": 4.605874866893489e-05,
5190
+ "loss": 0.9937,
5191
+ "step": 30150
5192
+ },
5193
+ {
5194
+ "epoch": 2.322898238597031,
5195
+ "grad_norm": 1.527723789215088,
5196
+ "learning_rate": 4.579902864711841e-05,
5197
+ "loss": 0.9276,
5198
+ "step": 30200
5199
+ },
5200
+ {
5201
+ "epoch": 2.3267440966079533,
5202
+ "grad_norm": 0.7396986484527588,
5203
+ "learning_rate": 4.553930862530192e-05,
5204
+ "loss": 0.9648,
5205
+ "step": 30250
5206
+ },
5207
+ {
5208
+ "epoch": 2.3267440966079533,
5209
+ "eval_loss": 1.0029717683792114,
5210
+ "eval_runtime": 17.2662,
5211
+ "eval_samples_per_second": 57.917,
5212
+ "eval_steps_per_second": 14.479,
5213
+ "step": 30250
5214
+ },
5215
+ {
5216
+ "epoch": 2.3305899546188753,
5217
+ "grad_norm": 0.9694539308547974,
5218
+ "learning_rate": 4.527958860348545e-05,
5219
+ "loss": 0.9378,
5220
+ "step": 30300
5221
+ },
5222
+ {
5223
+ "epoch": 2.3344358126297977,
5224
+ "grad_norm": 1.161028504371643,
5225
+ "learning_rate": 4.501986858166896e-05,
5226
+ "loss": 0.9807,
5227
+ "step": 30350
5228
+ },
5229
+ {
5230
+ "epoch": 2.33828167064072,
5231
+ "grad_norm": 1.6975845098495483,
5232
+ "learning_rate": 4.476014855985248e-05,
5233
+ "loss": 0.9809,
5234
+ "step": 30400
5235
+ },
5236
+ {
5237
+ "epoch": 2.342127528651642,
5238
+ "grad_norm": 1.3228962421417236,
5239
+ "learning_rate": 4.4500428538036e-05,
5240
+ "loss": 1.0339,
5241
+ "step": 30450
5242
+ },
5243
+ {
5244
+ "epoch": 2.3459733866625645,
5245
+ "grad_norm": 1.0168397426605225,
5246
+ "learning_rate": 4.424070851621952e-05,
5247
+ "loss": 0.9544,
5248
+ "step": 30500
5249
+ },
5250
+ {
5251
+ "epoch": 2.3459733866625645,
5252
+ "eval_loss": 1.002646565437317,
5253
+ "eval_runtime": 17.3363,
5254
+ "eval_samples_per_second": 57.682,
5255
+ "eval_steps_per_second": 14.421,
5256
+ "step": 30500
5257
  }
5258
  ],
5259
  "logging_steps": 50,