JulienRPA committed on
Commit
74cca0d
1 Parent(s): 94e3b14

Training in progress, step 10000

Browse files
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8f7e8f5369bfc2a29f36f7b10957832c0e20a5a70d77b74647f2ca26ac882624
3
  size 2023671531
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:14c9a2e55c4c50b24b29ffda31bbbf8b2ce79105a3817c65ef74a18d2c29ccd0
3
  size 2023671531
last-checkpoint/pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:563b0a357a2dc71eec9a097e4c7356b071b95a6f14bf272d39a798ac00c8b93f
3
  size 1014236857
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1985db2a12fd26ee3312f17e5b5c9269d139ea9375f805eaa6bedfdbc502aed3
3
  size 1014236857
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0fb75bd8c52e3fd47730e38465db8261e233f22f3a237ac4bbce2f0d46dafd10
3
  size 14575
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:223d17683d85a6b838bf63109231365183224af0ce92c28b1ea819c53db67266
3
  size 14575
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7dbe52cd022df1b5a43d833c96a319fe1d93b440f729ffdf50bc9798e6a7f019
3
  size 627
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:180a76762e48468dc084ebe39054009bb6587d7f0fcb0961ce0eec20c5af2575
3
  size 627
last-checkpoint/trainer_state.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 230.76923076923077,
5
- "global_step": 9000,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
@@ -330,11 +330,47 @@
330
  "eval_samples_per_second": 3.559,
331
  "eval_steps_per_second": 0.452,
332
  "step": 9000
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
333
  }
334
  ],
335
  "max_steps": 11700,
336
  "num_train_epochs": 300,
337
- "total_flos": 7274599459543680.0,
338
  "trial_name": null,
339
  "trial_params": null
340
  }
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 256.4102564102564,
5
+ "global_step": 10000,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
 
330
  "eval_samples_per_second": 3.559,
331
  "eval_steps_per_second": 0.452,
332
  "step": 9000
333
+ },
334
+ {
335
+ "epoch": 243.59,
336
+ "learning_rate": 1.1360824742268042e-05,
337
+ "loss": 0.0502,
338
+ "step": 9500
339
+ },
340
+ {
341
+ "epoch": 243.59,
342
+ "eval_bleu": 95.1882,
343
+ "eval_em": 0.1319,
344
+ "eval_gen_len": 58.5228,
345
+ "eval_loss": 0.3490062654018402,
346
+ "eval_rm": 0.3141,
347
+ "eval_runtime": 118.559,
348
+ "eval_samples_per_second": 3.517,
349
+ "eval_steps_per_second": 0.447,
350
+ "step": 9500
351
+ },
352
+ {
353
+ "epoch": 256.41,
354
+ "learning_rate": 8.783505154639175e-06,
355
+ "loss": 0.0473,
356
+ "step": 10000
357
+ },
358
+ {
359
+ "epoch": 256.41,
360
+ "eval_bleu": 95.1198,
361
+ "eval_em": 0.1319,
362
+ "eval_gen_len": 58.4245,
363
+ "eval_loss": 0.3504057824611664,
364
+ "eval_rm": 0.307,
365
+ "eval_runtime": 118.462,
366
+ "eval_samples_per_second": 3.52,
367
+ "eval_steps_per_second": 0.447,
368
+ "step": 10000
369
  }
370
  ],
371
  "max_steps": 11700,
372
  "num_train_epochs": 300,
373
+ "total_flos": 8083589088527040.0,
374
  "trial_name": null,
375
  "trial_params": null
376
  }
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:563b0a357a2dc71eec9a097e4c7356b071b95a6f14bf272d39a798ac00c8b93f
3
  size 1014236857
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1985db2a12fd26ee3312f17e5b5c9269d139ea9375f805eaa6bedfdbc502aed3
3
  size 1014236857
runs/Jun01_11-16-06_2f3322bc44db/events.out.tfevents.1685618949.2f3322bc44db.4217.0 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7d04c0c561bed68c646c44b3398c50c017920833a05db2429bb948013b4a847c
3
- size 19699
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:21397dc7fa148fe1a54e9c47d988caf74cf88c782cf80ab207dabd14c450b5a5
3
+ size 20937