Kudod commited on
Commit
b08e58c
·
verified ·
1 Parent(s): 2f8e4c4

Training in progress, step 161088, checkpoint

Browse files
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d3fd70c2ee9103dacc2e8460e11a544a0da08573c15a524763aa473249698e80
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4caa78e2064d47e2ccbf882089e5403067cd8ee5d79157d96a300242fc6a5b1b
3
  size 14244
last-checkpoint/trainer_state.json CHANGED
@@ -2,9 +2,9 @@
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
- "epoch": 3.972983710766786,
6
  "eval_steps": 5000,
7
- "global_step": 160000,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
@@ -2504,6 +2504,20 @@
2504
  "eval_samples_per_second": 440.496,
2505
  "eval_steps_per_second": 13.766,
2506
  "step": 160000
 
 
 
 
 
 
 
 
 
 
 
 
 
 
2507
  }
2508
  ],
2509
  "logging_steps": 500,
@@ -2518,12 +2532,12 @@
2518
  "should_evaluate": false,
2519
  "should_log": false,
2520
  "should_save": true,
2521
- "should_training_stop": false
2522
  },
2523
  "attributes": {}
2524
  }
2525
  },
2526
- "total_flos": 3.3978863868862464e+17,
2527
  "train_batch_size": 32,
2528
  "trial_name": null,
2529
  "trial_params": null
 
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
+ "epoch": 4.0,
6
  "eval_steps": 5000,
7
+ "global_step": 161088,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
 
2504
  "eval_samples_per_second": 440.496,
2505
  "eval_steps_per_second": 13.766,
2506
  "step": 160000
2507
+ },
2508
+ {
2509
+ "epoch": 3.985399284862932,
2510
+ "grad_norm": NaN,
2511
+ "learning_rate": 0.0004900742091849483,
2512
+ "loss": 0.0,
2513
+ "step": 160500
2514
+ },
2515
+ {
2516
+ "epoch": 3.997814858959078,
2517
+ "grad_norm": NaN,
2518
+ "learning_rate": 0.0004900742091849483,
2519
+ "loss": 0.0,
2520
+ "step": 161000
2521
  }
2522
  ],
2523
  "logging_steps": 500,
 
2532
  "should_evaluate": false,
2533
  "should_log": false,
2534
  "should_save": true,
2535
+ "should_training_stop": true
2536
  },
2537
  "attributes": {}
2538
  }
2539
  },
2540
+ "total_flos": 3.4209723453526426e+17,
2541
  "train_batch_size": 32,
2542
  "trial_name": null,
2543
  "trial_params": null