| { |
| "best_metric": null, |
| "best_model_checkpoint": null, |
| "epoch": 25.12562814070352, |
| "global_step": 2500, |
| "is_hyper_param_search": false, |
| "is_local_process_zero": true, |
| "is_world_process_zero": true, |
| "log_history": [ |
| { |
| "epoch": 0.99, |
| "eval_loss": 2.7764203548431396, |
| "eval_runtime": 34.2112, |
| "eval_samples_per_second": 24.612, |
| "eval_steps_per_second": 3.098, |
| "eval_wer": 1.0, |
| "step": 99 |
| }, |
| { |
| "epoch": 2.0, |
| "eval_loss": 2.762573003768921, |
| "eval_runtime": 33.9987, |
| "eval_samples_per_second": 24.766, |
| "eval_steps_per_second": 3.118, |
| "eval_wer": 1.0, |
| "step": 199 |
| }, |
| { |
| "epoch": 2.99, |
| "eval_loss": 1.5485457181930542, |
| "eval_runtime": 34.1904, |
| "eval_samples_per_second": 24.627, |
| "eval_steps_per_second": 3.1, |
| "eval_wer": 0.9983126781870018, |
| "step": 298 |
| }, |
| { |
| "epoch": 4.0, |
| "eval_loss": 0.4536263048648834, |
| "eval_runtime": 34.3008, |
| "eval_samples_per_second": 24.548, |
| "eval_steps_per_second": 3.09, |
| "eval_wer": 0.6440914644789667, |
| "step": 398 |
| }, |
| { |
| "epoch": 4.99, |
| "eval_loss": 0.32973894476890564, |
| "eval_runtime": 34.0188, |
| "eval_samples_per_second": 24.751, |
| "eval_steps_per_second": 3.116, |
| "eval_wer": 0.5054983417699423, |
| "step": 497 |
| }, |
| { |
| "epoch": 5.03, |
| "learning_rate": 0.0002497979797979798, |
| "loss": 2.1303, |
| "step": 500 |
| }, |
| { |
| "epoch": 6.0, |
| "eval_loss": 0.27073708176612854, |
| "eval_runtime": 33.9387, |
| "eval_samples_per_second": 24.809, |
| "eval_steps_per_second": 3.123, |
| "eval_wer": 0.3777273520684238, |
| "step": 597 |
| }, |
| { |
| "epoch": 6.99, |
| "eval_loss": 0.2596016526222229, |
| "eval_runtime": 33.9444, |
| "eval_samples_per_second": 24.805, |
| "eval_steps_per_second": 3.123, |
| "eval_wer": 0.3815092802699715, |
| "step": 696 |
| }, |
| { |
| "epoch": 8.0, |
| "eval_loss": 0.25216805934906006, |
| "eval_runtime": 33.8461, |
| "eval_samples_per_second": 24.877, |
| "eval_steps_per_second": 3.132, |
| "eval_wer": 0.2978413917495782, |
| "step": 796 |
| }, |
| { |
| "epoch": 8.99, |
| "eval_loss": 0.22613081336021423, |
| "eval_runtime": 33.8906, |
| "eval_samples_per_second": 24.845, |
| "eval_steps_per_second": 3.128, |
| "eval_wer": 0.30965264444056556, |
| "step": 895 |
| }, |
| { |
| "epoch": 10.0, |
| "eval_loss": 0.23950138688087463, |
| "eval_runtime": 33.9858, |
| "eval_samples_per_second": 24.775, |
| "eval_steps_per_second": 3.119, |
| "eval_wer": 0.2646767905975447, |
| "step": 995 |
| }, |
| { |
| "epoch": 10.05, |
| "learning_rate": 0.00019929292929292926, |
| "loss": 0.2057, |
| "step": 1000 |
| }, |
| { |
| "epoch": 10.99, |
| "eval_loss": 0.21791674196720123, |
| "eval_runtime": 33.9224, |
| "eval_samples_per_second": 24.821, |
| "eval_steps_per_second": 3.125, |
| "eval_wer": 0.2613603304823413, |
| "step": 1094 |
| }, |
| { |
| "epoch": 12.0, |
| "eval_loss": 0.21110226213932037, |
| "eval_runtime": 33.8358, |
| "eval_samples_per_second": 24.885, |
| "eval_steps_per_second": 3.133, |
| "eval_wer": 0.25903299005061964, |
| "step": 1194 |
| }, |
| { |
| "epoch": 12.99, |
| "eval_loss": 0.22310343384742737, |
| "eval_runtime": 33.7767, |
| "eval_samples_per_second": 24.928, |
| "eval_steps_per_second": 3.138, |
| "eval_wer": 0.25368010705765986, |
| "step": 1293 |
| }, |
| { |
| "epoch": 14.0, |
| "eval_loss": 0.2454575151205063, |
| "eval_runtime": 33.8201, |
| "eval_samples_per_second": 24.896, |
| "eval_steps_per_second": 3.134, |
| "eval_wer": 0.2483854075754931, |
| "step": 1393 |
| }, |
| { |
| "epoch": 14.99, |
| "eval_loss": 0.24834834039211273, |
| "eval_runtime": 33.7913, |
| "eval_samples_per_second": 24.918, |
| "eval_steps_per_second": 3.137, |
| "eval_wer": 0.23663233839529876, |
| "step": 1492 |
| }, |
| { |
| "epoch": 15.08, |
| "learning_rate": 0.00014878787878787875, |
| "loss": 0.0945, |
| "step": 1500 |
| }, |
| { |
| "epoch": 16.0, |
| "eval_loss": 0.259757936000824, |
| "eval_runtime": 33.8499, |
| "eval_samples_per_second": 24.875, |
| "eval_steps_per_second": 3.131, |
| "eval_wer": 0.22348286495607145, |
| "step": 1592 |
| }, |
| { |
| "epoch": 16.99, |
| "eval_loss": 0.26361608505249023, |
| "eval_runtime": 33.9334, |
| "eval_samples_per_second": 24.813, |
| "eval_steps_per_second": 3.124, |
| "eval_wer": 0.21935183568976552, |
| "step": 1691 |
| }, |
| { |
| "epoch": 18.0, |
| "eval_loss": 0.2598336637020111, |
| "eval_runtime": 33.8712, |
| "eval_samples_per_second": 24.859, |
| "eval_steps_per_second": 3.13, |
| "eval_wer": 0.21964275324373073, |
| "step": 1791 |
| }, |
| { |
| "epoch": 18.99, |
| "eval_loss": 0.24791987240314484, |
| "eval_runtime": 33.8138, |
| "eval_samples_per_second": 24.901, |
| "eval_steps_per_second": 3.135, |
| "eval_wer": 0.20882062023622505, |
| "step": 1890 |
| }, |
| { |
| "epoch": 20.0, |
| "eval_loss": 0.24469724297523499, |
| "eval_runtime": 33.9448, |
| "eval_samples_per_second": 24.805, |
| "eval_steps_per_second": 3.123, |
| "eval_wer": 0.2091697213009833, |
| "step": 1990 |
| }, |
| { |
| "epoch": 20.1, |
| "learning_rate": 9.828282828282828e-05, |
| "loss": 0.0567, |
| "step": 2000 |
| }, |
| { |
| "epoch": 20.99, |
| "eval_loss": 0.25630325078964233, |
| "eval_runtime": 33.677, |
| "eval_samples_per_second": 25.002, |
| "eval_steps_per_second": 3.148, |
| "eval_wer": 0.20463140745912609, |
| "step": 2089 |
| }, |
| { |
| "epoch": 22.0, |
| "eval_loss": 0.2675672173500061, |
| "eval_runtime": 33.7312, |
| "eval_samples_per_second": 24.962, |
| "eval_steps_per_second": 3.142, |
| "eval_wer": 0.198871239890615, |
| "step": 2189 |
| }, |
| { |
| "epoch": 22.99, |
| "eval_loss": 0.25741901993751526, |
| "eval_runtime": 33.6669, |
| "eval_samples_per_second": 25.01, |
| "eval_steps_per_second": 3.148, |
| "eval_wer": 0.19951125850933846, |
| "step": 2288 |
| }, |
| { |
| "epoch": 24.0, |
| "eval_loss": 0.2615770101547241, |
| "eval_runtime": 33.8091, |
| "eval_samples_per_second": 24.905, |
| "eval_steps_per_second": 3.135, |
| "eval_wer": 0.1961947983941351, |
| "step": 2388 |
| }, |
| { |
| "epoch": 24.99, |
| "eval_loss": 0.257935494184494, |
| "eval_runtime": 33.8705, |
| "eval_samples_per_second": 24.859, |
| "eval_steps_per_second": 3.13, |
| "eval_wer": 0.1956129632862047, |
| "step": 2487 |
| }, |
| { |
| "epoch": 25.13, |
| "learning_rate": 4.777777777777778e-05, |
| "loss": 0.0418, |
| "step": 2500 |
| } |
| ], |
| "max_steps": 2970, |
| "num_train_epochs": 30, |
| "total_flos": 6.454758338809764e+19, |
| "trial_name": null, |
| "trial_params": null |
| } |
|
|