gary109's picture
End of training
3a67842
raw
history blame
23.8 kB
{
"best_metric": 2.332979202270508,
"best_model_checkpoint": "ai-light-dance_drums_ft_pretrain_wav2vec2-base-new_onset-rbma13-2_7k/checkpoint-40",
"epoch": 100.0,
"global_step": 100,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 1.0,
"eval_loss": 68.1357650756836,
"eval_runtime": 0.3976,
"eval_samples_per_second": 5.03,
"eval_steps_per_second": 2.515,
"eval_wer": 1.0,
"step": 1
},
{
"epoch": 2.0,
"eval_loss": 68.1357650756836,
"eval_runtime": 0.4117,
"eval_samples_per_second": 4.858,
"eval_steps_per_second": 2.429,
"eval_wer": 1.0,
"step": 2
},
{
"epoch": 3.0,
"eval_loss": 68.1357650756836,
"eval_runtime": 0.4341,
"eval_samples_per_second": 4.607,
"eval_steps_per_second": 2.304,
"eval_wer": 1.0,
"step": 3
},
{
"epoch": 4.0,
"eval_loss": 68.02447509765625,
"eval_runtime": 0.4095,
"eval_samples_per_second": 4.884,
"eval_steps_per_second": 2.442,
"eval_wer": 1.0,
"step": 4
},
{
"epoch": 5.0,
"eval_loss": 67.78739166259766,
"eval_runtime": 0.4118,
"eval_samples_per_second": 4.857,
"eval_steps_per_second": 2.428,
"eval_wer": 1.0,
"step": 5
},
{
"epoch": 6.0,
"eval_loss": 67.45346069335938,
"eval_runtime": 0.4145,
"eval_samples_per_second": 4.825,
"eval_steps_per_second": 2.413,
"eval_wer": 1.0,
"step": 6
},
{
"epoch": 7.0,
"eval_loss": 67.01423645019531,
"eval_runtime": 0.4121,
"eval_samples_per_second": 4.853,
"eval_steps_per_second": 2.427,
"eval_wer": 1.0,
"step": 7
},
{
"epoch": 8.0,
"eval_loss": 67.01423645019531,
"eval_runtime": 0.4095,
"eval_samples_per_second": 4.884,
"eval_steps_per_second": 2.442,
"eval_wer": 1.0,
"step": 8
},
{
"epoch": 9.0,
"eval_loss": 66.4334716796875,
"eval_runtime": 0.4143,
"eval_samples_per_second": 4.828,
"eval_steps_per_second": 2.414,
"eval_wer": 1.0,
"step": 9
},
{
"epoch": 10.0,
"learning_rate": 7e-05,
"loss": 38.4011,
"step": 10
},
{
"epoch": 10.0,
"eval_loss": 65.70997619628906,
"eval_runtime": 0.4061,
"eval_samples_per_second": 4.925,
"eval_steps_per_second": 2.463,
"eval_wer": 1.0,
"step": 10
},
{
"epoch": 11.0,
"eval_loss": 64.820556640625,
"eval_runtime": 0.4105,
"eval_samples_per_second": 4.872,
"eval_steps_per_second": 2.436,
"eval_wer": 1.0,
"step": 11
},
{
"epoch": 12.0,
"eval_loss": 63.82392120361328,
"eval_runtime": 0.4177,
"eval_samples_per_second": 4.788,
"eval_steps_per_second": 2.394,
"eval_wer": 1.0,
"step": 12
},
{
"epoch": 13.0,
"eval_loss": 62.648887634277344,
"eval_runtime": 0.41,
"eval_samples_per_second": 4.878,
"eval_steps_per_second": 2.439,
"eval_wer": 1.0,
"step": 13
},
{
"epoch": 14.0,
"eval_loss": 61.307098388671875,
"eval_runtime": 0.4232,
"eval_samples_per_second": 4.726,
"eval_steps_per_second": 2.363,
"eval_wer": 1.0,
"step": 14
},
{
"epoch": 15.0,
"eval_loss": 59.74273681640625,
"eval_runtime": 0.4053,
"eval_samples_per_second": 4.934,
"eval_steps_per_second": 2.467,
"eval_wer": 1.0,
"step": 15
},
{
"epoch": 16.0,
"eval_loss": 58.02557373046875,
"eval_runtime": 0.4173,
"eval_samples_per_second": 4.793,
"eval_steps_per_second": 2.397,
"eval_wer": 0.98,
"step": 16
},
{
"epoch": 17.0,
"eval_loss": 56.03272247314453,
"eval_runtime": 0.4178,
"eval_samples_per_second": 4.787,
"eval_steps_per_second": 2.394,
"eval_wer": 1.0,
"step": 17
},
{
"epoch": 18.0,
"eval_loss": 53.77244567871094,
"eval_runtime": 0.4131,
"eval_samples_per_second": 4.841,
"eval_steps_per_second": 2.421,
"eval_wer": 1.0,
"step": 18
},
{
"epoch": 19.0,
"eval_loss": 51.255592346191406,
"eval_runtime": 0.4212,
"eval_samples_per_second": 4.748,
"eval_steps_per_second": 2.374,
"eval_wer": 1.0,
"step": 19
},
{
"epoch": 20.0,
"learning_rate": 0.00016999999999999999,
"loss": 33.2554,
"step": 20
},
{
"epoch": 20.0,
"eval_loss": 48.49556350708008,
"eval_runtime": 0.4219,
"eval_samples_per_second": 4.741,
"eval_steps_per_second": 2.37,
"eval_wer": 1.0,
"step": 20
},
{
"epoch": 21.0,
"eval_loss": 45.40376281738281,
"eval_runtime": 0.4164,
"eval_samples_per_second": 4.803,
"eval_steps_per_second": 2.401,
"eval_wer": 1.0,
"step": 21
},
{
"epoch": 22.0,
"eval_loss": 41.99801254272461,
"eval_runtime": 0.4115,
"eval_samples_per_second": 4.86,
"eval_steps_per_second": 2.43,
"eval_wer": 1.0,
"step": 22
},
{
"epoch": 23.0,
"eval_loss": 41.99801254272461,
"eval_runtime": 0.4148,
"eval_samples_per_second": 4.822,
"eval_steps_per_second": 2.411,
"eval_wer": 1.0,
"step": 23
},
{
"epoch": 24.0,
"eval_loss": 38.22810745239258,
"eval_runtime": 0.4152,
"eval_samples_per_second": 4.817,
"eval_steps_per_second": 2.409,
"eval_wer": 1.0,
"step": 24
},
{
"epoch": 25.0,
"eval_loss": 34.15771484375,
"eval_runtime": 0.4229,
"eval_samples_per_second": 4.73,
"eval_steps_per_second": 2.365,
"eval_wer": 1.0,
"step": 25
},
{
"epoch": 26.0,
"eval_loss": 29.798538208007812,
"eval_runtime": 0.4129,
"eval_samples_per_second": 4.843,
"eval_steps_per_second": 2.422,
"eval_wer": 1.0,
"step": 26
},
{
"epoch": 27.0,
"eval_loss": 25.11461067199707,
"eval_runtime": 0.441,
"eval_samples_per_second": 4.535,
"eval_steps_per_second": 2.268,
"eval_wer": 1.0,
"step": 27
},
{
"epoch": 28.0,
"eval_loss": 20.228670120239258,
"eval_runtime": 0.4246,
"eval_samples_per_second": 4.71,
"eval_steps_per_second": 2.355,
"eval_wer": 1.0,
"step": 28
},
{
"epoch": 29.0,
"eval_loss": 15.340555191040039,
"eval_runtime": 0.4159,
"eval_samples_per_second": 4.809,
"eval_steps_per_second": 2.405,
"eval_wer": 1.0,
"step": 29
},
{
"epoch": 30.0,
"learning_rate": 0.00026,
"loss": 15.1206,
"step": 30
},
{
"epoch": 30.0,
"eval_loss": 10.769251823425293,
"eval_runtime": 0.4274,
"eval_samples_per_second": 4.68,
"eval_steps_per_second": 2.34,
"eval_wer": 1.0,
"step": 30
},
{
"epoch": 31.0,
"eval_loss": 6.8997721672058105,
"eval_runtime": 0.4239,
"eval_samples_per_second": 4.718,
"eval_steps_per_second": 2.359,
"eval_wer": 1.0,
"step": 31
},
{
"epoch": 32.0,
"eval_loss": 4.590747356414795,
"eval_runtime": 0.423,
"eval_samples_per_second": 4.728,
"eval_steps_per_second": 2.364,
"eval_wer": 1.0,
"step": 32
},
{
"epoch": 33.0,
"eval_loss": 3.359570026397705,
"eval_runtime": 0.4292,
"eval_samples_per_second": 4.66,
"eval_steps_per_second": 2.33,
"eval_wer": 1.0,
"step": 33
},
{
"epoch": 34.0,
"eval_loss": 2.7710704803466797,
"eval_runtime": 0.4158,
"eval_samples_per_second": 4.81,
"eval_steps_per_second": 2.405,
"eval_wer": 1.0,
"step": 34
},
{
"epoch": 35.0,
"eval_loss": 2.5961642265319824,
"eval_runtime": 0.4262,
"eval_samples_per_second": 4.692,
"eval_steps_per_second": 2.346,
"eval_wer": 1.0,
"step": 35
},
{
"epoch": 36.0,
"eval_loss": 2.900197982788086,
"eval_runtime": 0.4192,
"eval_samples_per_second": 4.771,
"eval_steps_per_second": 2.386,
"eval_wer": 1.0,
"step": 36
},
{
"epoch": 37.0,
"eval_loss": 3.0060811042785645,
"eval_runtime": 0.4182,
"eval_samples_per_second": 4.783,
"eval_steps_per_second": 2.391,
"eval_wer": 1.0,
"step": 37
},
{
"epoch": 38.0,
"eval_loss": 2.817464828491211,
"eval_runtime": 0.4241,
"eval_samples_per_second": 4.716,
"eval_steps_per_second": 2.358,
"eval_wer": 1.0,
"step": 38
},
{
"epoch": 39.0,
"eval_loss": 2.4512133598327637,
"eval_runtime": 0.4212,
"eval_samples_per_second": 4.748,
"eval_steps_per_second": 2.374,
"eval_wer": 1.0,
"step": 39
},
{
"epoch": 40.0,
"learning_rate": 0.00027428571428571427,
"loss": 2.4298,
"step": 40
},
{
"epoch": 40.0,
"eval_loss": 2.332979202270508,
"eval_runtime": 0.4231,
"eval_samples_per_second": 4.727,
"eval_steps_per_second": 2.363,
"eval_wer": 1.0,
"step": 40
},
{
"epoch": 41.0,
"eval_loss": 2.3766188621520996,
"eval_runtime": 0.4235,
"eval_samples_per_second": 4.723,
"eval_steps_per_second": 2.361,
"eval_wer": 1.0,
"step": 41
},
{
"epoch": 42.0,
"eval_loss": 2.5625646114349365,
"eval_runtime": 0.4219,
"eval_samples_per_second": 4.741,
"eval_steps_per_second": 2.37,
"eval_wer": 1.0,
"step": 42
},
{
"epoch": 43.0,
"eval_loss": 2.9632387161254883,
"eval_runtime": 0.4235,
"eval_samples_per_second": 4.722,
"eval_steps_per_second": 2.361,
"eval_wer": 1.0,
"step": 43
},
{
"epoch": 44.0,
"eval_loss": 3.279555082321167,
"eval_runtime": 0.4175,
"eval_samples_per_second": 4.79,
"eval_steps_per_second": 2.395,
"eval_wer": 1.0,
"step": 44
},
{
"epoch": 45.0,
"eval_loss": 3.4015283584594727,
"eval_runtime": 0.4178,
"eval_samples_per_second": 4.787,
"eval_steps_per_second": 2.393,
"eval_wer": 1.0,
"step": 45
},
{
"epoch": 46.0,
"eval_loss": 3.2808432579040527,
"eval_runtime": 0.4209,
"eval_samples_per_second": 4.752,
"eval_steps_per_second": 2.376,
"eval_wer": 1.0,
"step": 46
},
{
"epoch": 47.0,
"eval_loss": 3.2373273372650146,
"eval_runtime": 0.4225,
"eval_samples_per_second": 4.734,
"eval_steps_per_second": 2.367,
"eval_wer": 1.0,
"step": 47
},
{
"epoch": 48.0,
"eval_loss": 3.2461540699005127,
"eval_runtime": 0.4121,
"eval_samples_per_second": 4.853,
"eval_steps_per_second": 2.427,
"eval_wer": 1.0,
"step": 48
},
{
"epoch": 49.0,
"eval_loss": 3.6168460845947266,
"eval_runtime": 0.436,
"eval_samples_per_second": 4.587,
"eval_steps_per_second": 2.293,
"eval_wer": 1.0,
"step": 49
},
{
"epoch": 50.0,
"learning_rate": 0.00023142857142857142,
"loss": 1.6143,
"step": 50
},
{
"epoch": 50.0,
"eval_loss": 3.6624670028686523,
"eval_runtime": 0.4363,
"eval_samples_per_second": 4.584,
"eval_steps_per_second": 2.292,
"eval_wer": 1.0,
"step": 50
},
{
"epoch": 51.0,
"eval_loss": 3.759349822998047,
"eval_runtime": 0.4284,
"eval_samples_per_second": 4.668,
"eval_steps_per_second": 2.334,
"eval_wer": 1.0,
"step": 51
},
{
"epoch": 52.0,
"eval_loss": 3.9326891899108887,
"eval_runtime": 0.4199,
"eval_samples_per_second": 4.763,
"eval_steps_per_second": 2.382,
"eval_wer": 1.0,
"step": 52
},
{
"epoch": 53.0,
"eval_loss": 3.718548536300659,
"eval_runtime": 0.4129,
"eval_samples_per_second": 4.843,
"eval_steps_per_second": 2.422,
"eval_wer": 1.0,
"step": 53
},
{
"epoch": 54.0,
"eval_loss": 3.90997052192688,
"eval_runtime": 0.4206,
"eval_samples_per_second": 4.755,
"eval_steps_per_second": 2.377,
"eval_wer": 1.0,
"step": 54
},
{
"epoch": 55.0,
"eval_loss": 4.312277317047119,
"eval_runtime": 0.4164,
"eval_samples_per_second": 4.803,
"eval_steps_per_second": 2.401,
"eval_wer": 1.0,
"step": 55
},
{
"epoch": 56.0,
"eval_loss": 4.2904229164123535,
"eval_runtime": 0.4192,
"eval_samples_per_second": 4.771,
"eval_steps_per_second": 2.386,
"eval_wer": 1.0,
"step": 56
},
{
"epoch": 57.0,
"eval_loss": 3.951892852783203,
"eval_runtime": 0.4198,
"eval_samples_per_second": 4.765,
"eval_steps_per_second": 2.382,
"eval_wer": 1.0,
"step": 57
},
{
"epoch": 58.0,
"eval_loss": 3.45182728767395,
"eval_runtime": 0.4295,
"eval_samples_per_second": 4.657,
"eval_steps_per_second": 2.328,
"eval_wer": 1.0,
"step": 58
},
{
"epoch": 59.0,
"eval_loss": 3.0196707248687744,
"eval_runtime": 0.4211,
"eval_samples_per_second": 4.75,
"eval_steps_per_second": 2.375,
"eval_wer": 1.0,
"step": 59
},
{
"epoch": 60.0,
"learning_rate": 0.00018857142857142854,
"loss": 1.4054,
"step": 60
},
{
"epoch": 60.0,
"eval_loss": 2.886315107345581,
"eval_runtime": 0.4413,
"eval_samples_per_second": 4.533,
"eval_steps_per_second": 2.266,
"eval_wer": 1.0,
"step": 60
},
{
"epoch": 61.0,
"eval_loss": 2.97536563873291,
"eval_runtime": 0.4417,
"eval_samples_per_second": 4.528,
"eval_steps_per_second": 2.264,
"eval_wer": 1.0,
"step": 61
},
{
"epoch": 62.0,
"eval_loss": 3.299807548522949,
"eval_runtime": 0.426,
"eval_samples_per_second": 4.695,
"eval_steps_per_second": 2.347,
"eval_wer": 1.0,
"step": 62
},
{
"epoch": 63.0,
"eval_loss": 3.871462821960449,
"eval_runtime": 0.4236,
"eval_samples_per_second": 4.721,
"eval_steps_per_second": 2.36,
"eval_wer": 1.0,
"step": 63
},
{
"epoch": 64.0,
"eval_loss": 4.189750671386719,
"eval_runtime": 0.4223,
"eval_samples_per_second": 4.736,
"eval_steps_per_second": 2.368,
"eval_wer": 1.0,
"step": 64
},
{
"epoch": 65.0,
"eval_loss": 4.18125057220459,
"eval_runtime": 0.4138,
"eval_samples_per_second": 4.833,
"eval_steps_per_second": 2.417,
"eval_wer": 1.0,
"step": 65
},
{
"epoch": 66.0,
"eval_loss": 3.9024930000305176,
"eval_runtime": 0.4391,
"eval_samples_per_second": 4.555,
"eval_steps_per_second": 2.277,
"eval_wer": 1.0,
"step": 66
},
{
"epoch": 67.0,
"eval_loss": 3.4319417476654053,
"eval_runtime": 0.4273,
"eval_samples_per_second": 4.681,
"eval_steps_per_second": 2.34,
"eval_wer": 1.0,
"step": 67
},
{
"epoch": 68.0,
"eval_loss": 3.275496482849121,
"eval_runtime": 0.4173,
"eval_samples_per_second": 4.793,
"eval_steps_per_second": 2.396,
"eval_wer": 1.0,
"step": 68
},
{
"epoch": 69.0,
"eval_loss": 3.334933042526245,
"eval_runtime": 0.4221,
"eval_samples_per_second": 4.738,
"eval_steps_per_second": 2.369,
"eval_wer": 1.0,
"step": 69
},
{
"epoch": 70.0,
"learning_rate": 0.0001457142857142857,
"loss": 1.3121,
"step": 70
},
{
"epoch": 70.0,
"eval_loss": 3.548488140106201,
"eval_runtime": 0.4291,
"eval_samples_per_second": 4.661,
"eval_steps_per_second": 2.331,
"eval_wer": 1.0,
"step": 70
},
{
"epoch": 71.0,
"eval_loss": 3.9019012451171875,
"eval_runtime": 0.4171,
"eval_samples_per_second": 4.795,
"eval_steps_per_second": 2.398,
"eval_wer": 1.0,
"step": 71
},
{
"epoch": 72.0,
"eval_loss": 4.081923961639404,
"eval_runtime": 0.4176,
"eval_samples_per_second": 4.789,
"eval_steps_per_second": 2.395,
"eval_wer": 1.0,
"step": 72
},
{
"epoch": 73.0,
"eval_loss": 3.9955055713653564,
"eval_runtime": 0.4176,
"eval_samples_per_second": 4.789,
"eval_steps_per_second": 2.395,
"eval_wer": 1.0,
"step": 73
},
{
"epoch": 74.0,
"eval_loss": 3.70878529548645,
"eval_runtime": 0.423,
"eval_samples_per_second": 4.729,
"eval_steps_per_second": 2.364,
"eval_wer": 1.0,
"step": 74
},
{
"epoch": 75.0,
"eval_loss": 3.295703887939453,
"eval_runtime": 0.4128,
"eval_samples_per_second": 4.846,
"eval_steps_per_second": 2.423,
"eval_wer": 1.0,
"step": 75
},
{
"epoch": 76.0,
"eval_loss": 3.114126682281494,
"eval_runtime": 0.4146,
"eval_samples_per_second": 4.824,
"eval_steps_per_second": 2.412,
"eval_wer": 1.0,
"step": 76
},
{
"epoch": 77.0,
"eval_loss": 3.085181713104248,
"eval_runtime": 0.4266,
"eval_samples_per_second": 4.688,
"eval_steps_per_second": 2.344,
"eval_wer": 1.0,
"step": 77
},
{
"epoch": 78.0,
"eval_loss": 3.187084436416626,
"eval_runtime": 0.4233,
"eval_samples_per_second": 4.725,
"eval_steps_per_second": 2.362,
"eval_wer": 1.0,
"step": 78
},
{
"epoch": 79.0,
"eval_loss": 3.4126548767089844,
"eval_runtime": 0.406,
"eval_samples_per_second": 4.926,
"eval_steps_per_second": 2.463,
"eval_wer": 1.0,
"step": 79
},
{
"epoch": 80.0,
"learning_rate": 0.00010285714285714284,
"loss": 1.2576,
"step": 80
},
{
"epoch": 80.0,
"eval_loss": 3.6913061141967773,
"eval_runtime": 0.4088,
"eval_samples_per_second": 4.892,
"eval_steps_per_second": 2.446,
"eval_wer": 1.0,
"step": 80
},
{
"epoch": 81.0,
"eval_loss": 3.8285651206970215,
"eval_runtime": 0.4079,
"eval_samples_per_second": 4.904,
"eval_steps_per_second": 2.452,
"eval_wer": 1.0,
"step": 81
},
{
"epoch": 82.0,
"eval_loss": 3.815654993057251,
"eval_runtime": 0.4087,
"eval_samples_per_second": 4.894,
"eval_steps_per_second": 2.447,
"eval_wer": 1.0,
"step": 82
},
{
"epoch": 83.0,
"eval_loss": 3.6813836097717285,
"eval_runtime": 0.4035,
"eval_samples_per_second": 4.957,
"eval_steps_per_second": 2.478,
"eval_wer": 1.0,
"step": 83
},
{
"epoch": 84.0,
"eval_loss": 3.44958758354187,
"eval_runtime": 0.4079,
"eval_samples_per_second": 4.903,
"eval_steps_per_second": 2.452,
"eval_wer": 1.0,
"step": 84
},
{
"epoch": 85.0,
"eval_loss": 3.284428119659424,
"eval_runtime": 0.4066,
"eval_samples_per_second": 4.919,
"eval_steps_per_second": 2.46,
"eval_wer": 1.0,
"step": 85
},
{
"epoch": 86.0,
"eval_loss": 3.2253918647766113,
"eval_runtime": 0.405,
"eval_samples_per_second": 4.938,
"eval_steps_per_second": 2.469,
"eval_wer": 1.0,
"step": 86
},
{
"epoch": 87.0,
"eval_loss": 3.268294334411621,
"eval_runtime": 0.4089,
"eval_samples_per_second": 4.892,
"eval_steps_per_second": 2.446,
"eval_wer": 1.0,
"step": 87
},
{
"epoch": 88.0,
"eval_loss": 3.3791449069976807,
"eval_runtime": 0.4084,
"eval_samples_per_second": 4.897,
"eval_steps_per_second": 2.449,
"eval_wer": 1.0,
"step": 88
},
{
"epoch": 89.0,
"eval_loss": 3.550123453140259,
"eval_runtime": 0.4056,
"eval_samples_per_second": 4.931,
"eval_steps_per_second": 2.466,
"eval_wer": 1.0,
"step": 89
},
{
"epoch": 90.0,
"learning_rate": 5.9999999999999995e-05,
"loss": 1.2373,
"step": 90
},
{
"epoch": 90.0,
"eval_loss": 3.662168025970459,
"eval_runtime": 0.4176,
"eval_samples_per_second": 4.789,
"eval_steps_per_second": 2.395,
"eval_wer": 1.0,
"step": 90
},
{
"epoch": 91.0,
"eval_loss": 3.7207443714141846,
"eval_runtime": 0.4173,
"eval_samples_per_second": 4.793,
"eval_steps_per_second": 2.396,
"eval_wer": 1.0,
"step": 91
},
{
"epoch": 92.0,
"eval_loss": 3.6961331367492676,
"eval_runtime": 0.4129,
"eval_samples_per_second": 4.844,
"eval_steps_per_second": 2.422,
"eval_wer": 1.0,
"step": 92
},
{
"epoch": 93.0,
"eval_loss": 3.6098761558532715,
"eval_runtime": 0.4061,
"eval_samples_per_second": 4.925,
"eval_steps_per_second": 2.463,
"eval_wer": 1.0,
"step": 93
},
{
"epoch": 94.0,
"eval_loss": 3.533604860305786,
"eval_runtime": 0.4224,
"eval_samples_per_second": 4.735,
"eval_steps_per_second": 2.368,
"eval_wer": 1.0,
"step": 94
},
{
"epoch": 95.0,
"eval_loss": 3.4341912269592285,
"eval_runtime": 0.4255,
"eval_samples_per_second": 4.701,
"eval_steps_per_second": 2.35,
"eval_wer": 1.0,
"step": 95
},
{
"epoch": 96.0,
"eval_loss": 3.316969871520996,
"eval_runtime": 0.4089,
"eval_samples_per_second": 4.891,
"eval_steps_per_second": 2.445,
"eval_wer": 1.0,
"step": 96
},
{
"epoch": 97.0,
"eval_loss": 3.2624034881591797,
"eval_runtime": 0.4046,
"eval_samples_per_second": 4.943,
"eval_steps_per_second": 2.471,
"eval_wer": 1.0,
"step": 97
},
{
"epoch": 98.0,
"eval_loss": 3.2437386512756348,
"eval_runtime": 0.4006,
"eval_samples_per_second": 4.993,
"eval_steps_per_second": 2.497,
"eval_wer": 1.0,
"step": 98
},
{
"epoch": 99.0,
"eval_loss": 3.259126663208008,
"eval_runtime": 0.4066,
"eval_samples_per_second": 4.919,
"eval_steps_per_second": 2.46,
"eval_wer": 1.0,
"step": 99
},
{
"epoch": 100.0,
"learning_rate": 1.7142857142857142e-05,
"loss": 1.1952,
"step": 100
},
{
"epoch": 100.0,
"eval_loss": 3.292677402496338,
"eval_runtime": 0.4167,
"eval_samples_per_second": 4.799,
"eval_steps_per_second": 2.4,
"eval_wer": 1.0,
"step": 100
},
{
"epoch": 100.0,
"step": 100,
"total_flos": 2.094330789153408e+17,
"train_loss": 9.722876396179199,
"train_runtime": 860.4357,
"train_samples_per_second": 1.86,
"train_steps_per_second": 0.116
}
],
"max_steps": 100,
"num_train_epochs": 100,
"total_flos": 2.094330789153408e+17,
"trial_name": null,
"trial_params": null
}