lsnoo's picture
Uploading trained model
2607071
raw
history blame
12.7 kB
{
"best_metric": 1.0679948329925537,
"best_model_checkpoint": "asd_pronunciation_w2v_xlsr-300m/checkpoint-99",
"epoch": 49.977777777777774,
"global_step": 550,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.98,
"eval_accuracy": 0.33144742250442505,
"eval_loss": 1.5670545101165771,
"eval_runtime": 62.8235,
"eval_samples_per_second": 33.761,
"eval_steps_per_second": 1.066,
"step": 11
},
{
"epoch": 1.98,
"eval_accuracy": 0.39273926615715027,
"eval_loss": 1.3582004308700562,
"eval_runtime": 62.2914,
"eval_samples_per_second": 34.05,
"eval_steps_per_second": 1.076,
"step": 22
},
{
"epoch": 2.98,
"eval_accuracy": 0.380952388048172,
"eval_loss": 1.3765946626663208,
"eval_runtime": 63.9238,
"eval_samples_per_second": 33.18,
"eval_steps_per_second": 1.048,
"step": 33
},
{
"epoch": 3.98,
"eval_accuracy": 0.4186704456806183,
"eval_loss": 1.3837833404541016,
"eval_runtime": 63.6397,
"eval_samples_per_second": 33.328,
"eval_steps_per_second": 1.053,
"step": 44
},
{
"epoch": 4.98,
"eval_accuracy": 0.3663366436958313,
"eval_loss": 1.5986249446868896,
"eval_runtime": 63.7365,
"eval_samples_per_second": 33.278,
"eval_steps_per_second": 1.051,
"step": 55
},
{
"epoch": 5.98,
"eval_accuracy": 0.42904290556907654,
"eval_loss": 1.8822154998779297,
"eval_runtime": 63.6958,
"eval_samples_per_second": 33.299,
"eval_steps_per_second": 1.052,
"step": 66
},
{
"epoch": 6.98,
"eval_accuracy": 0.34983497858047485,
"eval_loss": 1.865776538848877,
"eval_runtime": 63.1847,
"eval_samples_per_second": 33.568,
"eval_steps_per_second": 1.06,
"step": 77
},
{
"epoch": 7.98,
"eval_accuracy": 0.4502592980861664,
"eval_loss": 1.966166377067566,
"eval_runtime": 63.6503,
"eval_samples_per_second": 33.323,
"eval_steps_per_second": 1.053,
"step": 88
},
{
"epoch": 8.98,
"eval_accuracy": 0.6855257153511047,
"eval_loss": 1.0679948329925537,
"eval_runtime": 63.1701,
"eval_samples_per_second": 33.576,
"eval_steps_per_second": 1.061,
"step": 99
},
{
"epoch": 9.98,
"eval_accuracy": 0.6539368033409119,
"eval_loss": 1.1463075876235962,
"eval_runtime": 63.3309,
"eval_samples_per_second": 33.491,
"eval_steps_per_second": 1.058,
"step": 110
},
{
"epoch": 10.98,
"eval_accuracy": 0.7157001495361328,
"eval_loss": 1.1053473949432373,
"eval_runtime": 63.7039,
"eval_samples_per_second": 33.295,
"eval_steps_per_second": 1.052,
"step": 121
},
{
"epoch": 11.98,
"eval_accuracy": 0.5836869478225708,
"eval_loss": 1.6300278902053833,
"eval_runtime": 63.4359,
"eval_samples_per_second": 33.435,
"eval_steps_per_second": 1.056,
"step": 132
},
{
"epoch": 12.98,
"eval_accuracy": 0.697312593460083,
"eval_loss": 1.190132975578308,
"eval_runtime": 62.8623,
"eval_samples_per_second": 33.74,
"eval_steps_per_second": 1.066,
"step": 143
},
{
"epoch": 13.98,
"eval_accuracy": 0.5761433243751526,
"eval_loss": 1.677795171737671,
"eval_runtime": 63.1508,
"eval_samples_per_second": 33.586,
"eval_steps_per_second": 1.061,
"step": 154
},
{
"epoch": 14.98,
"eval_accuracy": 0.7072135806083679,
"eval_loss": 1.2646026611328125,
"eval_runtime": 64.2737,
"eval_samples_per_second": 33.0,
"eval_steps_per_second": 1.042,
"step": 165
},
{
"epoch": 15.98,
"eval_accuracy": 0.5535125136375427,
"eval_loss": 1.866857647895813,
"eval_runtime": 63.6272,
"eval_samples_per_second": 33.335,
"eval_steps_per_second": 1.053,
"step": 176
},
{
"epoch": 16.98,
"eval_accuracy": 0.5700141191482544,
"eval_loss": 1.911484956741333,
"eval_runtime": 63.0574,
"eval_samples_per_second": 33.636,
"eval_steps_per_second": 1.063,
"step": 187
},
{
"epoch": 17.98,
"eval_accuracy": 0.608203649520874,
"eval_loss": 1.748372197151184,
"eval_runtime": 63.9869,
"eval_samples_per_second": 33.147,
"eval_steps_per_second": 1.047,
"step": 198
},
{
"epoch": 18.98,
"eval_accuracy": 0.6209335327148438,
"eval_loss": 1.736160159111023,
"eval_runtime": 63.5615,
"eval_samples_per_second": 33.369,
"eval_steps_per_second": 1.054,
"step": 209
},
{
"epoch": 19.98,
"eval_accuracy": 0.5535125136375427,
"eval_loss": 2.0504212379455566,
"eval_runtime": 63.6231,
"eval_samples_per_second": 33.337,
"eval_steps_per_second": 1.053,
"step": 220
},
{
"epoch": 20.98,
"eval_accuracy": 0.6520509123802185,
"eval_loss": 1.6594103574752808,
"eval_runtime": 63.6587,
"eval_samples_per_second": 33.318,
"eval_steps_per_second": 1.052,
"step": 231
},
{
"epoch": 21.98,
"eval_accuracy": 0.6779820919036865,
"eval_loss": 1.5675663948059082,
"eval_runtime": 64.5637,
"eval_samples_per_second": 32.851,
"eval_steps_per_second": 1.038,
"step": 242
},
{
"epoch": 22.98,
"eval_accuracy": 0.6737387776374817,
"eval_loss": 1.6316275596618652,
"eval_runtime": 63.4257,
"eval_samples_per_second": 33.441,
"eval_steps_per_second": 1.056,
"step": 253
},
{
"epoch": 23.98,
"eval_accuracy": 0.5983026623725891,
"eval_loss": 1.9427396059036255,
"eval_runtime": 63.6629,
"eval_samples_per_second": 33.316,
"eval_steps_per_second": 1.052,
"step": 264
},
{
"epoch": 24.98,
"eval_accuracy": 0.6619518995285034,
"eval_loss": 1.7251100540161133,
"eval_runtime": 63.8986,
"eval_samples_per_second": 33.193,
"eval_steps_per_second": 1.049,
"step": 275
},
{
"epoch": 25.98,
"eval_accuracy": 0.7133427858352661,
"eval_loss": 1.4861173629760742,
"eval_runtime": 63.105,
"eval_samples_per_second": 33.611,
"eval_steps_per_second": 1.062,
"step": 286
},
{
"epoch": 26.98,
"eval_accuracy": 0.6388496160507202,
"eval_loss": 1.8551920652389526,
"eval_runtime": 63.3692,
"eval_samples_per_second": 33.471,
"eval_steps_per_second": 1.057,
"step": 297
},
{
"epoch": 27.98,
"eval_accuracy": 0.6218764781951904,
"eval_loss": 1.9755550622940063,
"eval_runtime": 63.7438,
"eval_samples_per_second": 33.274,
"eval_steps_per_second": 1.051,
"step": 308
},
{
"epoch": 28.98,
"eval_accuracy": 0.5879302024841309,
"eval_loss": 2.2480831146240234,
"eval_runtime": 62.9459,
"eval_samples_per_second": 33.696,
"eval_steps_per_second": 1.064,
"step": 319
},
{
"epoch": 29.98,
"eval_accuracy": 0.6176331639289856,
"eval_loss": 1.9868534803390503,
"eval_runtime": 63.9115,
"eval_samples_per_second": 33.187,
"eval_steps_per_second": 1.048,
"step": 330
},
{
"epoch": 30.98,
"eval_accuracy": 0.6991984844207764,
"eval_loss": 1.6001139879226685,
"eval_runtime": 62.9701,
"eval_samples_per_second": 33.683,
"eval_steps_per_second": 1.064,
"step": 341
},
{
"epoch": 31.98,
"eval_accuracy": 0.6562942266464233,
"eval_loss": 1.80760657787323,
"eval_runtime": 64.5355,
"eval_samples_per_second": 32.866,
"eval_steps_per_second": 1.038,
"step": 352
},
{
"epoch": 32.98,
"eval_accuracy": 0.6539368033409119,
"eval_loss": 1.8803389072418213,
"eval_runtime": 63.8068,
"eval_samples_per_second": 33.241,
"eval_steps_per_second": 1.05,
"step": 363
},
{
"epoch": 33.98,
"eval_accuracy": 0.6308345198631287,
"eval_loss": 1.9857879877090454,
"eval_runtime": 63.5545,
"eval_samples_per_second": 33.373,
"eval_steps_per_second": 1.054,
"step": 374
},
{
"epoch": 34.98,
"eval_accuracy": 0.6228194236755371,
"eval_loss": 2.016218900680542,
"eval_runtime": 63.1093,
"eval_samples_per_second": 33.608,
"eval_steps_per_second": 1.062,
"step": 385
},
{
"epoch": 35.98,
"eval_accuracy": 0.6247053146362305,
"eval_loss": 1.9806338548660278,
"eval_runtime": 63.643,
"eval_samples_per_second": 33.327,
"eval_steps_per_second": 1.053,
"step": 396
},
{
"epoch": 36.98,
"eval_accuracy": 0.6148043274879456,
"eval_loss": 2.0684027671813965,
"eval_runtime": 63.1391,
"eval_samples_per_second": 33.593,
"eval_steps_per_second": 1.061,
"step": 407
},
{
"epoch": 37.98,
"eval_accuracy": 0.6826968193054199,
"eval_loss": 1.7208051681518555,
"eval_runtime": 63.3764,
"eval_samples_per_second": 33.467,
"eval_steps_per_second": 1.057,
"step": 418
},
{
"epoch": 38.98,
"eval_accuracy": 0.6676096320152283,
"eval_loss": 1.7736769914627075,
"eval_runtime": 63.0716,
"eval_samples_per_second": 33.628,
"eval_steps_per_second": 1.062,
"step": 429
},
{
"epoch": 39.98,
"eval_accuracy": 0.6940122842788696,
"eval_loss": 1.7225761413574219,
"eval_runtime": 64.0078,
"eval_samples_per_second": 33.137,
"eval_steps_per_second": 1.047,
"step": 440
},
{
"epoch": 40.98,
"eval_accuracy": 0.606789231300354,
"eval_loss": 2.0414962768554688,
"eval_runtime": 63.4689,
"eval_samples_per_second": 33.418,
"eval_steps_per_second": 1.056,
"step": 451
},
{
"epoch": 41.98,
"eval_accuracy": 0.6214050054550171,
"eval_loss": 2.019111394882202,
"eval_runtime": 63.5976,
"eval_samples_per_second": 33.35,
"eval_steps_per_second": 1.053,
"step": 462
},
{
"epoch": 42.98,
"eval_accuracy": 0.6379066705703735,
"eval_loss": 1.947460412979126,
"eval_runtime": 63.6957,
"eval_samples_per_second": 33.299,
"eval_steps_per_second": 1.052,
"step": 473
},
{
"epoch": 43.98,
"eval_accuracy": 0.669966995716095,
"eval_loss": 1.8389097452163696,
"eval_runtime": 64.1144,
"eval_samples_per_second": 33.081,
"eval_steps_per_second": 1.045,
"step": 484
},
{
"epoch": 44.98,
"eval_accuracy": 0.6666666865348816,
"eval_loss": 1.814638376235962,
"eval_runtime": 63.7225,
"eval_samples_per_second": 33.285,
"eval_steps_per_second": 1.051,
"step": 495
},
{
"epoch": 45.44,
"learning_rate": 3.03030303030303e-05,
"loss": 0.3177,
"step": 500
},
{
"epoch": 45.98,
"eval_accuracy": 0.6718528866767883,
"eval_loss": 1.79548978805542,
"eval_runtime": 63.2169,
"eval_samples_per_second": 33.551,
"eval_steps_per_second": 1.06,
"step": 506
},
{
"epoch": 46.98,
"eval_accuracy": 0.65865159034729,
"eval_loss": 1.9061682224273682,
"eval_runtime": 64.47,
"eval_samples_per_second": 32.899,
"eval_steps_per_second": 1.039,
"step": 517
},
{
"epoch": 47.98,
"eval_accuracy": 0.6643092632293701,
"eval_loss": 1.8877029418945312,
"eval_runtime": 63.3351,
"eval_samples_per_second": 33.489,
"eval_steps_per_second": 1.058,
"step": 528
},
{
"epoch": 48.98,
"eval_accuracy": 0.6694955229759216,
"eval_loss": 1.8578468561172485,
"eval_runtime": 63.6561,
"eval_samples_per_second": 33.32,
"eval_steps_per_second": 1.053,
"step": 539
},
{
"epoch": 49.98,
"eval_accuracy": 0.6690240502357483,
"eval_loss": 1.8590630292892456,
"eval_runtime": 62.2809,
"eval_samples_per_second": 34.055,
"eval_steps_per_second": 1.076,
"step": 550
}
],
"max_steps": 550,
"num_train_epochs": 50,
"total_flos": 1.6031529967362595e+20,
"trial_name": null,
"trial_params": null
}