whisper-small-keyword-spotting / trainer_state.json
qmeeus's picture
End of training
ac75440
{
"best_metric": 0.9998191681735985,
"best_model_checkpoint": "outputs/whisper-small-keyword-spotting/checkpoint-637",
"epoch": 4.988235294117647,
"global_step": 1590,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.03,
"learning_rate": 6.289308176100629e-05,
"loss": 0.6892,
"step": 10
},
{
"epoch": 0.06,
"learning_rate": 0.00012578616352201257,
"loss": 0.6605,
"step": 20
},
{
"epoch": 0.09,
"learning_rate": 0.00018867924528301889,
"loss": 0.6284,
"step": 30
},
{
"epoch": 0.13,
"learning_rate": 0.00025157232704402514,
"loss": 0.577,
"step": 40
},
{
"epoch": 0.16,
"learning_rate": 0.00031446540880503143,
"loss": 0.5128,
"step": 50
},
{
"epoch": 0.19,
"learning_rate": 0.00037735849056603777,
"loss": 0.4114,
"step": 60
},
{
"epoch": 0.22,
"learning_rate": 0.00044025157232704406,
"loss": 0.3091,
"step": 70
},
{
"epoch": 0.25,
"learning_rate": 0.0005031446540880503,
"loss": 0.2469,
"step": 80
},
{
"epoch": 0.28,
"learning_rate": 0.0005660377358490566,
"loss": 0.1943,
"step": 90
},
{
"epoch": 0.31,
"learning_rate": 0.0006289308176100629,
"loss": 0.1421,
"step": 100
},
{
"epoch": 0.35,
"learning_rate": 0.0006918238993710692,
"loss": 0.1142,
"step": 110
},
{
"epoch": 0.38,
"learning_rate": 0.0007547169811320755,
"loss": 0.0857,
"step": 120
},
{
"epoch": 0.41,
"learning_rate": 0.0008176100628930818,
"loss": 0.0679,
"step": 130
},
{
"epoch": 0.44,
"learning_rate": 0.0008805031446540881,
"loss": 0.0663,
"step": 140
},
{
"epoch": 0.47,
"learning_rate": 0.0009433962264150943,
"loss": 0.0443,
"step": 150
},
{
"epoch": 0.5,
"learning_rate": 0.0009993011879804333,
"loss": 0.047,
"step": 160
},
{
"epoch": 0.53,
"learning_rate": 0.000992313067784766,
"loss": 0.0362,
"step": 170
},
{
"epoch": 0.56,
"learning_rate": 0.0009853249475890984,
"loss": 0.0382,
"step": 180
},
{
"epoch": 0.6,
"learning_rate": 0.0009783368273934311,
"loss": 0.0522,
"step": 190
},
{
"epoch": 0.63,
"learning_rate": 0.0009713487071977638,
"loss": 0.022,
"step": 200
},
{
"epoch": 0.66,
"learning_rate": 0.0009643605870020965,
"loss": 0.0408,
"step": 210
},
{
"epoch": 0.69,
"learning_rate": 0.0009573724668064291,
"loss": 0.0392,
"step": 220
},
{
"epoch": 0.72,
"learning_rate": 0.0009503843466107617,
"loss": 0.0289,
"step": 230
},
{
"epoch": 0.75,
"learning_rate": 0.0009433962264150943,
"loss": 0.0249,
"step": 240
},
{
"epoch": 0.78,
"learning_rate": 0.0009364081062194269,
"loss": 0.0434,
"step": 250
},
{
"epoch": 0.82,
"learning_rate": 0.0009294199860237596,
"loss": 0.036,
"step": 260
},
{
"epoch": 0.85,
"learning_rate": 0.0009224318658280922,
"loss": 0.0372,
"step": 270
},
{
"epoch": 0.88,
"learning_rate": 0.0009154437456324249,
"loss": 0.0438,
"step": 280
},
{
"epoch": 0.91,
"learning_rate": 0.0009084556254367576,
"loss": 0.0273,
"step": 290
},
{
"epoch": 0.94,
"learning_rate": 0.0009014675052410902,
"loss": 0.022,
"step": 300
},
{
"epoch": 0.97,
"learning_rate": 0.0008944793850454228,
"loss": 0.0268,
"step": 310
},
{
"epoch": 1.0,
"eval_accuracy": 0.9685352622061483,
"eval_loss": 0.0720464363694191,
"eval_runtime": 218.3559,
"eval_samples_per_second": 25.326,
"eval_steps_per_second": 0.792,
"step": 318
},
{
"epoch": 1.0,
"learning_rate": 0.0008874912648497554,
"loss": 0.0216,
"step": 320
},
{
"epoch": 1.04,
"learning_rate": 0.0008805031446540881,
"loss": 0.0128,
"step": 330
},
{
"epoch": 1.07,
"learning_rate": 0.0008735150244584207,
"loss": 0.0152,
"step": 340
},
{
"epoch": 1.1,
"learning_rate": 0.0008665269042627534,
"loss": 0.0225,
"step": 350
},
{
"epoch": 1.13,
"learning_rate": 0.000859538784067086,
"loss": 0.022,
"step": 360
},
{
"epoch": 1.16,
"learning_rate": 0.0008525506638714185,
"loss": 0.019,
"step": 370
},
{
"epoch": 1.19,
"learning_rate": 0.0008455625436757512,
"loss": 0.0228,
"step": 380
},
{
"epoch": 1.22,
"learning_rate": 0.0008385744234800838,
"loss": 0.0206,
"step": 390
},
{
"epoch": 1.25,
"learning_rate": 0.0008315863032844165,
"loss": 0.0163,
"step": 400
},
{
"epoch": 1.29,
"learning_rate": 0.0008245981830887491,
"loss": 0.0193,
"step": 410
},
{
"epoch": 1.32,
"learning_rate": 0.0008176100628930818,
"loss": 0.0239,
"step": 420
},
{
"epoch": 1.35,
"learning_rate": 0.0008106219426974144,
"loss": 0.0268,
"step": 430
},
{
"epoch": 1.38,
"learning_rate": 0.000803633822501747,
"loss": 0.0201,
"step": 440
},
{
"epoch": 1.41,
"learning_rate": 0.0007966457023060797,
"loss": 0.0159,
"step": 450
},
{
"epoch": 1.44,
"learning_rate": 0.0007896575821104123,
"loss": 0.0171,
"step": 460
},
{
"epoch": 1.47,
"learning_rate": 0.000782669461914745,
"loss": 0.0201,
"step": 470
},
{
"epoch": 1.51,
"learning_rate": 0.0007756813417190776,
"loss": 0.016,
"step": 480
},
{
"epoch": 1.54,
"learning_rate": 0.0007686932215234103,
"loss": 0.0155,
"step": 490
},
{
"epoch": 1.57,
"learning_rate": 0.0007617051013277429,
"loss": 0.0144,
"step": 500
},
{
"epoch": 1.6,
"learning_rate": 0.0007547169811320755,
"loss": 0.0065,
"step": 510
},
{
"epoch": 1.63,
"learning_rate": 0.0007477288609364081,
"loss": 0.0117,
"step": 520
},
{
"epoch": 1.66,
"learning_rate": 0.0007407407407407407,
"loss": 0.0174,
"step": 530
},
{
"epoch": 1.69,
"learning_rate": 0.0007337526205450734,
"loss": 0.0117,
"step": 540
},
{
"epoch": 1.73,
"learning_rate": 0.000726764500349406,
"loss": 0.0165,
"step": 550
},
{
"epoch": 1.76,
"learning_rate": 0.0007197763801537387,
"loss": 0.0152,
"step": 560
},
{
"epoch": 1.79,
"learning_rate": 0.0007127882599580712,
"loss": 0.0111,
"step": 570
},
{
"epoch": 1.82,
"learning_rate": 0.0007058001397624039,
"loss": 0.0119,
"step": 580
},
{
"epoch": 1.85,
"learning_rate": 0.0006988120195667366,
"loss": 0.0134,
"step": 590
},
{
"epoch": 1.88,
"learning_rate": 0.0006918238993710692,
"loss": 0.0166,
"step": 600
},
{
"epoch": 1.91,
"learning_rate": 0.0006848357791754019,
"loss": 0.0271,
"step": 610
},
{
"epoch": 1.95,
"learning_rate": 0.0006778476589797345,
"loss": 0.0186,
"step": 620
},
{
"epoch": 1.98,
"learning_rate": 0.0006708595387840672,
"loss": 0.0195,
"step": 630
},
{
"epoch": 2.0,
"eval_accuracy": 0.9998191681735985,
"eval_loss": 0.01826309971511364,
"eval_runtime": 324.2355,
"eval_samples_per_second": 17.056,
"eval_steps_per_second": 0.534,
"step": 637
},
{
"epoch": 2.01,
"learning_rate": 0.0006638714185883997,
"loss": 0.0159,
"step": 640
},
{
"epoch": 2.04,
"learning_rate": 0.0006568832983927324,
"loss": 0.0125,
"step": 650
},
{
"epoch": 2.07,
"learning_rate": 0.000649895178197065,
"loss": 0.0205,
"step": 660
},
{
"epoch": 2.1,
"learning_rate": 0.0006429070580013976,
"loss": 0.0187,
"step": 670
},
{
"epoch": 2.13,
"learning_rate": 0.0006359189378057303,
"loss": 0.0138,
"step": 680
},
{
"epoch": 2.16,
"learning_rate": 0.0006289308176100629,
"loss": 0.0104,
"step": 690
},
{
"epoch": 2.2,
"learning_rate": 0.0006219426974143956,
"loss": 0.0114,
"step": 700
},
{
"epoch": 2.23,
"learning_rate": 0.0006149545772187281,
"loss": 0.0128,
"step": 710
},
{
"epoch": 2.26,
"learning_rate": 0.0006079664570230608,
"loss": 0.0073,
"step": 720
},
{
"epoch": 2.29,
"learning_rate": 0.0006009783368273934,
"loss": 0.0056,
"step": 730
},
{
"epoch": 2.32,
"learning_rate": 0.000593990216631726,
"loss": 0.0041,
"step": 740
},
{
"epoch": 2.35,
"learning_rate": 0.0005870020964360588,
"loss": 0.0106,
"step": 750
},
{
"epoch": 2.38,
"learning_rate": 0.0005800139762403914,
"loss": 0.0126,
"step": 760
},
{
"epoch": 2.42,
"learning_rate": 0.000573025856044724,
"loss": 0.0123,
"step": 770
},
{
"epoch": 2.45,
"learning_rate": 0.0005660377358490566,
"loss": 0.0117,
"step": 780
},
{
"epoch": 2.48,
"learning_rate": 0.0005590496156533893,
"loss": 0.0162,
"step": 790
},
{
"epoch": 2.51,
"learning_rate": 0.0005520614954577219,
"loss": 0.0107,
"step": 800
},
{
"epoch": 2.54,
"learning_rate": 0.0005450733752620545,
"loss": 0.0156,
"step": 810
},
{
"epoch": 2.57,
"learning_rate": 0.0005380852550663872,
"loss": 0.0108,
"step": 820
},
{
"epoch": 2.6,
"learning_rate": 0.0005310971348707198,
"loss": 0.0096,
"step": 830
},
{
"epoch": 2.64,
"learning_rate": 0.0005241090146750524,
"loss": 0.0139,
"step": 840
},
{
"epoch": 2.67,
"learning_rate": 0.000517120894479385,
"loss": 0.0089,
"step": 850
},
{
"epoch": 2.7,
"learning_rate": 0.0005101327742837177,
"loss": 0.0097,
"step": 860
},
{
"epoch": 2.73,
"learning_rate": 0.0005031446540880503,
"loss": 0.0096,
"step": 870
},
{
"epoch": 2.76,
"learning_rate": 0.000496156533892383,
"loss": 0.0063,
"step": 880
},
{
"epoch": 2.79,
"learning_rate": 0.0004891684136967156,
"loss": 0.0092,
"step": 890
},
{
"epoch": 2.82,
"learning_rate": 0.00048218029350104825,
"loss": 0.0113,
"step": 900
},
{
"epoch": 2.85,
"learning_rate": 0.00047519217330538083,
"loss": 0.0079,
"step": 910
},
{
"epoch": 2.89,
"learning_rate": 0.00046820405310971346,
"loss": 0.0112,
"step": 920
},
{
"epoch": 2.92,
"learning_rate": 0.0004612159329140461,
"loss": 0.0045,
"step": 930
},
{
"epoch": 2.95,
"learning_rate": 0.0004542278127183788,
"loss": 0.0069,
"step": 940
},
{
"epoch": 2.98,
"learning_rate": 0.0004472396925227114,
"loss": 0.0111,
"step": 950
},
{
"epoch": 3.0,
"eval_accuracy": 0.9168173598553345,
"eval_loss": 0.20090103149414062,
"eval_runtime": 323.1789,
"eval_samples_per_second": 17.111,
"eval_steps_per_second": 0.535,
"step": 956
},
{
"epoch": 3.01,
"learning_rate": 0.00044025157232704406,
"loss": 0.0061,
"step": 960
},
{
"epoch": 3.04,
"learning_rate": 0.0004332634521313767,
"loss": 0.0069,
"step": 970
},
{
"epoch": 3.07,
"learning_rate": 0.0004262753319357093,
"loss": 0.017,
"step": 980
},
{
"epoch": 3.11,
"learning_rate": 0.0004192872117400419,
"loss": 0.0054,
"step": 990
},
{
"epoch": 3.14,
"learning_rate": 0.00041229909154437454,
"loss": 0.0112,
"step": 1000
},
{
"epoch": 3.17,
"learning_rate": 0.0004053109713487072,
"loss": 0.0132,
"step": 1010
},
{
"epoch": 3.2,
"learning_rate": 0.00039832285115303987,
"loss": 0.0105,
"step": 1020
},
{
"epoch": 3.23,
"learning_rate": 0.0003913347309573725,
"loss": 0.0121,
"step": 1030
},
{
"epoch": 3.26,
"learning_rate": 0.00038434661076170514,
"loss": 0.0077,
"step": 1040
},
{
"epoch": 3.29,
"learning_rate": 0.00037735849056603777,
"loss": 0.0039,
"step": 1050
},
{
"epoch": 3.33,
"learning_rate": 0.00037037037037037035,
"loss": 0.0074,
"step": 1060
},
{
"epoch": 3.36,
"learning_rate": 0.000363382250174703,
"loss": 0.0107,
"step": 1070
},
{
"epoch": 3.39,
"learning_rate": 0.0003563941299790356,
"loss": 0.0092,
"step": 1080
},
{
"epoch": 3.42,
"learning_rate": 0.0003494060097833683,
"loss": 0.0032,
"step": 1090
},
{
"epoch": 3.45,
"learning_rate": 0.00034241788958770095,
"loss": 0.0145,
"step": 1100
},
{
"epoch": 3.48,
"learning_rate": 0.0003354297693920336,
"loss": 0.0044,
"step": 1110
},
{
"epoch": 3.51,
"learning_rate": 0.0003284416491963662,
"loss": 0.0059,
"step": 1120
},
{
"epoch": 3.55,
"learning_rate": 0.0003214535290006988,
"loss": 0.0052,
"step": 1130
},
{
"epoch": 3.58,
"learning_rate": 0.00031446540880503143,
"loss": 0.0101,
"step": 1140
},
{
"epoch": 3.61,
"learning_rate": 0.00030747728860936407,
"loss": 0.0125,
"step": 1150
},
{
"epoch": 3.64,
"learning_rate": 0.0003004891684136967,
"loss": 0.0097,
"step": 1160
},
{
"epoch": 3.67,
"learning_rate": 0.0002935010482180294,
"loss": 0.0075,
"step": 1170
},
{
"epoch": 3.7,
"learning_rate": 0.000286512928022362,
"loss": 0.0057,
"step": 1180
},
{
"epoch": 3.73,
"learning_rate": 0.00027952480782669466,
"loss": 0.008,
"step": 1190
},
{
"epoch": 3.76,
"learning_rate": 0.00027253668763102724,
"loss": 0.0081,
"step": 1200
},
{
"epoch": 3.8,
"learning_rate": 0.0002655485674353599,
"loss": 0.0046,
"step": 1210
},
{
"epoch": 3.83,
"learning_rate": 0.0002585604472396925,
"loss": 0.0087,
"step": 1220
},
{
"epoch": 3.86,
"learning_rate": 0.00025157232704402514,
"loss": 0.0067,
"step": 1230
},
{
"epoch": 3.89,
"learning_rate": 0.0002445842068483578,
"loss": 0.0062,
"step": 1240
},
{
"epoch": 3.92,
"learning_rate": 0.00023759608665269041,
"loss": 0.0037,
"step": 1250
},
{
"epoch": 3.95,
"learning_rate": 0.00023060796645702305,
"loss": 0.006,
"step": 1260
},
{
"epoch": 3.98,
"learning_rate": 0.0002236198462613557,
"loss": 0.0065,
"step": 1270
},
{
"epoch": 4.0,
"eval_accuracy": 0.8544303797468354,
"eval_loss": 0.28469616174697876,
"eval_runtime": 254.8847,
"eval_samples_per_second": 21.696,
"eval_steps_per_second": 0.679,
"step": 1275
},
{
"epoch": 4.02,
"learning_rate": 0.00021663172606568835,
"loss": 0.0092,
"step": 1280
},
{
"epoch": 4.05,
"learning_rate": 0.00020964360587002095,
"loss": 0.0068,
"step": 1290
},
{
"epoch": 4.08,
"learning_rate": 0.0002026554856743536,
"loss": 0.0058,
"step": 1300
},
{
"epoch": 4.11,
"learning_rate": 0.00019566736547868625,
"loss": 0.0083,
"step": 1310
},
{
"epoch": 4.14,
"learning_rate": 0.00018867924528301889,
"loss": 0.0049,
"step": 1320
},
{
"epoch": 4.17,
"learning_rate": 0.0001816911250873515,
"loss": 0.0085,
"step": 1330
},
{
"epoch": 4.2,
"learning_rate": 0.00017470300489168416,
"loss": 0.0071,
"step": 1340
},
{
"epoch": 4.24,
"learning_rate": 0.0001677148846960168,
"loss": 0.0047,
"step": 1350
},
{
"epoch": 4.27,
"learning_rate": 0.0001607267645003494,
"loss": 0.0073,
"step": 1360
},
{
"epoch": 4.3,
"learning_rate": 0.00015373864430468203,
"loss": 0.0051,
"step": 1370
},
{
"epoch": 4.33,
"learning_rate": 0.0001467505241090147,
"loss": 0.0061,
"step": 1380
},
{
"epoch": 4.36,
"learning_rate": 0.00013976240391334733,
"loss": 0.0043,
"step": 1390
},
{
"epoch": 4.39,
"learning_rate": 0.00013277428371767994,
"loss": 0.0046,
"step": 1400
},
{
"epoch": 4.42,
"learning_rate": 0.00012578616352201257,
"loss": 0.0102,
"step": 1410
},
{
"epoch": 4.45,
"learning_rate": 0.00011879804332634521,
"loss": 0.0061,
"step": 1420
},
{
"epoch": 4.49,
"learning_rate": 0.00011180992313067786,
"loss": 0.0089,
"step": 1430
},
{
"epoch": 4.52,
"learning_rate": 0.00010482180293501048,
"loss": 0.0038,
"step": 1440
},
{
"epoch": 4.55,
"learning_rate": 9.783368273934313e-05,
"loss": 0.0033,
"step": 1450
},
{
"epoch": 4.58,
"learning_rate": 9.084556254367575e-05,
"loss": 0.0078,
"step": 1460
},
{
"epoch": 4.61,
"learning_rate": 8.38574423480084e-05,
"loss": 0.006,
"step": 1470
},
{
"epoch": 4.64,
"learning_rate": 7.686932215234102e-05,
"loss": 0.0077,
"step": 1480
},
{
"epoch": 4.67,
"learning_rate": 6.988120195667366e-05,
"loss": 0.005,
"step": 1490
},
{
"epoch": 4.71,
"learning_rate": 6.289308176100629e-05,
"loss": 0.005,
"step": 1500
},
{
"epoch": 4.74,
"learning_rate": 5.590496156533893e-05,
"loss": 0.0046,
"step": 1510
},
{
"epoch": 4.77,
"learning_rate": 4.891684136967156e-05,
"loss": 0.0044,
"step": 1520
},
{
"epoch": 4.8,
"learning_rate": 4.19287211740042e-05,
"loss": 0.0051,
"step": 1530
},
{
"epoch": 4.83,
"learning_rate": 3.494060097833683e-05,
"loss": 0.0078,
"step": 1540
},
{
"epoch": 4.86,
"learning_rate": 2.7952480782669464e-05,
"loss": 0.0021,
"step": 1550
},
{
"epoch": 4.89,
"learning_rate": 2.09643605870021e-05,
"loss": 0.0043,
"step": 1560
},
{
"epoch": 4.93,
"learning_rate": 1.3976240391334732e-05,
"loss": 0.0041,
"step": 1570
},
{
"epoch": 4.96,
"learning_rate": 6.988120195667366e-06,
"loss": 0.0049,
"step": 1580
},
{
"epoch": 4.99,
"learning_rate": 0.0,
"loss": 0.0086,
"step": 1590
},
{
"epoch": 4.99,
"eval_accuracy": 0.9168173598553345,
"eval_loss": 0.18948502838611603,
"eval_runtime": 224.532,
"eval_samples_per_second": 24.629,
"eval_steps_per_second": 0.77,
"step": 1590
},
{
"epoch": 4.99,
"step": 1590,
"total_flos": 2.5540381823039996e+19,
"train_loss": 0.042007273906525575,
"train_runtime": 10719.7329,
"train_samples_per_second": 19.016,
"train_steps_per_second": 0.148
}
],
"max_steps": 1590,
"num_train_epochs": 5,
"total_flos": 2.5540381823039996e+19,
"trial_name": null,
"trial_params": null
}