|
{ |
|
"best_metric": 0.6930379746835443, |
|
"best_model_checkpoint": "/scratch/mrahma45/pixel/finetuned_models/canine/canine-base-finetuned-masakhaner-ibo/checkpoint-4000", |
|
"epoch": 77.14285714285714, |
|
"global_step": 5400, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 2.86, |
|
"eval_accuracy_score": 0.9000158704967466, |
|
"eval_f1": 0.49961449498843485, |
|
"eval_loss": 0.331222265958786, |
|
"eval_precision": 0.4648493543758967, |
|
"eval_recall": 0.54, |
|
"eval_runtime": 2.4906, |
|
"eval_samples_per_second": 128.481, |
|
"eval_steps_per_second": 16.06, |
|
"step": 200 |
|
}, |
|
{ |
|
"epoch": 5.71, |
|
"eval_accuracy_score": 0.9298524043802571, |
|
"eval_f1": 0.6056224899598394, |
|
"eval_loss": 0.24286046624183655, |
|
"eval_precision": 0.5844961240310077, |
|
"eval_recall": 0.6283333333333333, |
|
"eval_runtime": 2.4939, |
|
"eval_samples_per_second": 128.313, |
|
"eval_steps_per_second": 16.039, |
|
"step": 400 |
|
}, |
|
{ |
|
"epoch": 7.14, |
|
"learning_rate": 4.865771812080537e-05, |
|
"loss": 0.3252, |
|
"step": 500 |
|
}, |
|
{ |
|
"epoch": 8.57, |
|
"eval_accuracy_score": 0.9366767179812728, |
|
"eval_f1": 0.6445131375579597, |
|
"eval_loss": 0.2310349941253662, |
|
"eval_precision": 0.600864553314121, |
|
"eval_recall": 0.695, |
|
"eval_runtime": 2.4876, |
|
"eval_samples_per_second": 128.637, |
|
"eval_steps_per_second": 16.08, |
|
"step": 600 |
|
}, |
|
{ |
|
"epoch": 11.43, |
|
"eval_accuracy_score": 0.9381050626884622, |
|
"eval_f1": 0.6501930501930501, |
|
"eval_loss": 0.22948996722698212, |
|
"eval_precision": 0.6057553956834533, |
|
"eval_recall": 0.7016666666666667, |
|
"eval_runtime": 2.4897, |
|
"eval_samples_per_second": 128.529, |
|
"eval_steps_per_second": 16.066, |
|
"step": 800 |
|
}, |
|
{ |
|
"epoch": 14.29, |
|
"learning_rate": 4.697986577181208e-05, |
|
"loss": 0.0722, |
|
"step": 1000 |
|
}, |
|
{ |
|
"epoch": 14.29, |
|
"eval_accuracy_score": 0.9406443421679098, |
|
"eval_f1": 0.6508313539192399, |
|
"eval_loss": 0.2520008981227875, |
|
"eval_precision": 0.6199095022624435, |
|
"eval_recall": 0.685, |
|
"eval_runtime": 2.4823, |
|
"eval_samples_per_second": 128.915, |
|
"eval_steps_per_second": 16.114, |
|
"step": 1000 |
|
}, |
|
{ |
|
"epoch": 17.14, |
|
"eval_accuracy_score": 0.9444532613870814, |
|
"eval_f1": 0.6714399363564041, |
|
"eval_loss": 0.25240662693977356, |
|
"eval_precision": 0.6423135464231354, |
|
"eval_recall": 0.7033333333333334, |
|
"eval_runtime": 2.482, |
|
"eval_samples_per_second": 128.93, |
|
"eval_steps_per_second": 16.116, |
|
"step": 1200 |
|
}, |
|
{ |
|
"epoch": 20.0, |
|
"eval_accuracy_score": 0.9408030471353753, |
|
"eval_f1": 0.6698039215686274, |
|
"eval_loss": 0.2890109419822693, |
|
"eval_precision": 0.6325925925925926, |
|
"eval_recall": 0.7116666666666667, |
|
"eval_runtime": 2.4863, |
|
"eval_samples_per_second": 128.707, |
|
"eval_steps_per_second": 16.088, |
|
"step": 1400 |
|
}, |
|
{ |
|
"epoch": 21.43, |
|
"learning_rate": 4.530201342281879e-05, |
|
"loss": 0.0227, |
|
"step": 1500 |
|
}, |
|
{ |
|
"epoch": 22.86, |
|
"eval_accuracy_score": 0.9430249166798921, |
|
"eval_f1": 0.6810897435897436, |
|
"eval_loss": 0.2938888967037201, |
|
"eval_precision": 0.6558641975308642, |
|
"eval_recall": 0.7083333333333334, |
|
"eval_runtime": 2.4899, |
|
"eval_samples_per_second": 128.52, |
|
"eval_steps_per_second": 16.065, |
|
"step": 1600 |
|
}, |
|
{ |
|
"epoch": 25.71, |
|
"eval_accuracy_score": 0.9404856372004444, |
|
"eval_f1": 0.665090622537431, |
|
"eval_loss": 0.30078476667404175, |
|
"eval_precision": 0.6307922272047832, |
|
"eval_recall": 0.7033333333333334, |
|
"eval_runtime": 2.4945, |
|
"eval_samples_per_second": 128.281, |
|
"eval_steps_per_second": 16.035, |
|
"step": 1800 |
|
}, |
|
{ |
|
"epoch": 28.57, |
|
"learning_rate": 4.36241610738255e-05, |
|
"loss": 0.0104, |
|
"step": 2000 |
|
}, |
|
{ |
|
"epoch": 28.57, |
|
"eval_accuracy_score": 0.9468338358990637, |
|
"eval_f1": 0.6836813611755608, |
|
"eval_loss": 0.2752661406993866, |
|
"eval_precision": 0.6378066378066378, |
|
"eval_recall": 0.7366666666666667, |
|
"eval_runtime": 2.6818, |
|
"eval_samples_per_second": 119.321, |
|
"eval_steps_per_second": 14.915, |
|
"step": 2000 |
|
}, |
|
{ |
|
"epoch": 31.43, |
|
"eval_accuracy_score": 0.9441358514521504, |
|
"eval_f1": 0.6817813765182186, |
|
"eval_loss": 0.32004353404045105, |
|
"eval_precision": 0.662992125984252, |
|
"eval_recall": 0.7016666666666667, |
|
"eval_runtime": 2.487, |
|
"eval_samples_per_second": 128.671, |
|
"eval_steps_per_second": 16.084, |
|
"step": 2200 |
|
}, |
|
{ |
|
"epoch": 34.29, |
|
"eval_accuracy_score": 0.9444532613870814, |
|
"eval_f1": 0.6868525896414344, |
|
"eval_loss": 0.32289382815361023, |
|
"eval_precision": 0.6580152671755726, |
|
"eval_recall": 0.7183333333333334, |
|
"eval_runtime": 2.4893, |
|
"eval_samples_per_second": 128.549, |
|
"eval_steps_per_second": 16.069, |
|
"step": 2400 |
|
}, |
|
{ |
|
"epoch": 35.71, |
|
"learning_rate": 4.194630872483222e-05, |
|
"loss": 0.0065, |
|
"step": 2500 |
|
}, |
|
{ |
|
"epoch": 37.14, |
|
"eval_accuracy_score": 0.9444532613870814, |
|
"eval_f1": 0.6874003189792663, |
|
"eval_loss": 0.324036180973053, |
|
"eval_precision": 0.6590214067278287, |
|
"eval_recall": 0.7183333333333334, |
|
"eval_runtime": 2.4838, |
|
"eval_samples_per_second": 128.837, |
|
"eval_steps_per_second": 16.105, |
|
"step": 2600 |
|
}, |
|
{ |
|
"epoch": 40.0, |
|
"eval_accuracy_score": 0.9427075067449611, |
|
"eval_f1": 0.669848846459825, |
|
"eval_loss": 0.3424355089664459, |
|
"eval_precision": 0.6407914764079148, |
|
"eval_recall": 0.7016666666666667, |
|
"eval_runtime": 2.489, |
|
"eval_samples_per_second": 128.566, |
|
"eval_steps_per_second": 16.071, |
|
"step": 2800 |
|
}, |
|
{ |
|
"epoch": 42.86, |
|
"learning_rate": 4.026845637583892e-05, |
|
"loss": 0.0042, |
|
"step": 3000 |
|
}, |
|
{ |
|
"epoch": 42.86, |
|
"eval_accuracy_score": 0.9442945564196159, |
|
"eval_f1": 0.6758064516129032, |
|
"eval_loss": 0.33911556005477905, |
|
"eval_precision": 0.6546875, |
|
"eval_recall": 0.6983333333333334, |
|
"eval_runtime": 2.478, |
|
"eval_samples_per_second": 129.136, |
|
"eval_steps_per_second": 16.142, |
|
"step": 3000 |
|
}, |
|
{ |
|
"epoch": 45.71, |
|
"eval_accuracy_score": 0.9457229011268052, |
|
"eval_f1": 0.6880877742946709, |
|
"eval_loss": 0.3264969289302826, |
|
"eval_precision": 0.6494082840236687, |
|
"eval_recall": 0.7316666666666667, |
|
"eval_runtime": 2.4815, |
|
"eval_samples_per_second": 128.956, |
|
"eval_steps_per_second": 16.119, |
|
"step": 3200 |
|
}, |
|
{ |
|
"epoch": 48.57, |
|
"eval_accuracy_score": 0.9422313918425647, |
|
"eval_f1": 0.6761904761904762, |
|
"eval_loss": 0.35728639364242554, |
|
"eval_precision": 0.6454545454545455, |
|
"eval_recall": 0.71, |
|
"eval_runtime": 2.4775, |
|
"eval_samples_per_second": 129.162, |
|
"eval_steps_per_second": 16.145, |
|
"step": 3400 |
|
}, |
|
{ |
|
"epoch": 50.0, |
|
"learning_rate": 3.859060402684564e-05, |
|
"loss": 0.0033, |
|
"step": 3500 |
|
}, |
|
{ |
|
"epoch": 51.43, |
|
"eval_accuracy_score": 0.9441358514521504, |
|
"eval_f1": 0.6907051282051282, |
|
"eval_loss": 0.35023757815361023, |
|
"eval_precision": 0.6651234567901234, |
|
"eval_recall": 0.7183333333333334, |
|
"eval_runtime": 2.477, |
|
"eval_samples_per_second": 129.186, |
|
"eval_steps_per_second": 16.148, |
|
"step": 3600 |
|
}, |
|
{ |
|
"epoch": 54.29, |
|
"eval_accuracy_score": 0.943977146484685, |
|
"eval_f1": 0.6825775656324582, |
|
"eval_loss": 0.3428173363208771, |
|
"eval_precision": 0.6529680365296804, |
|
"eval_recall": 0.715, |
|
"eval_runtime": 2.4863, |
|
"eval_samples_per_second": 128.705, |
|
"eval_steps_per_second": 16.088, |
|
"step": 3800 |
|
}, |
|
{ |
|
"epoch": 57.14, |
|
"learning_rate": 3.6912751677852356e-05, |
|
"loss": 0.0024, |
|
"step": 4000 |
|
}, |
|
{ |
|
"epoch": 57.14, |
|
"eval_accuracy_score": 0.9460403110617362, |
|
"eval_f1": 0.6930379746835443, |
|
"eval_loss": 0.33534663915634155, |
|
"eval_precision": 0.6596385542168675, |
|
"eval_recall": 0.73, |
|
"eval_runtime": 2.4857, |
|
"eval_samples_per_second": 128.737, |
|
"eval_steps_per_second": 16.092, |
|
"step": 4000 |
|
}, |
|
{ |
|
"epoch": 60.0, |
|
"eval_accuracy_score": 0.943659736549754, |
|
"eval_f1": 0.6714285714285714, |
|
"eval_loss": 0.3531126081943512, |
|
"eval_precision": 0.6409090909090909, |
|
"eval_recall": 0.705, |
|
"eval_runtime": 2.4736, |
|
"eval_samples_per_second": 129.364, |
|
"eval_steps_per_second": 16.171, |
|
"step": 4200 |
|
}, |
|
{ |
|
"epoch": 62.86, |
|
"eval_accuracy_score": 0.9458816060942707, |
|
"eval_f1": 0.695582329317269, |
|
"eval_loss": 0.36536940932273865, |
|
"eval_precision": 0.6713178294573643, |
|
"eval_recall": 0.7216666666666667, |
|
"eval_runtime": 2.4795, |
|
"eval_samples_per_second": 129.059, |
|
"eval_steps_per_second": 16.132, |
|
"step": 4400 |
|
}, |
|
{ |
|
"epoch": 64.29, |
|
"learning_rate": 3.523489932885906e-05, |
|
"loss": 0.0024, |
|
"step": 4500 |
|
}, |
|
{ |
|
"epoch": 65.71, |
|
"eval_accuracy_score": 0.9435010315822885, |
|
"eval_f1": 0.6821457165732587, |
|
"eval_loss": 0.3702266812324524, |
|
"eval_precision": 0.6563944530046225, |
|
"eval_recall": 0.71, |
|
"eval_runtime": 2.4782, |
|
"eval_samples_per_second": 129.126, |
|
"eval_steps_per_second": 16.141, |
|
"step": 4600 |
|
}, |
|
{ |
|
"epoch": 68.57, |
|
"eval_accuracy_score": 0.9425488017774957, |
|
"eval_f1": 0.6838709677419355, |
|
"eval_loss": 0.3876664936542511, |
|
"eval_precision": 0.6625, |
|
"eval_recall": 0.7066666666666667, |
|
"eval_runtime": 2.4834, |
|
"eval_samples_per_second": 128.858, |
|
"eval_steps_per_second": 16.107, |
|
"step": 4800 |
|
}, |
|
{ |
|
"epoch": 71.43, |
|
"learning_rate": 3.3557046979865775e-05, |
|
"loss": 0.0019, |
|
"step": 5000 |
|
}, |
|
{ |
|
"epoch": 71.43, |
|
"eval_accuracy_score": 0.9441358514521504, |
|
"eval_f1": 0.6751188589540411, |
|
"eval_loss": 0.35965150594711304, |
|
"eval_precision": 0.6435045317220544, |
|
"eval_recall": 0.71, |
|
"eval_runtime": 2.4894, |
|
"eval_samples_per_second": 128.547, |
|
"eval_steps_per_second": 16.068, |
|
"step": 5000 |
|
}, |
|
{ |
|
"epoch": 74.29, |
|
"eval_accuracy_score": 0.9422313918425647, |
|
"eval_f1": 0.6736334405144694, |
|
"eval_loss": 0.4093686044216156, |
|
"eval_precision": 0.6506211180124224, |
|
"eval_recall": 0.6983333333333334, |
|
"eval_runtime": 2.495, |
|
"eval_samples_per_second": 128.258, |
|
"eval_steps_per_second": 16.032, |
|
"step": 5200 |
|
}, |
|
{ |
|
"epoch": 77.14, |
|
"eval_accuracy_score": 0.9423900968100302, |
|
"eval_f1": 0.675098814229249, |
|
"eval_loss": 0.3733450174331665, |
|
"eval_precision": 0.6421052631578947, |
|
"eval_recall": 0.7116666666666667, |
|
"eval_runtime": 2.4781, |
|
"eval_samples_per_second": 129.13, |
|
"eval_steps_per_second": 16.141, |
|
"step": 5400 |
|
}, |
|
{ |
|
"epoch": 77.14, |
|
"step": 5400, |
|
"total_flos": 2.831337967640832e+16, |
|
"train_loss": 0.041913371869811304, |
|
"train_runtime": 4784.712, |
|
"train_samples_per_second": 100.32, |
|
"train_steps_per_second": 3.135 |
|
} |
|
], |
|
"max_steps": 15000, |
|
"num_train_epochs": 215, |
|
"total_flos": 2.831337967640832e+16, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|