Md Mushfiqur Rahman
Upload with huggingface_hub
55590ed
{
"best_metric": 0.5146198830409356,
"best_model_checkpoint": "/scratch/mrahma45/pixel/finetuned_models/canine/canine-base-finetuned-masakhaner-yor/checkpoint-2000",
"epoch": 44.11764705882353,
"global_step": 3000,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 2.94,
"eval_accuracy_score": 0.918060435699227,
"eval_f1": 0.29637305699481864,
"eval_loss": 0.27648022770881653,
"eval_precision": 0.23636363636363636,
"eval_recall": 0.3972222222222222,
"eval_runtime": 2.3819,
"eval_samples_per_second": 128.049,
"eval_steps_per_second": 16.373,
"step": 200
},
{
"epoch": 5.88,
"eval_accuracy_score": 0.9343640196767393,
"eval_f1": 0.407185628742515,
"eval_loss": 0.21811498701572418,
"eval_precision": 0.35789473684210527,
"eval_recall": 0.4722222222222222,
"eval_runtime": 2.3801,
"eval_samples_per_second": 128.145,
"eval_steps_per_second": 16.386,
"step": 400
},
{
"epoch": 7.35,
"learning_rate": 4.865771812080537e-05,
"loss": 0.3062,
"step": 500
},
{
"epoch": 8.82,
"eval_accuracy_score": 0.9374560787069571,
"eval_f1": 0.42857142857142855,
"eval_loss": 0.22281676530838013,
"eval_precision": 0.3620689655172414,
"eval_recall": 0.525,
"eval_runtime": 2.3751,
"eval_samples_per_second": 128.418,
"eval_steps_per_second": 16.421,
"step": 600
},
{
"epoch": 11.76,
"eval_accuracy_score": 0.9422347153900211,
"eval_f1": 0.48,
"eval_loss": 0.22548547387123108,
"eval_precision": 0.4163265306122449,
"eval_recall": 0.5666666666666667,
"eval_runtime": 2.3756,
"eval_samples_per_second": 128.388,
"eval_steps_per_second": 16.417,
"step": 800
},
{
"epoch": 14.71,
"learning_rate": 4.697986577181208e-05,
"loss": 0.0666,
"step": 1000
},
{
"epoch": 14.71,
"eval_accuracy_score": 0.9457484188334505,
"eval_f1": 0.5048076923076923,
"eval_loss": 0.2493690848350525,
"eval_precision": 0.4449152542372881,
"eval_recall": 0.5833333333333334,
"eval_runtime": 2.3673,
"eval_samples_per_second": 128.84,
"eval_steps_per_second": 16.475,
"step": 1000
},
{
"epoch": 17.65,
"eval_accuracy_score": 0.9447645818692902,
"eval_f1": 0.49325153374233127,
"eval_loss": 0.2621992826461792,
"eval_precision": 0.44175824175824174,
"eval_recall": 0.5583333333333333,
"eval_runtime": 2.3771,
"eval_samples_per_second": 128.306,
"eval_steps_per_second": 16.406,
"step": 1200
},
{
"epoch": 20.59,
"eval_accuracy_score": 0.9436401967673929,
"eval_f1": 0.5073891625615763,
"eval_loss": 0.2808593511581421,
"eval_precision": 0.4557522123893805,
"eval_recall": 0.5722222222222222,
"eval_runtime": 2.3795,
"eval_samples_per_second": 128.177,
"eval_steps_per_second": 16.39,
"step": 1400
},
{
"epoch": 22.06,
"learning_rate": 4.530201342281879e-05,
"loss": 0.0187,
"step": 1500
},
{
"epoch": 23.53,
"eval_accuracy_score": 0.9425158116654955,
"eval_f1": 0.4976190476190476,
"eval_loss": 0.3069038391113281,
"eval_precision": 0.4354166666666667,
"eval_recall": 0.5805555555555556,
"eval_runtime": 2.3752,
"eval_samples_per_second": 128.408,
"eval_steps_per_second": 16.419,
"step": 1600
},
{
"epoch": 26.47,
"eval_accuracy_score": 0.9429374560787069,
"eval_f1": 0.4959443800695249,
"eval_loss": 0.2936417758464813,
"eval_precision": 0.4254473161033797,
"eval_recall": 0.5944444444444444,
"eval_runtime": 2.3751,
"eval_samples_per_second": 128.415,
"eval_steps_per_second": 16.42,
"step": 1800
},
{
"epoch": 29.41,
"learning_rate": 4.36241610738255e-05,
"loss": 0.0071,
"step": 2000
},
{
"epoch": 29.41,
"eval_accuracy_score": 0.9432185523541813,
"eval_f1": 0.5146198830409356,
"eval_loss": 0.3124857544898987,
"eval_precision": 0.4444444444444444,
"eval_recall": 0.6111111111111112,
"eval_runtime": 2.3658,
"eval_samples_per_second": 128.919,
"eval_steps_per_second": 16.485,
"step": 2000
},
{
"epoch": 32.35,
"eval_accuracy_score": 0.9450456781447646,
"eval_f1": 0.49709639953542395,
"eval_loss": 0.3202134370803833,
"eval_precision": 0.42714570858283435,
"eval_recall": 0.5944444444444444,
"eval_runtime": 2.3712,
"eval_samples_per_second": 128.625,
"eval_steps_per_second": 16.447,
"step": 2200
},
{
"epoch": 35.29,
"eval_accuracy_score": 0.9444834855938159,
"eval_f1": 0.49446494464944646,
"eval_loss": 0.3432020843029022,
"eval_precision": 0.44370860927152317,
"eval_recall": 0.5583333333333333,
"eval_runtime": 2.372,
"eval_samples_per_second": 128.582,
"eval_steps_per_second": 16.442,
"step": 2400
},
{
"epoch": 36.76,
"learning_rate": 4.194630872483222e-05,
"loss": 0.0045,
"step": 2500
},
{
"epoch": 38.24,
"eval_accuracy_score": 0.946170063246662,
"eval_f1": 0.5048543689320388,
"eval_loss": 0.33581680059432983,
"eval_precision": 0.4482758620689655,
"eval_recall": 0.5777777777777777,
"eval_runtime": 2.3711,
"eval_samples_per_second": 128.633,
"eval_steps_per_second": 16.448,
"step": 2600
},
{
"epoch": 41.18,
"eval_accuracy_score": 0.9467322557976107,
"eval_f1": 0.5108433734939758,
"eval_loss": 0.3493315279483795,
"eval_precision": 0.451063829787234,
"eval_recall": 0.5888888888888889,
"eval_runtime": 2.3774,
"eval_samples_per_second": 128.29,
"eval_steps_per_second": 16.404,
"step": 2800
},
{
"epoch": 44.12,
"learning_rate": 4.026845637583892e-05,
"loss": 0.0024,
"step": 3000
},
{
"epoch": 44.12,
"eval_accuracy_score": 0.9456078706957133,
"eval_f1": 0.5047393364928909,
"eval_loss": 0.3553647994995117,
"eval_precision": 0.44008264462809915,
"eval_recall": 0.5916666666666667,
"eval_runtime": 2.3665,
"eval_samples_per_second": 128.88,
"eval_steps_per_second": 16.48,
"step": 3000
},
{
"epoch": 44.12,
"step": 3000,
"total_flos": 1.572865183079424e+16,
"train_loss": 0.06757608306407928,
"train_runtime": 1505.3266,
"train_samples_per_second": 318.868,
"train_steps_per_second": 9.965
}
],
"max_steps": 15000,
"num_train_epochs": 221,
"total_flos": 1.572865183079424e+16,
"trial_name": null,
"trial_params": null
}