HueyNemud
model data
359d820
{
"best_metric": 0.9595484477892756,
"best_model_checkpoint": "/content/drive/MyDrive/SODUCO/article_das_2022/43-camembert_pretrained_finetuned_pero/checkpoint-1500",
"epoch": 3.9893617021276597,
"global_step": 1500,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.27,
"eval_accuracy": 0.9711394302848576,
"eval_f1": 0.9418582912693962,
"eval_loss": 0.24740596115589142,
"eval_precision": 0.9343471810089021,
"eval_recall": 0.9494911421032793,
"eval_runtime": 2.7876,
"eval_samples_per_second": 239.631,
"eval_steps_per_second": 15.067,
"step": 100
},
{
"epoch": 0.53,
"eval_accuracy": 0.9741379310344828,
"eval_f1": 0.950751879699248,
"eval_loss": 0.15050481259822845,
"eval_precision": 0.9482564679415073,
"eval_recall": 0.9532604598567659,
"eval_runtime": 2.5926,
"eval_samples_per_second": 257.656,
"eval_steps_per_second": 16.2,
"step": 200
},
{
"epoch": 0.8,
"eval_accuracy": 0.9730134932533733,
"eval_f1": 0.9475262368815591,
"eval_loss": 0.12827223539352417,
"eval_precision": 0.9422288483041371,
"eval_recall": 0.9528835280814173,
"eval_runtime": 2.73,
"eval_samples_per_second": 244.686,
"eval_steps_per_second": 15.384,
"step": 300
},
{
"epoch": 1.06,
"eval_accuracy": 0.9710144927536232,
"eval_f1": 0.9431689875799775,
"eval_loss": 0.1230660155415535,
"eval_precision": 0.9417512213453589,
"eval_recall": 0.9445910290237467,
"eval_runtime": 2.7678,
"eval_samples_per_second": 241.348,
"eval_steps_per_second": 15.175,
"step": 400
},
{
"epoch": 1.33,
"learning_rate": 9e-05,
"loss": 0.2505,
"step": 500
},
{
"epoch": 1.33,
"eval_accuracy": 0.9786356821589205,
"eval_f1": 0.9521306551529942,
"eval_loss": 0.08949972689151764,
"eval_precision": 0.9483919222139118,
"eval_recall": 0.9558989822842066,
"eval_runtime": 2.9407,
"eval_samples_per_second": 227.154,
"eval_steps_per_second": 14.282,
"step": 500
},
{
"epoch": 1.6,
"eval_accuracy": 0.9768865567216392,
"eval_f1": 0.9537420082737871,
"eval_loss": 0.09133146703243256,
"eval_precision": 0.951594746716698,
"eval_recall": 0.9558989822842066,
"eval_runtime": 2.8849,
"eval_samples_per_second": 231.55,
"eval_steps_per_second": 14.559,
"step": 600
},
{
"epoch": 1.86,
"eval_accuracy": 0.9765117441279361,
"eval_f1": 0.9579800263802524,
"eval_loss": 0.09044157713651657,
"eval_precision": 0.9577995478522984,
"eval_recall": 0.9581605729362985,
"eval_runtime": 2.8752,
"eval_samples_per_second": 232.332,
"eval_steps_per_second": 14.608,
"step": 700
},
{
"epoch": 2.13,
"eval_accuracy": 0.9801349325337332,
"eval_f1": 0.9586621570838031,
"eval_loss": 0.07938132435083389,
"eval_precision": 0.9557886849007119,
"eval_recall": 0.9615529589144365,
"eval_runtime": 2.8692,
"eval_samples_per_second": 232.816,
"eval_steps_per_second": 14.638,
"step": 800
},
{
"epoch": 2.39,
"eval_accuracy": 0.9771364317841079,
"eval_f1": 0.9548872180451128,
"eval_loss": 0.09603337943553925,
"eval_precision": 0.9523809523809523,
"eval_recall": 0.9574067093856012,
"eval_runtime": 2.8538,
"eval_samples_per_second": 234.072,
"eval_steps_per_second": 14.717,
"step": 900
},
{
"epoch": 2.66,
"learning_rate": 8e-05,
"loss": 0.0748,
"step": 1000
},
{
"epoch": 2.66,
"eval_accuracy": 0.9761369315342329,
"eval_f1": 0.9575871819038644,
"eval_loss": 0.09003584831953049,
"eval_precision": 0.9577677224736049,
"eval_recall": 0.9574067093856012,
"eval_runtime": 2.9061,
"eval_samples_per_second": 229.858,
"eval_steps_per_second": 14.452,
"step": 1000
},
{
"epoch": 2.93,
"eval_accuracy": 0.9730134932533733,
"eval_f1": 0.954383330204618,
"eval_loss": 0.10545289516448975,
"eval_precision": 0.9506357516828721,
"eval_recall": 0.9581605729362985,
"eval_runtime": 2.9384,
"eval_samples_per_second": 227.334,
"eval_steps_per_second": 14.293,
"step": 1100
},
{
"epoch": 3.19,
"eval_accuracy": 0.9761369315342329,
"eval_f1": 0.9593220338983051,
"eval_loss": 0.099028080701828,
"eval_precision": 0.9585999247271358,
"eval_recall": 0.9600452318130418,
"eval_runtime": 3.0033,
"eval_samples_per_second": 222.419,
"eval_steps_per_second": 13.984,
"step": 1200
},
{
"epoch": 3.46,
"eval_accuracy": 0.9752623688155923,
"eval_f1": 0.9561782960315968,
"eval_loss": 0.09300831705331802,
"eval_precision": 0.9542042042042042,
"eval_recall": 0.9581605729362985,
"eval_runtime": 2.8431,
"eval_samples_per_second": 234.956,
"eval_steps_per_second": 14.773,
"step": 1300
},
{
"epoch": 3.72,
"eval_accuracy": 0.9775112443778111,
"eval_f1": 0.9578471960858111,
"eval_loss": 0.0967017412185669,
"eval_precision": 0.9564073656520106,
"eval_recall": 0.9592913682623445,
"eval_runtime": 2.8669,
"eval_samples_per_second": 233.003,
"eval_steps_per_second": 14.65,
"step": 1400
},
{
"epoch": 3.99,
"learning_rate": 7e-05,
"loss": 0.0497,
"step": 1500
},
{
"epoch": 3.99,
"eval_accuracy": 0.9776361819090454,
"eval_f1": 0.9595484477892756,
"eval_loss": 0.0839652568101883,
"eval_precision": 0.9579263711495116,
"eval_recall": 0.9611760271390878,
"eval_runtime": 2.8628,
"eval_samples_per_second": 233.335,
"eval_steps_per_second": 14.671,
"step": 1500
}
],
"max_steps": 5000,
"num_train_epochs": 14,
"total_flos": 592464605771736.0,
"trial_name": null,
"trial_params": null
}