|
{
|
|
"best_params": {
|
|
"epochs": 2,
|
|
"batch_size": 32,
|
|
"warmup_steps": 0,
|
|
"weight_decay": 0.01
|
|
},
|
|
"all_results": [
|
|
{
|
|
"params": {
|
|
"epochs": 2,
|
|
"batch_size": 32,
|
|
"warmup_steps": 0,
|
|
"weight_decay": 0.01
|
|
},
|
|
"eval_result": {
|
|
"eval_loss": 0.31092265248298645,
|
|
"eval_accuracy": 0.89128,
|
|
"eval_f1": 0.8922112944162437,
|
|
"eval_precision": 0.884633532557408,
|
|
"eval_recall": 0.89992,
|
|
"eval_runtime": 32.9216,
|
|
"eval_samples_per_second": 759.379,
|
|
"eval_steps_per_second": 23.753,
|
|
"epoch": 2.0
|
|
}
|
|
},
|
|
{
|
|
"params": {
|
|
"epochs": 2,
|
|
"batch_size": 16,
|
|
"warmup_steps": 100,
|
|
"weight_decay": 0.01
|
|
},
|
|
"eval_result": {
|
|
"eval_loss": 0.3510156273841858,
|
|
"eval_accuracy": 0.8912,
|
|
"eval_f1": 0.8914431673052363,
|
|
"eval_precision": 0.8894552405224594,
|
|
"eval_recall": 0.89344,
|
|
"eval_runtime": 34.3301,
|
|
"eval_samples_per_second": 728.223,
|
|
"eval_steps_per_second": 45.529,
|
|
"epoch": 2.0
|
|
}
|
|
},
|
|
{
|
|
"params": {
|
|
"epochs": 2,
|
|
"batch_size": 16,
|
|
"warmup_steps": 100,
|
|
"weight_decay": 0.01
|
|
},
|
|
"eval_result": {
|
|
"eval_loss": 0.3510156273841858,
|
|
"eval_accuracy": 0.8912,
|
|
"eval_f1": 0.8914431673052363,
|
|
"eval_precision": 0.8894552405224594,
|
|
"eval_recall": 0.89344,
|
|
"eval_runtime": 34.4751,
|
|
"eval_samples_per_second": 725.161,
|
|
"eval_steps_per_second": 45.337,
|
|
"epoch": 2.0
|
|
}
|
|
},
|
|
{
|
|
"params": {
|
|
"epochs": 2,
|
|
"batch_size": 16,
|
|
"warmup_steps": 100,
|
|
"weight_decay": 0.01
|
|
},
|
|
"eval_result": {
|
|
"eval_loss": 0.3510156273841858,
|
|
"eval_accuracy": 0.8912,
|
|
"eval_f1": 0.8914431673052363,
|
|
"eval_precision": 0.8894552405224594,
|
|
"eval_recall": 0.89344,
|
|
"eval_runtime": 34.5714,
|
|
"eval_samples_per_second": 723.14,
|
|
"eval_steps_per_second": 45.211,
|
|
"epoch": 2.0
|
|
}
|
|
},
|
|
{
|
|
"params": {
|
|
"epochs": 2,
|
|
"batch_size": 16,
|
|
"warmup_steps": 100,
|
|
"weight_decay": 0.01
|
|
},
|
|
"eval_result": {
|
|
"eval_loss": 0.3510156273841858,
|
|
"eval_accuracy": 0.8912,
|
|
"eval_f1": 0.8914431673052363,
|
|
"eval_precision": 0.8894552405224594,
|
|
"eval_recall": 0.89344,
|
|
"eval_runtime": 34.3958,
|
|
"eval_samples_per_second": 726.832,
|
|
"eval_steps_per_second": 45.442,
|
|
"epoch": 2.0
|
|
}
|
|
},
|
|
{
|
|
"params": {
|
|
"epochs": 2,
|
|
"batch_size": 16,
|
|
"warmup_steps": 100,
|
|
"weight_decay": 0.01
|
|
},
|
|
"eval_result": {
|
|
"eval_loss": 0.3510156273841858,
|
|
"eval_accuracy": 0.8912,
|
|
"eval_f1": 0.8914431673052363,
|
|
"eval_precision": 0.8894552405224594,
|
|
"eval_recall": 0.89344,
|
|
"eval_runtime": 34.3952,
|
|
"eval_samples_per_second": 726.845,
|
|
"eval_steps_per_second": 45.442,
|
|
"epoch": 2.0
|
|
}
|
|
},
|
|
{
|
|
"params": {
|
|
"epochs": 2,
|
|
"batch_size": 16,
|
|
"warmup_steps": 100,
|
|
"weight_decay": 0.01
|
|
},
|
|
"eval_result": {
|
|
"eval_loss": 0.3510156273841858,
|
|
"eval_accuracy": 0.8912,
|
|
"eval_f1": 0.8914431673052363,
|
|
"eval_precision": 0.8894552405224594,
|
|
"eval_recall": 0.89344,
|
|
"eval_runtime": 34.5864,
|
|
"eval_samples_per_second": 722.827,
|
|
"eval_steps_per_second": 45.191,
|
|
"epoch": 2.0
|
|
}
|
|
},
|
|
{
|
|
"params": {
|
|
"epochs": 2,
|
|
"batch_size": 16,
|
|
"warmup_steps": 100,
|
|
"weight_decay": 0.01
|
|
},
|
|
"eval_result": {
|
|
"eval_loss": 0.3510156273841858,
|
|
"eval_accuracy": 0.8912,
|
|
"eval_f1": 0.8914431673052363,
|
|
"eval_precision": 0.8894552405224594,
|
|
"eval_recall": 0.89344,
|
|
"eval_runtime": 34.4644,
|
|
"eval_samples_per_second": 725.386,
|
|
"eval_steps_per_second": 45.351,
|
|
"epoch": 2.0
|
|
}
|
|
},
|
|
{
|
|
"params": {
|
|
"epochs": 2,
|
|
"batch_size": 16,
|
|
"warmup_steps": 100,
|
|
"weight_decay": 0.01
|
|
},
|
|
"eval_result": {
|
|
"eval_loss": 0.3510156273841858,
|
|
"eval_accuracy": 0.8912,
|
|
"eval_f1": 0.8914431673052363,
|
|
"eval_precision": 0.8894552405224594,
|
|
"eval_recall": 0.89344,
|
|
"eval_runtime": 34.5881,
|
|
"eval_samples_per_second": 722.792,
|
|
"eval_steps_per_second": 45.189,
|
|
"epoch": 2.0
|
|
}
|
|
},
|
|
{
|
|
"params": {
|
|
"epochs": 2,
|
|
"batch_size": 16,
|
|
"warmup_steps": 100,
|
|
"weight_decay": 0.01
|
|
},
|
|
"eval_result": {
|
|
"eval_loss": 0.3510156273841858,
|
|
"eval_accuracy": 0.8912,
|
|
"eval_f1": 0.8914431673052363,
|
|
"eval_precision": 0.8894552405224594,
|
|
"eval_recall": 0.89344,
|
|
"eval_runtime": 34.3332,
|
|
"eval_samples_per_second": 728.157,
|
|
"eval_steps_per_second": 45.524,
|
|
"epoch": 2.0
|
|
}
|
|
}
|
|
]
|
|
} |