PT-UP-mBERT-FalseTrue-0_1_BEST / trainer_state.json
Harish Tayyar Madabushi
added model
2178d2e
{
"best_metric": 0.6961807093052775,
"best_model_checkpoint": "OUTPUT/bert-base-multilingual-cased/FalseTrue-0/1/checkpoint-259",
"epoch": 7.0,
"global_step": 259,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 1.0,
"eval_accuracy": 0.6739926934242249,
"eval_f1": 0.6497000267492071,
"eval_loss": 0.7328909635543823,
"eval_runtime": 0.8296,
"eval_samples_per_second": 329.057,
"eval_steps_per_second": 42.187,
"step": 37
},
{
"epoch": 2.0,
"eval_accuracy": 0.6556776762008667,
"eval_f1": 0.6136253516088647,
"eval_loss": 1.3869595527648926,
"eval_runtime": 0.8297,
"eval_samples_per_second": 329.048,
"eval_steps_per_second": 42.186,
"step": 74
},
{
"epoch": 3.0,
"eval_accuracy": 0.6739926934242249,
"eval_f1": 0.6567661423596487,
"eval_loss": 1.3877439498901367,
"eval_runtime": 0.8294,
"eval_samples_per_second": 329.156,
"eval_steps_per_second": 42.199,
"step": 111
},
{
"epoch": 4.0,
"eval_accuracy": 0.6703296899795532,
"eval_f1": 0.6620879120879122,
"eval_loss": 1.5405205488204956,
"eval_runtime": 0.8255,
"eval_samples_per_second": 330.712,
"eval_steps_per_second": 42.399,
"step": 148
},
{
"epoch": 5.0,
"eval_accuracy": 0.6996337175369263,
"eval_f1": 0.680666672762239,
"eval_loss": 1.6668964624404907,
"eval_runtime": 0.8301,
"eval_samples_per_second": 328.874,
"eval_steps_per_second": 42.163,
"step": 185
},
{
"epoch": 6.0,
"eval_accuracy": 0.6959707140922546,
"eval_f1": 0.683264100001968,
"eval_loss": 1.7306524515151978,
"eval_runtime": 0.829,
"eval_samples_per_second": 329.311,
"eval_steps_per_second": 42.219,
"step": 222
},
{
"epoch": 7.0,
"eval_accuracy": 0.7069597244262695,
"eval_f1": 0.6961807093052775,
"eval_loss": 1.8631714582443237,
"eval_runtime": 0.8263,
"eval_samples_per_second": 330.372,
"eval_steps_per_second": 42.355,
"step": 259
}
],
"max_steps": 333,
"num_train_epochs": 9,
"total_flos": 1112956693051392.0,
"trial_name": null,
"trial_params": null
}