|
{ |
|
"best_metric": null, |
|
"best_model_checkpoint": null, |
|
"epoch": 5.0, |
|
"eval_steps": 500, |
|
"global_step": 405, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 1.0, |
|
"eval_B": { |
|
"f1-score": 0.8087666523420713, |
|
"precision": 0.8189730200174065, |
|
"recall": 0.7988115449915111, |
|
"support": 1178.0 |
|
}, |
|
"eval_I": { |
|
"f1-score": 0.9374597034171502, |
|
"precision": 0.9521418826739427, |
|
"recall": 0.9232234509762421, |
|
"support": 18899.0 |
|
}, |
|
"eval_O": { |
|
"f1-score": 0.8881362400419788, |
|
"precision": 0.863303347862376, |
|
"recall": 0.9144400785854617, |
|
"support": 10180.0 |
|
}, |
|
"eval_accuracy": 0.9154245298608586, |
|
"eval_loss": 0.2228638380765915, |
|
"eval_macro avg": { |
|
"f1-score": 0.8781208652670669, |
|
"precision": 0.8781394168512416, |
|
"recall": 0.8788250248510717, |
|
"support": 30257.0 |
|
}, |
|
"eval_runtime": 4.7167, |
|
"eval_samples_per_second": 17.173, |
|
"eval_steps_per_second": 2.332, |
|
"eval_weighted avg": { |
|
"f1-score": 0.9158543469268937, |
|
"precision": 0.9170673807540184, |
|
"recall": 0.9154245298608586, |
|
"support": 30257.0 |
|
}, |
|
"step": 81 |
|
}, |
|
{ |
|
"epoch": 2.0, |
|
"eval_B": { |
|
"f1-score": 0.8401515151515152, |
|
"precision": 0.7585499316005472, |
|
"recall": 0.9414261460101867, |
|
"support": 1178.0 |
|
}, |
|
"eval_I": { |
|
"f1-score": 0.9568235603470944, |
|
"precision": 0.9510219016256338, |
|
"recall": 0.9626964389650247, |
|
"support": 18899.0 |
|
}, |
|
"eval_O": { |
|
"f1-score": 0.9185648054827655, |
|
"precision": 0.9430877483443708, |
|
"recall": 0.8952848722986247, |
|
"support": 10180.0 |
|
}, |
|
"eval_accuracy": 0.9391876260038999, |
|
"eval_loss": 0.16692574322223663, |
|
"eval_macro avg": { |
|
"f1-score": 0.905179960327125, |
|
"precision": 0.8842198605235172, |
|
"recall": 0.9331358190912787, |
|
"support": 30257.0 |
|
}, |
|
"eval_runtime": 4.7116, |
|
"eval_samples_per_second": 17.192, |
|
"eval_steps_per_second": 2.335, |
|
"eval_weighted avg": { |
|
"f1-score": 0.9394089523635119, |
|
"precision": 0.9408589092241132, |
|
"recall": 0.9391876260038999, |
|
"support": 30257.0 |
|
}, |
|
"step": 162 |
|
}, |
|
{ |
|
"epoch": 3.0, |
|
"eval_B": { |
|
"f1-score": 0.8612244897959184, |
|
"precision": 0.8294025157232704, |
|
"recall": 0.8955857385398981, |
|
"support": 1178.0 |
|
}, |
|
"eval_I": { |
|
"f1-score": 0.951106371634231, |
|
"precision": 0.9584654236741712, |
|
"recall": 0.9438594634636753, |
|
"support": 18899.0 |
|
}, |
|
"eval_O": { |
|
"f1-score": 0.9106743212999903, |
|
"precision": 0.9021592442645074, |
|
"recall": 0.9193516699410609, |
|
"support": 10180.0 |
|
}, |
|
"eval_accuracy": 0.9337343424662061, |
|
"eval_loss": 0.1742253601551056, |
|
"eval_macro avg": { |
|
"f1-score": 0.9076683942433799, |
|
"precision": 0.8966757278873163, |
|
"recall": 0.9195989573148781, |
|
"support": 30257.0 |
|
}, |
|
"eval_runtime": 4.7094, |
|
"eval_samples_per_second": 17.2, |
|
"eval_steps_per_second": 2.336, |
|
"eval_weighted avg": { |
|
"f1-score": 0.9340035812317422, |
|
"precision": 0.9344963252190521, |
|
"recall": 0.9337343424662061, |
|
"support": 30257.0 |
|
}, |
|
"step": 243 |
|
}, |
|
{ |
|
"epoch": 4.0, |
|
"eval_B": { |
|
"f1-score": 0.8717948717948719, |
|
"precision": 0.8254931714719271, |
|
"recall": 0.9235993208828522, |
|
"support": 1178.0 |
|
}, |
|
"eval_I": { |
|
"f1-score": 0.9561271586371415, |
|
"precision": 0.9374586871408959, |
|
"recall": 0.9755542621302714, |
|
"support": 18899.0 |
|
}, |
|
"eval_O": { |
|
"f1-score": 0.9117828500925355, |
|
"precision": 0.956427955133736, |
|
"recall": 0.8711198428290766, |
|
"support": 10180.0 |
|
}, |
|
"eval_accuracy": 0.9383944211256899, |
|
"eval_loss": 0.18792153894901276, |
|
"eval_macro avg": { |
|
"f1-score": 0.9132349601748496, |
|
"precision": 0.9064599379155197, |
|
"recall": 0.9234244752807333, |
|
"support": 30257.0 |
|
}, |
|
"eval_runtime": 4.7342, |
|
"eval_samples_per_second": 17.11, |
|
"eval_steps_per_second": 2.324, |
|
"eval_weighted avg": { |
|
"f1-score": 0.9379241479327001, |
|
"precision": 0.9394817486046585, |
|
"recall": 0.9383944211256899, |
|
"support": 30257.0 |
|
}, |
|
"step": 324 |
|
}, |
|
{ |
|
"epoch": 5.0, |
|
"eval_B": { |
|
"f1-score": 0.8742949234488315, |
|
"precision": 0.8320552147239264, |
|
"recall": 0.9210526315789473, |
|
"support": 1178.0 |
|
}, |
|
"eval_I": { |
|
"f1-score": 0.9583957528450158, |
|
"precision": 0.9521148825065274, |
|
"recall": 0.9647600402137679, |
|
"support": 18899.0 |
|
}, |
|
"eval_O": { |
|
"f1-score": 0.9198818996146724, |
|
"precision": 0.9375701315923697, |
|
"recall": 0.9028487229862475, |
|
"support": 10180.0 |
|
}, |
|
"eval_accuracy": 0.9422282447037049, |
|
"eval_loss": 0.19990424811840057, |
|
"eval_macro avg": { |
|
"f1-score": 0.9175241919695066, |
|
"precision": 0.9072467429409411, |
|
"recall": 0.9295537982596542, |
|
"support": 30257.0 |
|
}, |
|
"eval_runtime": 4.7101, |
|
"eval_samples_per_second": 17.197, |
|
"eval_steps_per_second": 2.335, |
|
"eval_weighted avg": { |
|
"f1-score": 0.9421634164298524, |
|
"precision": 0.9425469857238316, |
|
"recall": 0.9422282447037049, |
|
"support": 30257.0 |
|
}, |
|
"step": 405 |
|
} |
|
], |
|
"logging_steps": 500, |
|
"max_steps": 4050, |
|
"num_input_tokens_seen": 0, |
|
"num_train_epochs": 50, |
|
"save_steps": 500, |
|
"total_flos": 716700551679000.0, |
|
"train_batch_size": 4, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|