{ | |
"epoch": 20.0, | |
"eval_accuracy": 0.560974358974359, | |
"eval_loss": 2.2417104244232178, | |
"eval_runtime": 5.9255, | |
"eval_samples": 500, | |
"eval_samples_per_second": 84.381, | |
"eval_steps_per_second": 10.632, | |
"perplexity": 9.409411618867681, | |
"total_flos": 6.517631969856061e+17, | |
"train_loss": 0.6977483630405708, | |
"train_runtime": 24342.3236, | |
"train_samples": 16925, | |
"train_samples_per_second": 13.906, | |
"train_steps_per_second": 0.435 | |
} |