{ | |
"epoch": 2.98, | |
"eval_accuracy": 0.7246660149885956, | |
"eval_loss": 1.3612703084945679, | |
"eval_runtime": 4.7367, | |
"eval_samples": 12, | |
"eval_samples_per_second": 2.533, | |
"eval_steps_per_second": 0.422, | |
"perplexity": 3.901145814186261, | |
"total_flos": 4887048754298880.0, | |
"train_loss": 0.6763701610076122, | |
"train_runtime": 1261.3832, | |
"train_samples": 262, | |
"train_samples_per_second": 0.623, | |
"train_steps_per_second": 0.155 | |
} |