{
  "epoch": 9.852216748768473,
  "eval_accuracy": 0.3451256113828368,
  "eval_loss": 3.7245092391967773,
  "eval_runtime": 6.0968,
  "eval_samples": 44,
  "eval_samples_per_second": 7.217,
  "eval_steps_per_second": 7.217,
  "perplexity": 41.4508852826151,
  "total_flos": 3.70944044433408e+17,
  "train_loss": 4.3953623046875,
  "train_runtime": 3726.3159,
  "train_samples": 812,
  "train_samples_per_second": 2.179,
  "train_steps_per_second": 0.134
}