{
  "epoch": 0.0067933301849093615,
  "eval_accuracy": 0.09167533902983765,
  "eval_loss": 8.9140625,
  "eval_runtime": 492.4035,
  "eval_samples": 33767,
  "eval_samples_per_second": 68.576,
  "eval_steps_per_second": 2.857,
  "perplexity": 7435.807790500043,
  "total_flos": 1043124562427904.0,
  "train_loss": 9.606408756684491,
  "train_runtime": 94484.0244,
  "train_samples": 660643,
  "train_samples_per_second": 699.211,
  "train_steps_per_second": 29.134
}