{
  "epoch": 0.9999786256278722,
  "eval_accuracy": 0.1880817456440319,
  "eval_loss": 5.653779983520508,
  "eval_runtime": 112.4797,
  "eval_samples": 300,
  "eval_samples_per_second": 2.667,
  "eval_steps_per_second": 1.334,
  "num_input_tokens_seen": 766509056,
  "perplexity": 285.3681164586281,
  "total_flos": 4.708536848052388e+17,
  "train_loss": 5.594264277028972,
  "train_runtime": 134120.2101,
  "train_samples": 374280,
  "train_samples_per_second": 2.791,
  "train_steps_per_second": 0.044
}