{ "epoch": 5.0, "eval_loss": 1.1778761148452759, "eval_mem_cpu_alloc_delta": 89380, "eval_mem_cpu_peaked_delta": 18278, "eval_mem_gpu_alloc_delta": 0, "eval_mem_gpu_peaked_delta": 471300608, "eval_runtime": 1.5089, "eval_samples": 18, "eval_samples_per_second": 11.929, "init_mem_cpu_alloc_delta": 10338468, "init_mem_cpu_peaked_delta": 18306, "init_mem_gpu_alloc_delta": 334744576, "init_mem_gpu_peaked_delta": 0, "perplexity": 3.247469620697528, "train_mem_cpu_alloc_delta": 1179270, "train_mem_cpu_peaked_delta": 576384, "train_mem_gpu_alloc_delta": 987446784, "train_mem_gpu_peaked_delta": 2037095424, "train_runtime": 145.1649, "train_samples": 160, "train_samples_per_second": 5.511 }