{ "before_init_mem_cpu": 699817984, "before_init_mem_gpu": 0, "epoch": 5.98, "eval_accuracy": 0.544073054441718, "eval_loss": 1.9982993602752686, "eval_mem_cpu_alloc_delta": 9977856, "eval_mem_cpu_peaked_delta": 60305408, "eval_mem_gpu_alloc_delta": 0, "eval_mem_gpu_peaked_delta": 2357757952, "eval_runtime": 481.5484, "eval_samples": 588, "eval_samples_per_second": 1.221, "eval_steps_per_second": 0.305, "init_mem_cpu_alloc_delta": -283938816, "init_mem_cpu_peaked_delta": 332918784, "init_mem_gpu_alloc_delta": 334744576, "init_mem_gpu_peaked_delta": 0, "perplexity": 7.376500655769286, "train_loss": 2.0183091745143984, "train_mem_cpu_alloc_delta": 1155149824, "train_mem_cpu_peaked_delta": 308719616, "train_mem_gpu_alloc_delta": 988995584, "train_mem_gpu_peaked_delta": 4500811776, "train_runtime": 35067.5673, "train_samples": 5325, "train_samples_per_second": 0.911, "train_steps_per_second": 0.007 }