{ "epoch": 30.0, "eval_loss": 0.027720022946596146, "eval_mem_cpu_alloc_delta": 0, "eval_mem_cpu_peaked_delta": 0, "eval_mem_gpu_alloc_delta": 0, "eval_mem_gpu_peaked_delta": 569275904, "eval_runtime": 8.6733, "eval_samples": 49, "eval_samples_per_second": 5.65, "init_mem_cpu_alloc_delta": 702398464, "init_mem_cpu_peaked_delta": 0, "init_mem_gpu_alloc_delta": 1370738688, "init_mem_gpu_peaked_delta": 0, "perplexity": 1.0281077975307098, "train_mem_cpu_alloc_delta": 18444288, "train_mem_cpu_peaked_delta": 0, "train_mem_gpu_alloc_delta": 4036706816, "train_mem_gpu_peaked_delta": 8663361536, "train_runtime": 924.1697, "train_samples": 49, "train_samples_per_second": 1.591 }