{ "before_init_mem_cpu": 19409301504, "before_init_mem_gpu": 514785792, "epoch": 5.0, "eval_accuracy": 0.5020384866275277, "eval_loss": 2.396484375, "eval_mem_cpu_alloc_delta": 1241088, "eval_mem_cpu_peaked_delta": 0, "eval_mem_gpu_alloc_delta": 0, "eval_mem_gpu_peaked_delta": 13894116352, "eval_runtime": 7.6383, "eval_samples": 24, "eval_samples_per_second": 3.142, "eval_steps_per_second": 0.131, "init_mem_cpu_alloc_delta": 20480, "init_mem_cpu_peaked_delta": 0, "init_mem_gpu_alloc_delta": 0, "init_mem_gpu_peaked_delta": 0, "perplexity": 10.984491067549964, "train_loss": 2.6133464177449546, "train_mem_cpu_alloc_delta": 87850864640, "train_mem_cpu_peaked_delta": 4164583424, "train_mem_gpu_alloc_delta": -456804352, "train_mem_gpu_peaked_delta": 13894116352, "train_runtime": 736.506, "train_samples": 165, "train_samples_per_second": 1.12, "train_steps_per_second": 0.02 }