{ "epoch": 3.0, "eval_gen_len": 59.9829, "eval_loss": 1.3891159296035767, "eval_mem_cpu_alloc_delta": 78528783, "eval_mem_cpu_peaked_delta": 2605953, "eval_mem_gpu_alloc_delta": 0, "eval_mem_gpu_peaked_delta": 980464128, "eval_rouge1": 42.621, "eval_rouge2": 21.9825, "eval_rougeL": 33.034, "eval_rougeLsum": 39.6783, "eval_runtime": 29.301, "eval_samples": 818, "eval_samples_per_second": 27.917, "init_mem_cpu_alloc_delta": 180674, "init_mem_cpu_peaked_delta": 18282, "init_mem_gpu_alloc_delta": 1625362944, "init_mem_gpu_peaked_delta": 0, "test_gen_len": 60.0757, "test_loss": 1.4224162101745605, "test_mem_cpu_alloc_delta": 82666029, "test_mem_cpu_peaked_delta": 2572070, "test_mem_gpu_alloc_delta": 0, "test_mem_gpu_peaked_delta": 1441433088, "test_rouge1": 41.3174, "test_rouge2": 20.8716, "test_rougeL": 32.1337, "test_rougeLsum": 38.4149, "test_runtime": 34.32, "test_samples": 819, "test_samples_per_second": 23.864, "train_mem_cpu_alloc_delta": 7544164, "train_mem_cpu_peaked_delta": 413671172, "train_mem_gpu_alloc_delta": 6524230144, "train_mem_gpu_peaked_delta": 12734977024, "train_runtime": 363.7124, "train_samples": 14732, "train_samples_per_second": 1.905 }