xlnet-base-cased-best / train_results.json
Edward Gow-Smith
added model
ede4aa7
{
"epoch": 3.0,
"init_mem_cpu_alloc_delta": 894615552,
"init_mem_cpu_peaked_delta": 464302080,
"init_mem_gpu_alloc_delta": 469504512,
"init_mem_gpu_peaked_delta": 0,
"train_mem_cpu_alloc_delta": 32620544,
"train_mem_cpu_peaked_delta": 0,
"train_mem_gpu_alloc_delta": 1454737920,
"train_mem_gpu_peaked_delta": 4411375616,
"train_runtime": 539.9891,
"train_samples": 3327,
"train_samples_per_second": 0.578
}