roberta_new / train_results.json
prajjwal1
better; improved; added tests :)
abd1737
{
"epoch": 4.0,
"init_mem_cpu_alloc_delta": 1738252288,
"init_mem_cpu_peaked_delta": 205234176,
"init_mem_gpu_alloc_delta": 1421448192,
"init_mem_gpu_peaked_delta": 0,
"train_mem_cpu_alloc_delta": 96493568,
"train_mem_cpu_peaked_delta": 411959296,
"train_mem_gpu_alloc_delta": 4272819712,
"train_mem_gpu_peaked_delta": 10925989888,
"train_runtime": 11120.1386,
"train_samples_per_second": 1.865
}