roberta_hellaswag / train_results.json
prajjwal1
v1
4014e15
{
"epoch": 4.0,
"init_mem_cpu_alloc_delta": 2172727296,
"init_mem_cpu_peaked_delta": 1010765824,
"init_mem_gpu_alloc_delta": 1421448192,
"init_mem_gpu_peaked_delta": 0,
"train_mem_cpu_alloc_delta": 360235008,
"train_mem_cpu_peaked_delta": 411705344,
"train_mem_gpu_alloc_delta": 4275038720,
"train_mem_gpu_peaked_delta": 15916604928,
"train_runtime": 4895.7804,
"train_samples": 39905,
"train_samples_per_second": 1.02
}