ADDI-CH-XLM-R / train_results.json
gantenbe
swiss training
3f24058
{
"epoch": 1.0,
"init_mem_cpu_alloc_delta": 347038,
"init_mem_cpu_peaked_delta": 18306,
"init_mem_gpu_alloc_delta": 1109893120,
"init_mem_gpu_peaked_delta": 0,
"train_mem_cpu_alloc_delta": 894426,
"train_mem_cpu_peaked_delta": 4141937,
"train_mem_gpu_alloc_delta": 3345894400,
"train_mem_gpu_peaked_delta": 3577686016,
"train_runtime": 4566.3645,
"train_samples": 90000,
"train_samples_per_second": 2.464
}