ADDI-IT-GPT2 / train_results.json
gantenbe
italian finetuning
060a8d4
{
"epoch": 1.0,
"init_mem_cpu_alloc_delta": 336807,
"init_mem_cpu_peaked_delta": 18306,
"init_mem_gpu_alloc_delta": 511148032,
"init_mem_gpu_peaked_delta": 0,
"train_mem_cpu_alloc_delta": 488444,
"train_mem_cpu_peaked_delta": 195767,
"train_mem_gpu_alloc_delta": 1501967872,
"train_mem_gpu_peaked_delta": 3374894592,
"train_runtime": 34.4014,
"train_samples": 128,
"train_samples_per_second": 3.721
}