gpt2_xl_discovery / train_results.txt
prajjwal1
v1
738a15a
epoch = 3.0
train_runtime = 251423.0864
train_samples_per_second = 0.419