danish-legal-lm-base / all_results.json
kiddothe2b
500k training steps with 128 tokens
5443746
{
"epoch": 53.58,
"eval_loss": 0.7302267551422119,
"eval_runtime": 3.6523,
"eval_samples_per_second": 2738.025,
"eval_steps_per_second": 21.63,
"perplexity": 2.0755511962245876,
"train_loss": 1.193239736328125,
"train_runtime": 102111.9968,
"train_samples_per_second": 1253.526,
"train_steps_per_second": 4.897
}