ce-lery's picture
feat: fine-tuning japanese-mistral-300M-base with databricks-dolly-15k-ja
025d0db
{
"epoch": 193.14,
"eval_loss": 2.513946056365967,
"eval_runtime": 4.6377,
"eval_samples": 313,
"eval_samples_per_second": 67.49,
"eval_steps_per_second": 17.034,
"perplexity": 12.353581936499637,
"train_loss": 2.2616969472711737,
"train_runtime": 20093.6832,
"train_samples": 2916,
"train_samples_per_second": 29.024,
"train_steps_per_second": 0.109
}