japanese-mistral-300m-base / all_results.json
ce-lery's picture
feat: pretrained by recipe v0.1.0
c783850
{
"epoch": 1.0,
"eval_loss": 3.5582468509674072,
"eval_runtime": 6274.8366,
"eval_samples": 551057,
"eval_samples_per_second": 87.82,
"eval_steps_per_second": 21.955,
"perplexity": 35.10160482608155,
"train_loss": 3.89913355111991,
"train_runtime": 393554.9634,
"train_samples": 10794765,
"train_samples_per_second": 27.429,
"train_steps_per_second": 0.107
}