{ "base_model_name": "mpasila_gpt3-finnish-8B-gptq-4bit", "base_model_class": "BloomForCausalLM", "base_loaded_in_4bit": false, "base_loaded_in_8bit": false, "projections": "query_key_value", "loss": 2.0361, "grad_norm": 0.1468171924352646, "learning_rate": 3.1034482758620685e-05, "epoch": 2.98, "current_steps": 1051, "train_runtime": 8426.1409, "train_samples_per_second": 0.504, "train_steps_per_second": 0.004, "total_flos": 2618215184203776.0, "train_loss": 2.226992231426817 }