{ "base_model_name": "NousResearch_Llama-2-7b-hf", "base_model_class": "LlamaForCausalLM", "base_loaded_in_4bit": true, "base_loaded_in_8bit": false, "projections": "q, v", "loss": 1.0448, "learning_rate": 0.0, "epoch": 1.99, "current_steps": 18900, "train_runtime": 59350.6837, "train_samples_per_second": 0.641, "train_steps_per_second": 0.005, "total_flos": 7.999500885153546e+17, "train_loss": 1.075667697835613 }