Phi_3_Luna_LoRA / training_log.json
jeiku's picture
Upload 6 files
23939ae verified
{
"base_model_name": "kaitchup_Phi-3-mini-4k-instruct-gptq-4bit",
"base_model_class": "Phi3ForCausalLM",
"base_loaded_in_4bit": false,
"base_loaded_in_8bit": false,
"projections": "gate, down, up, q, v, k, o",
"loss": 2.3226,
"grad_norm": 0.7724075317382812,
"learning_rate": 3.968661679220468e-06,
"epoch": 4.68,
"current_steps": 375,
"train_runtime": 6909.537,
"train_samples_per_second": 0.284,
"train_steps_per_second": 0.002,
"total_flos": 6400703559892992.0,
"train_loss": 2.412670890490214
}