zephyr7b_prompts / training_log.json
Jon
Upload 8 files
eb03016
raw
history blame contribute delete
519 Bytes
{
"base_model_name": "HuggingFaceH4_zephyr-7b-alpha",
"base_model_class": "MistralForCausalLM",
"base_loaded_in_4bit": true,
"base_loaded_in_8bit": false,
"projections": "q, v",
"loss": 0.5865,
"learning_rate": 2.727272727272727e-05,
"epoch": 3.0,
"current_steps": 209,
"current_steps_adjusted": 209,
"epoch_adjusted": 3.0,
"train_runtime": 152.7978,
"train_samples_per_second": 5.478,
"train_steps_per_second": 1.374,
"total_flos": 9159217237721088.0,
"train_loss": 1.2863307027589708
}