3.68 kB
{ | |
"best_metric": null, | |
"best_model_checkpoint": null, | |
"epoch": 0.5266468686454935, | |
"global_step": 4500, | |
"is_hyper_param_search": false, | |
"is_local_process_zero": true, | |
"is_world_process_zero": true, | |
"log_history": [ | |
{ | |
"epoch": 0.06, | |
"learning_rate": 0.00015, | |
"loss": 2.5393, | |
"step": 500 | |
}, | |
{ | |
"epoch": 0.06, | |
"eval_loss": 0.4428945779800415, | |
"eval_phone_accuracy": 0.9003876271495096, | |
"eval_runtime": 16.8778, | |
"eval_samples_per_second": 11.85, | |
"eval_steps_per_second": 2.962, | |
"step": 500 | |
}, | |
{ | |
"epoch": 0.12, | |
"learning_rate": 0.0003, | |
"loss": 0.4474, | |
"step": 1000 | |
}, | |
{ | |
"epoch": 0.12, | |
"eval_loss": 0.2071739137172699, | |
"eval_phone_accuracy": 0.9347190787134594, | |
"eval_runtime": 15.9974, | |
"eval_samples_per_second": 12.502, | |
"eval_steps_per_second": 3.126, | |
"step": 1000 | |
}, | |
{ | |
"epoch": 0.18, | |
"learning_rate": 0.00028011664899257687, | |
"loss": 0.3105, | |
"step": 1500 | |
}, | |
{ | |
"epoch": 0.18, | |
"eval_loss": 0.174857959151268, | |
"eval_phone_accuracy": 0.94312200282699, | |
"eval_runtime": 16.5779, | |
"eval_samples_per_second": 12.064, | |
"eval_steps_per_second": 3.016, | |
"step": 1500 | |
}, | |
{ | |
"epoch": 0.23, | |
"learning_rate": 0.0002602332979851537, | |
"loss": 0.2682, | |
"step": 2000 | |
}, | |
{ | |
"epoch": 0.23, | |
"eval_loss": 0.16749557852745056, | |
"eval_phone_accuracy": 0.9447956502510471, | |
"eval_runtime": 15.1084, | |
"eval_samples_per_second": 13.238, | |
"eval_steps_per_second": 3.309, | |
"step": 2000 | |
}, | |
{ | |
"epoch": 0.29, | |
"learning_rate": 0.0002403499469777306, | |
"loss": 0.2467, | |
"step": 2500 | |
}, | |
{ | |
"epoch": 0.29, | |
"eval_loss": 0.15832921862602234, | |
"eval_phone_accuracy": 0.9478567774048926, | |
"eval_runtime": 14.9641, | |
"eval_samples_per_second": 13.365, | |
"eval_steps_per_second": 3.341, | |
"step": 2500 | |
}, | |
{ | |
"epoch": 0.35, | |
"learning_rate": 0.00022046659597030753, | |
"loss": 0.2324, | |
"step": 3000 | |
}, | |
{ | |
"epoch": 0.35, | |
"eval_loss": 0.14310674369335175, | |
"eval_phone_accuracy": 0.949885966509708, | |
"eval_runtime": 15.0339, | |
"eval_samples_per_second": 13.303, | |
"eval_steps_per_second": 3.326, | |
"step": 3000 | |
}, | |
{ | |
"epoch": 0.41, | |
"learning_rate": 0.0002005832449628844, | |
"loss": 0.22, | |
"step": 3500 | |
}, | |
{ | |
"epoch": 0.41, | |
"eval_loss": 0.13784204423427582, | |
"eval_phone_accuracy": 0.9521579645672364, | |
"eval_runtime": 16.1699, | |
"eval_samples_per_second": 12.369, | |
"eval_steps_per_second": 3.092, | |
"step": 3500 | |
}, | |
{ | |
"epoch": 0.47, | |
"learning_rate": 0.0001806998939554613, | |
"loss": 0.2109, | |
"step": 4000 | |
}, | |
{ | |
"epoch": 0.47, | |
"eval_loss": 0.1341935396194458, | |
"eval_phone_accuracy": 0.9543519168899642, | |
"eval_runtime": 15.6229, | |
"eval_samples_per_second": 12.802, | |
"eval_steps_per_second": 3.2, | |
"step": 4000 | |
}, | |
{ | |
"epoch": 0.53, | |
"learning_rate": 0.00016081654294803816, | |
"loss": 0.2039, | |
"step": 4500 | |
}, | |
{ | |
"epoch": 0.53, | |
"eval_loss": 0.13459673523902893, | |
"eval_phone_accuracy": 0.9526435824726623, | |
"eval_runtime": 15.5354, | |
"eval_samples_per_second": 12.874, | |
"eval_steps_per_second": 3.218, | |
"step": 4500 | |
} | |
], | |
"max_steps": 8544, | |
"num_train_epochs": 1, | |
"total_flos": 7.300030651149006e+19, | |
"trial_name": null, | |
"trial_params": null | |
} | |