{ "best_metric": 0.14910581707954407, "best_model_checkpoint": "speech-multiclassifier-run-2/checkpoint-3192", "epoch": 5.0, "global_step": 15960, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.16, "learning_rate": 1.9373433583959903e-05, "loss": 0.2984, "step": 500 }, { "epoch": 0.31, "learning_rate": 1.87468671679198e-05, "loss": 0.2101, "step": 1000 }, { "epoch": 0.47, "learning_rate": 1.81203007518797e-05, "loss": 0.2104, "step": 1500 }, { "epoch": 0.63, "learning_rate": 1.74937343358396e-05, "loss": 0.1926, "step": 2000 }, { "epoch": 0.78, "learning_rate": 1.68671679197995e-05, "loss": 0.1981, "step": 2500 }, { "epoch": 0.94, "learning_rate": 1.62406015037594e-05, "loss": 0.1808, "step": 3000 }, { "epoch": 1.0, "eval_loss": 0.14910581707954407, "eval_overall-accuracy": 0.9499647639182522, "eval_overall-f1": 0.9499647639182522, "eval_overall-precision": 0.9499647639182522, "eval_overall-recall": 0.9499647639182522, "eval_runtime": 79.4483, "eval_samples_per_second": 35.721, "eval_steps_per_second": 2.24, "step": 3192 }, { "epoch": 1.1, "learning_rate": 1.56140350877193e-05, "loss": 0.1611, "step": 3500 }, { "epoch": 1.25, "learning_rate": 1.49874686716792e-05, "loss": 0.1598, "step": 4000 }, { "epoch": 1.41, "learning_rate": 1.43609022556391e-05, "loss": 0.1544, "step": 4500 }, { "epoch": 1.57, "learning_rate": 1.3734335839598997e-05, "loss": 0.1536, "step": 5000 }, { "epoch": 1.72, "learning_rate": 1.3107769423558898e-05, "loss": 0.1518, "step": 5500 }, { "epoch": 1.88, "learning_rate": 1.2481203007518798e-05, "loss": 0.1567, "step": 6000 }, { "epoch": 2.0, "eval_loss": 0.1555911898612976, "eval_overall-accuracy": 0.9513742071881607, "eval_overall-f1": 0.9513742071881607, "eval_overall-precision": 0.9513742071881607, "eval_overall-recall": 0.9513742071881607, "eval_runtime": 78.9404, "eval_samples_per_second": 35.951, "eval_steps_per_second": 2.255, "step": 6384 }, { "epoch": 2.04, "learning_rate": 1.18546365914787e-05, "loss": 0.1468, "step": 6500 }, { "epoch": 2.19, "learning_rate": 1.1228070175438597e-05, "loss": 0.1265, "step": 7000 }, { "epoch": 2.35, "learning_rate": 1.0601503759398497e-05, "loss": 0.1211, "step": 7500 }, { "epoch": 2.51, "learning_rate": 9.974937343358396e-06, "loss": 0.1232, "step": 8000 }, { "epoch": 2.66, "learning_rate": 9.348370927318296e-06, "loss": 0.1215, "step": 8500 }, { "epoch": 2.82, "learning_rate": 8.721804511278195e-06, "loss": 0.114, "step": 9000 }, { "epoch": 2.98, "learning_rate": 8.095238095238097e-06, "loss": 0.1328, "step": 9500 }, { "epoch": 3.0, "eval_loss": 0.17720717191696167, "eval_overall-accuracy": 0.952431289640592, "eval_overall-f1": 0.952431289640592, "eval_overall-precision": 0.952431289640592, "eval_overall-recall": 0.952431289640592, "eval_runtime": 78.7543, "eval_samples_per_second": 36.036, "eval_steps_per_second": 2.26, "step": 9576 }, { "epoch": 3.13, "learning_rate": 7.468671679197995e-06, "loss": 0.1011, "step": 10000 }, { "epoch": 3.29, "learning_rate": 6.842105263157896e-06, "loss": 0.0942, "step": 10500 }, { "epoch": 3.45, "learning_rate": 6.215538847117794e-06, "loss": 0.0994, "step": 11000 }, { "epoch": 3.6, "learning_rate": 5.588972431077695e-06, "loss": 0.1042, "step": 11500 }, { "epoch": 3.76, "learning_rate": 4.962406015037594e-06, "loss": 0.0993, "step": 12000 }, { "epoch": 3.92, "learning_rate": 4.335839598997494e-06, "loss": 0.0954, "step": 12500 }, { "epoch": 4.0, "eval_loss": 0.1867782473564148, "eval_overall-accuracy": 0.95630725863284, "eval_overall-f1": 0.95630725863284, "eval_overall-precision": 0.95630725863284, "eval_overall-recall": 0.95630725863284, "eval_runtime": 79.4309, "eval_samples_per_second": 35.729, "eval_steps_per_second": 2.241, "step": 12768 }, { "epoch": 4.07, "learning_rate": 3.7092731829573934e-06, "loss": 0.0798, "step": 13000 }, { "epoch": 4.23, "learning_rate": 3.0827067669172934e-06, "loss": 0.0773, "step": 13500 }, { "epoch": 4.39, "learning_rate": 2.456140350877193e-06, "loss": 0.0827, "step": 14000 }, { "epoch": 4.54, "learning_rate": 1.8295739348370927e-06, "loss": 0.0857, "step": 14500 }, { "epoch": 4.7, "learning_rate": 1.2030075187969925e-06, "loss": 0.0758, "step": 15000 }, { "epoch": 4.86, "learning_rate": 5.764411027568922e-07, "loss": 0.0756, "step": 15500 }, { "epoch": 5.0, "eval_loss": 0.20741401612758636, "eval_overall-accuracy": 0.9570119802677942, "eval_overall-f1": 0.9570119802677942, "eval_overall-precision": 0.9570119802677942, "eval_overall-recall": 0.9570119802677942, "eval_runtime": 80.2735, "eval_samples_per_second": 35.354, "eval_steps_per_second": 2.217, "step": 15960 } ], "max_steps": 15960, "num_train_epochs": 5, "total_flos": 4401666409805172.0, "trial_name": null, "trial_params": null }