{ "best_metric": 0.8918716694264321, "best_model_checkpoint": "/mnt/disks/vikram-disk-video-umd-2/macd/Hindi-/mnt/disks/vikram-disk-video-umd-2/macd/macd_finetuned_epoch_50/checkpoint-3020000-combined-1.0-5-393-5/checkpoint-22864", "epoch": 2.0, "global_step": 22864, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.04, "learning_rate": 1.9825052484254726e-05, "loss": 0.4099, "step": 500 }, { "epoch": 0.09, "learning_rate": 1.965010496850945e-05, "loss": 0.3527, "step": 1000 }, { "epoch": 0.13, "learning_rate": 1.9475157452764174e-05, "loss": 0.3385, "step": 1500 }, { "epoch": 0.17, "learning_rate": 1.9300209937018895e-05, "loss": 0.3327, "step": 2000 }, { "epoch": 0.22, "learning_rate": 1.912526242127362e-05, "loss": 0.3485, "step": 2500 }, { "epoch": 0.26, "learning_rate": 1.8950314905528343e-05, "loss": 0.3163, "step": 3000 }, { "epoch": 0.31, "learning_rate": 1.8775367389783064e-05, "loss": 0.3376, "step": 3500 }, { "epoch": 0.35, "learning_rate": 1.860041987403779e-05, "loss": 0.3247, "step": 4000 }, { "epoch": 0.39, "learning_rate": 1.8425472358292513e-05, "loss": 0.3302, "step": 4500 }, { "epoch": 0.44, "learning_rate": 1.8250524842547237e-05, "loss": 0.3297, "step": 5000 }, { "epoch": 0.48, "learning_rate": 1.807557732680196e-05, "loss": 0.3146, "step": 5500 }, { "epoch": 0.52, "learning_rate": 1.7900629811056685e-05, "loss": 0.3082, "step": 6000 }, { "epoch": 0.57, "learning_rate": 1.772568229531141e-05, "loss": 0.3276, "step": 6500 }, { "epoch": 0.61, "learning_rate": 1.7550734779566134e-05, "loss": 0.3217, "step": 7000 }, { "epoch": 0.66, "learning_rate": 1.7375787263820854e-05, "loss": 0.3191, "step": 7500 }, { "epoch": 0.7, "learning_rate": 1.720083974807558e-05, "loss": 0.3303, "step": 8000 }, { "epoch": 0.74, "learning_rate": 1.7025892232330303e-05, "loss": 0.3088, "step": 8500 }, { "epoch": 0.79, "learning_rate": 1.6850944716585024e-05, "loss": 0.3182, "step": 9000 }, { "epoch": 0.83, "learning_rate": 1.6675997200839748e-05, "loss": 0.3187, "step": 9500 }, { "epoch": 0.87, "learning_rate": 1.6501049685094472e-05, "loss": 0.3116, "step": 10000 }, { "epoch": 0.92, "learning_rate": 1.6326102169349196e-05, "loss": 0.2925, "step": 10500 }, { "epoch": 0.96, "learning_rate": 1.615115465360392e-05, "loss": 0.3108, "step": 11000 }, { "epoch": 1.0, "eval_accuracy": 0.8909299655568312, "eval_f1_macro": 0.8909188308491909, "eval_loss": 0.2862579822540283, "eval_runtime": 87.3812, "eval_samples_per_second": 348.874, "eval_steps_per_second": 43.613, "step": 11432 }, { "epoch": 1.01, "learning_rate": 1.5976207137858644e-05, "loss": 0.3088, "step": 11500 }, { "epoch": 1.05, "learning_rate": 1.580125962211337e-05, "loss": 0.2665, "step": 12000 }, { "epoch": 1.09, "learning_rate": 1.562631210636809e-05, "loss": 0.2772, "step": 12500 }, { "epoch": 1.14, "learning_rate": 1.5451364590622814e-05, "loss": 0.2747, "step": 13000 }, { "epoch": 1.18, "learning_rate": 1.5276417074877538e-05, "loss": 0.2672, "step": 13500 }, { "epoch": 1.22, "learning_rate": 1.5101469559132262e-05, "loss": 0.2632, "step": 14000 }, { "epoch": 1.27, "learning_rate": 1.4926522043386986e-05, "loss": 0.2531, "step": 14500 }, { "epoch": 1.31, "learning_rate": 1.4751574527641707e-05, "loss": 0.2885, "step": 15000 }, { "epoch": 1.36, "learning_rate": 1.4576627011896431e-05, "loss": 0.2643, "step": 15500 }, { "epoch": 1.4, "learning_rate": 1.4401679496151155e-05, "loss": 0.2834, "step": 16000 }, { "epoch": 1.44, "learning_rate": 1.422673198040588e-05, "loss": 0.2915, "step": 16500 }, { "epoch": 1.49, "learning_rate": 1.4051784464660602e-05, "loss": 0.265, "step": 17000 }, { "epoch": 1.53, "learning_rate": 1.3876836948915326e-05, "loss": 0.2729, "step": 17500 }, { "epoch": 1.57, "learning_rate": 1.370188943317005e-05, "loss": 0.2719, "step": 18000 }, { "epoch": 1.62, "learning_rate": 1.3526941917424775e-05, "loss": 0.2621, "step": 18500 }, { "epoch": 1.66, "learning_rate": 1.3351994401679497e-05, "loss": 0.2862, "step": 19000 }, { "epoch": 1.71, "learning_rate": 1.3177046885934221e-05, "loss": 0.2662, "step": 19500 }, { "epoch": 1.75, "learning_rate": 1.3002099370188946e-05, "loss": 0.2905, "step": 20000 }, { "epoch": 1.79, "learning_rate": 1.2827151854443666e-05, "loss": 0.271, "step": 20500 }, { "epoch": 1.84, "learning_rate": 1.265220433869839e-05, "loss": 0.277, "step": 21000 }, { "epoch": 1.88, "learning_rate": 1.2477256822953115e-05, "loss": 0.2681, "step": 21500 }, { "epoch": 1.92, "learning_rate": 1.2302309307207839e-05, "loss": 0.2685, "step": 22000 }, { "epoch": 1.97, "learning_rate": 1.2127361791462561e-05, "loss": 0.2595, "step": 22500 }, { "epoch": 2.0, "eval_accuracy": 0.8918812530752829, "eval_f1_macro": 0.8918716694264321, "eval_loss": 0.39037129282951355, "eval_runtime": 87.141, "eval_samples_per_second": 349.835, "eval_steps_per_second": 43.734, "step": 22864 } ], "max_steps": 57160, "num_train_epochs": 5, "total_flos": 4.812406446956544e+16, "trial_name": null, "trial_params": null }