|
{ |
|
"best_metric": 0.8918716694264321, |
|
"best_model_checkpoint": "/mnt/disks/vikram-disk-video-umd-2/macd/Hindi-/mnt/disks/vikram-disk-video-umd-2/macd/macd_finetuned_epoch_50/checkpoint-3020000-combined-1.0-5-393-5/checkpoint-22864", |
|
"epoch": 2.0, |
|
"global_step": 22864, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 0.04, |
|
"learning_rate": 1.9825052484254726e-05, |
|
"loss": 0.4099, |
|
"step": 500 |
|
}, |
|
{ |
|
"epoch": 0.09, |
|
"learning_rate": 1.965010496850945e-05, |
|
"loss": 0.3527, |
|
"step": 1000 |
|
}, |
|
{ |
|
"epoch": 0.13, |
|
"learning_rate": 1.9475157452764174e-05, |
|
"loss": 0.3385, |
|
"step": 1500 |
|
}, |
|
{ |
|
"epoch": 0.17, |
|
"learning_rate": 1.9300209937018895e-05, |
|
"loss": 0.3327, |
|
"step": 2000 |
|
}, |
|
{ |
|
"epoch": 0.22, |
|
"learning_rate": 1.912526242127362e-05, |
|
"loss": 0.3485, |
|
"step": 2500 |
|
}, |
|
{ |
|
"epoch": 0.26, |
|
"learning_rate": 1.8950314905528343e-05, |
|
"loss": 0.3163, |
|
"step": 3000 |
|
}, |
|
{ |
|
"epoch": 0.31, |
|
"learning_rate": 1.8775367389783064e-05, |
|
"loss": 0.3376, |
|
"step": 3500 |
|
}, |
|
{ |
|
"epoch": 0.35, |
|
"learning_rate": 1.860041987403779e-05, |
|
"loss": 0.3247, |
|
"step": 4000 |
|
}, |
|
{ |
|
"epoch": 0.39, |
|
"learning_rate": 1.8425472358292513e-05, |
|
"loss": 0.3302, |
|
"step": 4500 |
|
}, |
|
{ |
|
"epoch": 0.44, |
|
"learning_rate": 1.8250524842547237e-05, |
|
"loss": 0.3297, |
|
"step": 5000 |
|
}, |
|
{ |
|
"epoch": 0.48, |
|
"learning_rate": 1.807557732680196e-05, |
|
"loss": 0.3146, |
|
"step": 5500 |
|
}, |
|
{ |
|
"epoch": 0.52, |
|
"learning_rate": 1.7900629811056685e-05, |
|
"loss": 0.3082, |
|
"step": 6000 |
|
}, |
|
{ |
|
"epoch": 0.57, |
|
"learning_rate": 1.772568229531141e-05, |
|
"loss": 0.3276, |
|
"step": 6500 |
|
}, |
|
{ |
|
"epoch": 0.61, |
|
"learning_rate": 1.7550734779566134e-05, |
|
"loss": 0.3217, |
|
"step": 7000 |
|
}, |
|
{ |
|
"epoch": 0.66, |
|
"learning_rate": 1.7375787263820854e-05, |
|
"loss": 0.3191, |
|
"step": 7500 |
|
}, |
|
{ |
|
"epoch": 0.7, |
|
"learning_rate": 1.720083974807558e-05, |
|
"loss": 0.3303, |
|
"step": 8000 |
|
}, |
|
{ |
|
"epoch": 0.74, |
|
"learning_rate": 1.7025892232330303e-05, |
|
"loss": 0.3088, |
|
"step": 8500 |
|
}, |
|
{ |
|
"epoch": 0.79, |
|
"learning_rate": 1.6850944716585024e-05, |
|
"loss": 0.3182, |
|
"step": 9000 |
|
}, |
|
{ |
|
"epoch": 0.83, |
|
"learning_rate": 1.6675997200839748e-05, |
|
"loss": 0.3187, |
|
"step": 9500 |
|
}, |
|
{ |
|
"epoch": 0.87, |
|
"learning_rate": 1.6501049685094472e-05, |
|
"loss": 0.3116, |
|
"step": 10000 |
|
}, |
|
{ |
|
"epoch": 0.92, |
|
"learning_rate": 1.6326102169349196e-05, |
|
"loss": 0.2925, |
|
"step": 10500 |
|
}, |
|
{ |
|
"epoch": 0.96, |
|
"learning_rate": 1.615115465360392e-05, |
|
"loss": 0.3108, |
|
"step": 11000 |
|
}, |
|
{ |
|
"epoch": 1.0, |
|
"eval_accuracy": 0.8909299655568312, |
|
"eval_f1_macro": 0.8909188308491909, |
|
"eval_loss": 0.2862579822540283, |
|
"eval_runtime": 87.3812, |
|
"eval_samples_per_second": 348.874, |
|
"eval_steps_per_second": 43.613, |
|
"step": 11432 |
|
}, |
|
{ |
|
"epoch": 1.01, |
|
"learning_rate": 1.5976207137858644e-05, |
|
"loss": 0.3088, |
|
"step": 11500 |
|
}, |
|
{ |
|
"epoch": 1.05, |
|
"learning_rate": 1.580125962211337e-05, |
|
"loss": 0.2665, |
|
"step": 12000 |
|
}, |
|
{ |
|
"epoch": 1.09, |
|
"learning_rate": 1.562631210636809e-05, |
|
"loss": 0.2772, |
|
"step": 12500 |
|
}, |
|
{ |
|
"epoch": 1.14, |
|
"learning_rate": 1.5451364590622814e-05, |
|
"loss": 0.2747, |
|
"step": 13000 |
|
}, |
|
{ |
|
"epoch": 1.18, |
|
"learning_rate": 1.5276417074877538e-05, |
|
"loss": 0.2672, |
|
"step": 13500 |
|
}, |
|
{ |
|
"epoch": 1.22, |
|
"learning_rate": 1.5101469559132262e-05, |
|
"loss": 0.2632, |
|
"step": 14000 |
|
}, |
|
{ |
|
"epoch": 1.27, |
|
"learning_rate": 1.4926522043386986e-05, |
|
"loss": 0.2531, |
|
"step": 14500 |
|
}, |
|
{ |
|
"epoch": 1.31, |
|
"learning_rate": 1.4751574527641707e-05, |
|
"loss": 0.2885, |
|
"step": 15000 |
|
}, |
|
{ |
|
"epoch": 1.36, |
|
"learning_rate": 1.4576627011896431e-05, |
|
"loss": 0.2643, |
|
"step": 15500 |
|
}, |
|
{ |
|
"epoch": 1.4, |
|
"learning_rate": 1.4401679496151155e-05, |
|
"loss": 0.2834, |
|
"step": 16000 |
|
}, |
|
{ |
|
"epoch": 1.44, |
|
"learning_rate": 1.422673198040588e-05, |
|
"loss": 0.2915, |
|
"step": 16500 |
|
}, |
|
{ |
|
"epoch": 1.49, |
|
"learning_rate": 1.4051784464660602e-05, |
|
"loss": 0.265, |
|
"step": 17000 |
|
}, |
|
{ |
|
"epoch": 1.53, |
|
"learning_rate": 1.3876836948915326e-05, |
|
"loss": 0.2729, |
|
"step": 17500 |
|
}, |
|
{ |
|
"epoch": 1.57, |
|
"learning_rate": 1.370188943317005e-05, |
|
"loss": 0.2719, |
|
"step": 18000 |
|
}, |
|
{ |
|
"epoch": 1.62, |
|
"learning_rate": 1.3526941917424775e-05, |
|
"loss": 0.2621, |
|
"step": 18500 |
|
}, |
|
{ |
|
"epoch": 1.66, |
|
"learning_rate": 1.3351994401679497e-05, |
|
"loss": 0.2862, |
|
"step": 19000 |
|
}, |
|
{ |
|
"epoch": 1.71, |
|
"learning_rate": 1.3177046885934221e-05, |
|
"loss": 0.2662, |
|
"step": 19500 |
|
}, |
|
{ |
|
"epoch": 1.75, |
|
"learning_rate": 1.3002099370188946e-05, |
|
"loss": 0.2905, |
|
"step": 20000 |
|
}, |
|
{ |
|
"epoch": 1.79, |
|
"learning_rate": 1.2827151854443666e-05, |
|
"loss": 0.271, |
|
"step": 20500 |
|
}, |
|
{ |
|
"epoch": 1.84, |
|
"learning_rate": 1.265220433869839e-05, |
|
"loss": 0.277, |
|
"step": 21000 |
|
}, |
|
{ |
|
"epoch": 1.88, |
|
"learning_rate": 1.2477256822953115e-05, |
|
"loss": 0.2681, |
|
"step": 21500 |
|
}, |
|
{ |
|
"epoch": 1.92, |
|
"learning_rate": 1.2302309307207839e-05, |
|
"loss": 0.2685, |
|
"step": 22000 |
|
}, |
|
{ |
|
"epoch": 1.97, |
|
"learning_rate": 1.2127361791462561e-05, |
|
"loss": 0.2595, |
|
"step": 22500 |
|
}, |
|
{ |
|
"epoch": 2.0, |
|
"eval_accuracy": 0.8918812530752829, |
|
"eval_f1_macro": 0.8918716694264321, |
|
"eval_loss": 0.39037129282951355, |
|
"eval_runtime": 87.141, |
|
"eval_samples_per_second": 349.835, |
|
"eval_steps_per_second": 43.734, |
|
"step": 22864 |
|
} |
|
], |
|
"max_steps": 57160, |
|
"num_train_epochs": 5, |
|
"total_flos": 4.812406446956544e+16, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|