|
{ |
|
"best_metric": 0.8, |
|
"best_model_checkpoint": "videomae-base-ipm_first_videos/checkpoint-123", |
|
"epoch": 48.00606060606061, |
|
"global_step": 146, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 0.01, |
|
"eval_accuracy": 0.22857142857142856, |
|
"eval_loss": 1.7709606885910034, |
|
"eval_runtime": 56.0244, |
|
"eval_samples_per_second": 0.625, |
|
"eval_steps_per_second": 0.161, |
|
"step": 3 |
|
}, |
|
{ |
|
"epoch": 1.01, |
|
"eval_accuracy": 0.14285714285714285, |
|
"eval_loss": 1.7788584232330322, |
|
"eval_runtime": 54.8936, |
|
"eval_samples_per_second": 0.638, |
|
"eval_steps_per_second": 0.164, |
|
"step": 6 |
|
}, |
|
{ |
|
"epoch": 2.01, |
|
"eval_accuracy": 0.08571428571428572, |
|
"eval_loss": 1.7939355373382568, |
|
"eval_runtime": 57.093, |
|
"eval_samples_per_second": 0.613, |
|
"eval_steps_per_second": 0.158, |
|
"step": 9 |
|
}, |
|
{ |
|
"epoch": 3.0, |
|
"learning_rate": 1.5151515151515153e-05, |
|
"loss": 1.7369, |
|
"step": 10 |
|
}, |
|
{ |
|
"epoch": 3.01, |
|
"eval_accuracy": 0.11428571428571428, |
|
"eval_loss": 1.8259599208831787, |
|
"eval_runtime": 49.6198, |
|
"eval_samples_per_second": 0.705, |
|
"eval_steps_per_second": 0.181, |
|
"step": 12 |
|
}, |
|
{ |
|
"epoch": 4.01, |
|
"eval_accuracy": 0.11428571428571428, |
|
"eval_loss": 1.8636661767959595, |
|
"eval_runtime": 47.6299, |
|
"eval_samples_per_second": 0.735, |
|
"eval_steps_per_second": 0.189, |
|
"step": 15 |
|
}, |
|
{ |
|
"epoch": 5.01, |
|
"eval_accuracy": 0.11428571428571428, |
|
"eval_loss": 1.916202187538147, |
|
"eval_runtime": 54.478, |
|
"eval_samples_per_second": 0.642, |
|
"eval_steps_per_second": 0.165, |
|
"step": 18 |
|
}, |
|
{ |
|
"epoch": 6.01, |
|
"learning_rate": 3.0303030303030306e-05, |
|
"loss": 1.6934, |
|
"step": 20 |
|
}, |
|
{ |
|
"epoch": 6.01, |
|
"eval_accuracy": 0.11428571428571428, |
|
"eval_loss": 1.979854702949524, |
|
"eval_runtime": 47.3817, |
|
"eval_samples_per_second": 0.739, |
|
"eval_steps_per_second": 0.19, |
|
"step": 21 |
|
}, |
|
{ |
|
"epoch": 7.01, |
|
"eval_accuracy": 0.11428571428571428, |
|
"eval_loss": 2.032222270965576, |
|
"eval_runtime": 47.048, |
|
"eval_samples_per_second": 0.744, |
|
"eval_steps_per_second": 0.191, |
|
"step": 24 |
|
}, |
|
{ |
|
"epoch": 8.01, |
|
"eval_accuracy": 0.11428571428571428, |
|
"eval_loss": 2.147186756134033, |
|
"eval_runtime": 56.4896, |
|
"eval_samples_per_second": 0.62, |
|
"eval_steps_per_second": 0.159, |
|
"step": 27 |
|
}, |
|
{ |
|
"epoch": 9.01, |
|
"learning_rate": 4.545454545454546e-05, |
|
"loss": 1.636, |
|
"step": 30 |
|
}, |
|
{ |
|
"epoch": 9.01, |
|
"eval_accuracy": 0.11428571428571428, |
|
"eval_loss": 2.201059103012085, |
|
"eval_runtime": 47.193, |
|
"eval_samples_per_second": 0.742, |
|
"eval_steps_per_second": 0.191, |
|
"step": 30 |
|
}, |
|
{ |
|
"epoch": 10.01, |
|
"eval_accuracy": 0.11428571428571428, |
|
"eval_loss": 2.3041186332702637, |
|
"eval_runtime": 49.6007, |
|
"eval_samples_per_second": 0.706, |
|
"eval_steps_per_second": 0.181, |
|
"step": 33 |
|
}, |
|
{ |
|
"epoch": 11.01, |
|
"eval_accuracy": 0.11428571428571428, |
|
"eval_loss": 2.202650785446167, |
|
"eval_runtime": 51.3674, |
|
"eval_samples_per_second": 0.681, |
|
"eval_steps_per_second": 0.175, |
|
"step": 36 |
|
}, |
|
{ |
|
"epoch": 12.01, |
|
"eval_accuracy": 0.11428571428571428, |
|
"eval_loss": 2.1011433601379395, |
|
"eval_runtime": 47.3736, |
|
"eval_samples_per_second": 0.739, |
|
"eval_steps_per_second": 0.19, |
|
"step": 39 |
|
}, |
|
{ |
|
"epoch": 13.0, |
|
"learning_rate": 4.882154882154882e-05, |
|
"loss": 1.6069, |
|
"step": 40 |
|
}, |
|
{ |
|
"epoch": 13.01, |
|
"eval_accuracy": 0.11428571428571428, |
|
"eval_loss": 2.0470354557037354, |
|
"eval_runtime": 52.7055, |
|
"eval_samples_per_second": 0.664, |
|
"eval_steps_per_second": 0.171, |
|
"step": 42 |
|
}, |
|
{ |
|
"epoch": 14.01, |
|
"eval_accuracy": 0.11428571428571428, |
|
"eval_loss": 1.9688891172409058, |
|
"eval_runtime": 46.2559, |
|
"eval_samples_per_second": 0.757, |
|
"eval_steps_per_second": 0.195, |
|
"step": 45 |
|
}, |
|
{ |
|
"epoch": 15.01, |
|
"eval_accuracy": 0.11428571428571428, |
|
"eval_loss": 1.911560297012329, |
|
"eval_runtime": 55.4227, |
|
"eval_samples_per_second": 0.632, |
|
"eval_steps_per_second": 0.162, |
|
"step": 48 |
|
}, |
|
{ |
|
"epoch": 16.01, |
|
"learning_rate": 4.713804713804714e-05, |
|
"loss": 1.6509, |
|
"step": 50 |
|
}, |
|
{ |
|
"epoch": 16.01, |
|
"eval_accuracy": 0.11428571428571428, |
|
"eval_loss": 1.9125531911849976, |
|
"eval_runtime": 55.4531, |
|
"eval_samples_per_second": 0.631, |
|
"eval_steps_per_second": 0.162, |
|
"step": 51 |
|
}, |
|
{ |
|
"epoch": 17.01, |
|
"eval_accuracy": 0.11428571428571428, |
|
"eval_loss": 2.038973808288574, |
|
"eval_runtime": 47.6175, |
|
"eval_samples_per_second": 0.735, |
|
"eval_steps_per_second": 0.189, |
|
"step": 54 |
|
}, |
|
{ |
|
"epoch": 18.01, |
|
"eval_accuracy": 0.11428571428571428, |
|
"eval_loss": 1.904532551765442, |
|
"eval_runtime": 47.9854, |
|
"eval_samples_per_second": 0.729, |
|
"eval_steps_per_second": 0.188, |
|
"step": 57 |
|
}, |
|
{ |
|
"epoch": 19.01, |
|
"learning_rate": 4.545454545454546e-05, |
|
"loss": 1.5023, |
|
"step": 60 |
|
}, |
|
{ |
|
"epoch": 19.01, |
|
"eval_accuracy": 0.11428571428571428, |
|
"eval_loss": 1.796205759048462, |
|
"eval_runtime": 51.1635, |
|
"eval_samples_per_second": 0.684, |
|
"eval_steps_per_second": 0.176, |
|
"step": 60 |
|
}, |
|
{ |
|
"epoch": 20.01, |
|
"eval_accuracy": 0.34285714285714286, |
|
"eval_loss": 1.618465542793274, |
|
"eval_runtime": 54.8541, |
|
"eval_samples_per_second": 0.638, |
|
"eval_steps_per_second": 0.164, |
|
"step": 63 |
|
}, |
|
{ |
|
"epoch": 21.01, |
|
"eval_accuracy": 0.34285714285714286, |
|
"eval_loss": 1.4067193269729614, |
|
"eval_runtime": 56.983, |
|
"eval_samples_per_second": 0.614, |
|
"eval_steps_per_second": 0.158, |
|
"step": 66 |
|
}, |
|
{ |
|
"epoch": 22.01, |
|
"eval_accuracy": 0.5142857142857142, |
|
"eval_loss": 1.342714548110962, |
|
"eval_runtime": 49.6455, |
|
"eval_samples_per_second": 0.705, |
|
"eval_steps_per_second": 0.181, |
|
"step": 69 |
|
}, |
|
{ |
|
"epoch": 23.0, |
|
"learning_rate": 4.3771043771043774e-05, |
|
"loss": 1.2231, |
|
"step": 70 |
|
}, |
|
{ |
|
"epoch": 23.01, |
|
"eval_accuracy": 0.37142857142857144, |
|
"eval_loss": 1.199639081954956, |
|
"eval_runtime": 46.5204, |
|
"eval_samples_per_second": 0.752, |
|
"eval_steps_per_second": 0.193, |
|
"step": 72 |
|
}, |
|
{ |
|
"epoch": 24.01, |
|
"eval_accuracy": 0.5428571428571428, |
|
"eval_loss": 1.067163348197937, |
|
"eval_runtime": 47.5503, |
|
"eval_samples_per_second": 0.736, |
|
"eval_steps_per_second": 0.189, |
|
"step": 75 |
|
}, |
|
{ |
|
"epoch": 25.01, |
|
"eval_accuracy": 0.5142857142857142, |
|
"eval_loss": 1.1605939865112305, |
|
"eval_runtime": 46.8125, |
|
"eval_samples_per_second": 0.748, |
|
"eval_steps_per_second": 0.192, |
|
"step": 78 |
|
}, |
|
{ |
|
"epoch": 26.01, |
|
"learning_rate": 4.208754208754209e-05, |
|
"loss": 1.086, |
|
"step": 80 |
|
}, |
|
{ |
|
"epoch": 26.01, |
|
"eval_accuracy": 0.5142857142857142, |
|
"eval_loss": 1.0507373809814453, |
|
"eval_runtime": 47.2904, |
|
"eval_samples_per_second": 0.74, |
|
"eval_steps_per_second": 0.19, |
|
"step": 81 |
|
}, |
|
{ |
|
"epoch": 27.01, |
|
"eval_accuracy": 0.6571428571428571, |
|
"eval_loss": 0.8726997971534729, |
|
"eval_runtime": 47.448, |
|
"eval_samples_per_second": 0.738, |
|
"eval_steps_per_second": 0.19, |
|
"step": 84 |
|
}, |
|
{ |
|
"epoch": 28.01, |
|
"eval_accuracy": 0.5714285714285714, |
|
"eval_loss": 1.1010727882385254, |
|
"eval_runtime": 46.68, |
|
"eval_samples_per_second": 0.75, |
|
"eval_steps_per_second": 0.193, |
|
"step": 87 |
|
}, |
|
{ |
|
"epoch": 29.01, |
|
"learning_rate": 4.0404040404040405e-05, |
|
"loss": 1.1221, |
|
"step": 90 |
|
}, |
|
{ |
|
"epoch": 29.01, |
|
"eval_accuracy": 0.6285714285714286, |
|
"eval_loss": 1.070949673652649, |
|
"eval_runtime": 47.7392, |
|
"eval_samples_per_second": 0.733, |
|
"eval_steps_per_second": 0.189, |
|
"step": 90 |
|
}, |
|
{ |
|
"epoch": 30.01, |
|
"eval_accuracy": 0.34285714285714286, |
|
"eval_loss": 1.2051596641540527, |
|
"eval_runtime": 52.6759, |
|
"eval_samples_per_second": 0.664, |
|
"eval_steps_per_second": 0.171, |
|
"step": 93 |
|
}, |
|
{ |
|
"epoch": 31.01, |
|
"eval_accuracy": 0.3142857142857143, |
|
"eval_loss": 1.1637940406799316, |
|
"eval_runtime": 47.6299, |
|
"eval_samples_per_second": 0.735, |
|
"eval_steps_per_second": 0.189, |
|
"step": 96 |
|
}, |
|
{ |
|
"epoch": 32.01, |
|
"eval_accuracy": 0.5714285714285714, |
|
"eval_loss": 1.0540904998779297, |
|
"eval_runtime": 47.2579, |
|
"eval_samples_per_second": 0.741, |
|
"eval_steps_per_second": 0.19, |
|
"step": 99 |
|
}, |
|
{ |
|
"epoch": 33.0, |
|
"learning_rate": 3.872053872053872e-05, |
|
"loss": 1.0483, |
|
"step": 100 |
|
}, |
|
{ |
|
"epoch": 33.01, |
|
"eval_accuracy": 0.5428571428571428, |
|
"eval_loss": 0.9793229103088379, |
|
"eval_runtime": 48.2595, |
|
"eval_samples_per_second": 0.725, |
|
"eval_steps_per_second": 0.186, |
|
"step": 102 |
|
}, |
|
{ |
|
"epoch": 34.01, |
|
"eval_accuracy": 0.7142857142857143, |
|
"eval_loss": 0.9788510203361511, |
|
"eval_runtime": 46.729, |
|
"eval_samples_per_second": 0.749, |
|
"eval_steps_per_second": 0.193, |
|
"step": 105 |
|
}, |
|
{ |
|
"epoch": 35.01, |
|
"eval_accuracy": 0.6285714285714286, |
|
"eval_loss": 1.0231552124023438, |
|
"eval_runtime": 47.7551, |
|
"eval_samples_per_second": 0.733, |
|
"eval_steps_per_second": 0.188, |
|
"step": 108 |
|
}, |
|
{ |
|
"epoch": 36.01, |
|
"learning_rate": 3.7037037037037037e-05, |
|
"loss": 0.8313, |
|
"step": 110 |
|
}, |
|
{ |
|
"epoch": 36.01, |
|
"eval_accuracy": 0.6857142857142857, |
|
"eval_loss": 1.0134854316711426, |
|
"eval_runtime": 50.8022, |
|
"eval_samples_per_second": 0.689, |
|
"eval_steps_per_second": 0.177, |
|
"step": 111 |
|
}, |
|
{ |
|
"epoch": 37.01, |
|
"eval_accuracy": 0.7142857142857143, |
|
"eval_loss": 0.9512158036231995, |
|
"eval_runtime": 47.6931, |
|
"eval_samples_per_second": 0.734, |
|
"eval_steps_per_second": 0.189, |
|
"step": 114 |
|
}, |
|
{ |
|
"epoch": 38.01, |
|
"eval_accuracy": 0.7428571428571429, |
|
"eval_loss": 0.6964335441589355, |
|
"eval_runtime": 48.6009, |
|
"eval_samples_per_second": 0.72, |
|
"eval_steps_per_second": 0.185, |
|
"step": 117 |
|
}, |
|
{ |
|
"epoch": 39.01, |
|
"learning_rate": 3.535353535353535e-05, |
|
"loss": 0.9314, |
|
"step": 120 |
|
}, |
|
{ |
|
"epoch": 39.01, |
|
"eval_accuracy": 0.6, |
|
"eval_loss": 0.7565953135490417, |
|
"eval_runtime": 48.8407, |
|
"eval_samples_per_second": 0.717, |
|
"eval_steps_per_second": 0.184, |
|
"step": 120 |
|
}, |
|
{ |
|
"epoch": 40.01, |
|
"eval_accuracy": 0.8, |
|
"eval_loss": 0.6933528184890747, |
|
"eval_runtime": 46.6051, |
|
"eval_samples_per_second": 0.751, |
|
"eval_steps_per_second": 0.193, |
|
"step": 123 |
|
}, |
|
{ |
|
"epoch": 41.01, |
|
"eval_accuracy": 0.7714285714285715, |
|
"eval_loss": 0.7758246064186096, |
|
"eval_runtime": 46.5497, |
|
"eval_samples_per_second": 0.752, |
|
"eval_steps_per_second": 0.193, |
|
"step": 126 |
|
}, |
|
{ |
|
"epoch": 42.01, |
|
"eval_accuracy": 0.5714285714285714, |
|
"eval_loss": 0.8644936084747314, |
|
"eval_runtime": 47.6569, |
|
"eval_samples_per_second": 0.734, |
|
"eval_steps_per_second": 0.189, |
|
"step": 129 |
|
}, |
|
{ |
|
"epoch": 43.0, |
|
"learning_rate": 3.3670033670033675e-05, |
|
"loss": 0.9863, |
|
"step": 130 |
|
}, |
|
{ |
|
"epoch": 43.01, |
|
"eval_accuracy": 0.7714285714285715, |
|
"eval_loss": 0.8204832673072815, |
|
"eval_runtime": 53.1222, |
|
"eval_samples_per_second": 0.659, |
|
"eval_steps_per_second": 0.169, |
|
"step": 132 |
|
}, |
|
{ |
|
"epoch": 44.01, |
|
"eval_accuracy": 0.7714285714285715, |
|
"eval_loss": 0.7429643273353577, |
|
"eval_runtime": 47.3081, |
|
"eval_samples_per_second": 0.74, |
|
"eval_steps_per_second": 0.19, |
|
"step": 135 |
|
}, |
|
{ |
|
"epoch": 45.01, |
|
"eval_accuracy": 0.6857142857142857, |
|
"eval_loss": 0.7228943705558777, |
|
"eval_runtime": 45.8699, |
|
"eval_samples_per_second": 0.763, |
|
"eval_steps_per_second": 0.196, |
|
"step": 138 |
|
}, |
|
{ |
|
"epoch": 46.01, |
|
"learning_rate": 3.198653198653199e-05, |
|
"loss": 0.6828, |
|
"step": 140 |
|
}, |
|
{ |
|
"epoch": 46.01, |
|
"eval_accuracy": 0.6571428571428571, |
|
"eval_loss": 0.684984028339386, |
|
"eval_runtime": 52.7837, |
|
"eval_samples_per_second": 0.663, |
|
"eval_steps_per_second": 0.171, |
|
"step": 141 |
|
}, |
|
{ |
|
"epoch": 47.01, |
|
"eval_accuracy": 0.7714285714285715, |
|
"eval_loss": 0.6505874395370483, |
|
"eval_runtime": 47.1631, |
|
"eval_samples_per_second": 0.742, |
|
"eval_steps_per_second": 0.191, |
|
"step": 144 |
|
}, |
|
{ |
|
"epoch": 48.01, |
|
"eval_accuracy": 0.7894736842105263, |
|
"eval_loss": 0.6245588660240173, |
|
"eval_runtime": 50.9021, |
|
"eval_samples_per_second": 0.747, |
|
"eval_steps_per_second": 0.196, |
|
"step": 146 |
|
}, |
|
{ |
|
"epoch": 48.01, |
|
"eval_accuracy": 0.75, |
|
"eval_loss": 0.7047864198684692, |
|
"eval_runtime": 43.3232, |
|
"eval_samples_per_second": 0.739, |
|
"eval_steps_per_second": 0.185, |
|
"step": 146 |
|
} |
|
], |
|
"max_steps": 330, |
|
"num_train_epochs": 9223372036854775807, |
|
"total_flos": 6.579455730080809e+17, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|