videomae-base-ipm_first_videos / trainer_state.json
rickysk's picture
Training in progress, epoch 0
f6a6d29
raw
history blame
14.2 kB
{
"best_metric": 0.8,
"best_model_checkpoint": "videomae-base-ipm_first_videos/checkpoint-123",
"epoch": 48.00606060606061,
"global_step": 146,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.01,
"eval_accuracy": 0.22857142857142856,
"eval_loss": 1.7709606885910034,
"eval_runtime": 56.0244,
"eval_samples_per_second": 0.625,
"eval_steps_per_second": 0.161,
"step": 3
},
{
"epoch": 1.01,
"eval_accuracy": 0.14285714285714285,
"eval_loss": 1.7788584232330322,
"eval_runtime": 54.8936,
"eval_samples_per_second": 0.638,
"eval_steps_per_second": 0.164,
"step": 6
},
{
"epoch": 2.01,
"eval_accuracy": 0.08571428571428572,
"eval_loss": 1.7939355373382568,
"eval_runtime": 57.093,
"eval_samples_per_second": 0.613,
"eval_steps_per_second": 0.158,
"step": 9
},
{
"epoch": 3.0,
"learning_rate": 1.5151515151515153e-05,
"loss": 1.7369,
"step": 10
},
{
"epoch": 3.01,
"eval_accuracy": 0.11428571428571428,
"eval_loss": 1.8259599208831787,
"eval_runtime": 49.6198,
"eval_samples_per_second": 0.705,
"eval_steps_per_second": 0.181,
"step": 12
},
{
"epoch": 4.01,
"eval_accuracy": 0.11428571428571428,
"eval_loss": 1.8636661767959595,
"eval_runtime": 47.6299,
"eval_samples_per_second": 0.735,
"eval_steps_per_second": 0.189,
"step": 15
},
{
"epoch": 5.01,
"eval_accuracy": 0.11428571428571428,
"eval_loss": 1.916202187538147,
"eval_runtime": 54.478,
"eval_samples_per_second": 0.642,
"eval_steps_per_second": 0.165,
"step": 18
},
{
"epoch": 6.01,
"learning_rate": 3.0303030303030306e-05,
"loss": 1.6934,
"step": 20
},
{
"epoch": 6.01,
"eval_accuracy": 0.11428571428571428,
"eval_loss": 1.979854702949524,
"eval_runtime": 47.3817,
"eval_samples_per_second": 0.739,
"eval_steps_per_second": 0.19,
"step": 21
},
{
"epoch": 7.01,
"eval_accuracy": 0.11428571428571428,
"eval_loss": 2.032222270965576,
"eval_runtime": 47.048,
"eval_samples_per_second": 0.744,
"eval_steps_per_second": 0.191,
"step": 24
},
{
"epoch": 8.01,
"eval_accuracy": 0.11428571428571428,
"eval_loss": 2.147186756134033,
"eval_runtime": 56.4896,
"eval_samples_per_second": 0.62,
"eval_steps_per_second": 0.159,
"step": 27
},
{
"epoch": 9.01,
"learning_rate": 4.545454545454546e-05,
"loss": 1.636,
"step": 30
},
{
"epoch": 9.01,
"eval_accuracy": 0.11428571428571428,
"eval_loss": 2.201059103012085,
"eval_runtime": 47.193,
"eval_samples_per_second": 0.742,
"eval_steps_per_second": 0.191,
"step": 30
},
{
"epoch": 10.01,
"eval_accuracy": 0.11428571428571428,
"eval_loss": 2.3041186332702637,
"eval_runtime": 49.6007,
"eval_samples_per_second": 0.706,
"eval_steps_per_second": 0.181,
"step": 33
},
{
"epoch": 11.01,
"eval_accuracy": 0.11428571428571428,
"eval_loss": 2.202650785446167,
"eval_runtime": 51.3674,
"eval_samples_per_second": 0.681,
"eval_steps_per_second": 0.175,
"step": 36
},
{
"epoch": 12.01,
"eval_accuracy": 0.11428571428571428,
"eval_loss": 2.1011433601379395,
"eval_runtime": 47.3736,
"eval_samples_per_second": 0.739,
"eval_steps_per_second": 0.19,
"step": 39
},
{
"epoch": 13.0,
"learning_rate": 4.882154882154882e-05,
"loss": 1.6069,
"step": 40
},
{
"epoch": 13.01,
"eval_accuracy": 0.11428571428571428,
"eval_loss": 2.0470354557037354,
"eval_runtime": 52.7055,
"eval_samples_per_second": 0.664,
"eval_steps_per_second": 0.171,
"step": 42
},
{
"epoch": 14.01,
"eval_accuracy": 0.11428571428571428,
"eval_loss": 1.9688891172409058,
"eval_runtime": 46.2559,
"eval_samples_per_second": 0.757,
"eval_steps_per_second": 0.195,
"step": 45
},
{
"epoch": 15.01,
"eval_accuracy": 0.11428571428571428,
"eval_loss": 1.911560297012329,
"eval_runtime": 55.4227,
"eval_samples_per_second": 0.632,
"eval_steps_per_second": 0.162,
"step": 48
},
{
"epoch": 16.01,
"learning_rate": 4.713804713804714e-05,
"loss": 1.6509,
"step": 50
},
{
"epoch": 16.01,
"eval_accuracy": 0.11428571428571428,
"eval_loss": 1.9125531911849976,
"eval_runtime": 55.4531,
"eval_samples_per_second": 0.631,
"eval_steps_per_second": 0.162,
"step": 51
},
{
"epoch": 17.01,
"eval_accuracy": 0.11428571428571428,
"eval_loss": 2.038973808288574,
"eval_runtime": 47.6175,
"eval_samples_per_second": 0.735,
"eval_steps_per_second": 0.189,
"step": 54
},
{
"epoch": 18.01,
"eval_accuracy": 0.11428571428571428,
"eval_loss": 1.904532551765442,
"eval_runtime": 47.9854,
"eval_samples_per_second": 0.729,
"eval_steps_per_second": 0.188,
"step": 57
},
{
"epoch": 19.01,
"learning_rate": 4.545454545454546e-05,
"loss": 1.5023,
"step": 60
},
{
"epoch": 19.01,
"eval_accuracy": 0.11428571428571428,
"eval_loss": 1.796205759048462,
"eval_runtime": 51.1635,
"eval_samples_per_second": 0.684,
"eval_steps_per_second": 0.176,
"step": 60
},
{
"epoch": 20.01,
"eval_accuracy": 0.34285714285714286,
"eval_loss": 1.618465542793274,
"eval_runtime": 54.8541,
"eval_samples_per_second": 0.638,
"eval_steps_per_second": 0.164,
"step": 63
},
{
"epoch": 21.01,
"eval_accuracy": 0.34285714285714286,
"eval_loss": 1.4067193269729614,
"eval_runtime": 56.983,
"eval_samples_per_second": 0.614,
"eval_steps_per_second": 0.158,
"step": 66
},
{
"epoch": 22.01,
"eval_accuracy": 0.5142857142857142,
"eval_loss": 1.342714548110962,
"eval_runtime": 49.6455,
"eval_samples_per_second": 0.705,
"eval_steps_per_second": 0.181,
"step": 69
},
{
"epoch": 23.0,
"learning_rate": 4.3771043771043774e-05,
"loss": 1.2231,
"step": 70
},
{
"epoch": 23.01,
"eval_accuracy": 0.37142857142857144,
"eval_loss": 1.199639081954956,
"eval_runtime": 46.5204,
"eval_samples_per_second": 0.752,
"eval_steps_per_second": 0.193,
"step": 72
},
{
"epoch": 24.01,
"eval_accuracy": 0.5428571428571428,
"eval_loss": 1.067163348197937,
"eval_runtime": 47.5503,
"eval_samples_per_second": 0.736,
"eval_steps_per_second": 0.189,
"step": 75
},
{
"epoch": 25.01,
"eval_accuracy": 0.5142857142857142,
"eval_loss": 1.1605939865112305,
"eval_runtime": 46.8125,
"eval_samples_per_second": 0.748,
"eval_steps_per_second": 0.192,
"step": 78
},
{
"epoch": 26.01,
"learning_rate": 4.208754208754209e-05,
"loss": 1.086,
"step": 80
},
{
"epoch": 26.01,
"eval_accuracy": 0.5142857142857142,
"eval_loss": 1.0507373809814453,
"eval_runtime": 47.2904,
"eval_samples_per_second": 0.74,
"eval_steps_per_second": 0.19,
"step": 81
},
{
"epoch": 27.01,
"eval_accuracy": 0.6571428571428571,
"eval_loss": 0.8726997971534729,
"eval_runtime": 47.448,
"eval_samples_per_second": 0.738,
"eval_steps_per_second": 0.19,
"step": 84
},
{
"epoch": 28.01,
"eval_accuracy": 0.5714285714285714,
"eval_loss": 1.1010727882385254,
"eval_runtime": 46.68,
"eval_samples_per_second": 0.75,
"eval_steps_per_second": 0.193,
"step": 87
},
{
"epoch": 29.01,
"learning_rate": 4.0404040404040405e-05,
"loss": 1.1221,
"step": 90
},
{
"epoch": 29.01,
"eval_accuracy": 0.6285714285714286,
"eval_loss": 1.070949673652649,
"eval_runtime": 47.7392,
"eval_samples_per_second": 0.733,
"eval_steps_per_second": 0.189,
"step": 90
},
{
"epoch": 30.01,
"eval_accuracy": 0.34285714285714286,
"eval_loss": 1.2051596641540527,
"eval_runtime": 52.6759,
"eval_samples_per_second": 0.664,
"eval_steps_per_second": 0.171,
"step": 93
},
{
"epoch": 31.01,
"eval_accuracy": 0.3142857142857143,
"eval_loss": 1.1637940406799316,
"eval_runtime": 47.6299,
"eval_samples_per_second": 0.735,
"eval_steps_per_second": 0.189,
"step": 96
},
{
"epoch": 32.01,
"eval_accuracy": 0.5714285714285714,
"eval_loss": 1.0540904998779297,
"eval_runtime": 47.2579,
"eval_samples_per_second": 0.741,
"eval_steps_per_second": 0.19,
"step": 99
},
{
"epoch": 33.0,
"learning_rate": 3.872053872053872e-05,
"loss": 1.0483,
"step": 100
},
{
"epoch": 33.01,
"eval_accuracy": 0.5428571428571428,
"eval_loss": 0.9793229103088379,
"eval_runtime": 48.2595,
"eval_samples_per_second": 0.725,
"eval_steps_per_second": 0.186,
"step": 102
},
{
"epoch": 34.01,
"eval_accuracy": 0.7142857142857143,
"eval_loss": 0.9788510203361511,
"eval_runtime": 46.729,
"eval_samples_per_second": 0.749,
"eval_steps_per_second": 0.193,
"step": 105
},
{
"epoch": 35.01,
"eval_accuracy": 0.6285714285714286,
"eval_loss": 1.0231552124023438,
"eval_runtime": 47.7551,
"eval_samples_per_second": 0.733,
"eval_steps_per_second": 0.188,
"step": 108
},
{
"epoch": 36.01,
"learning_rate": 3.7037037037037037e-05,
"loss": 0.8313,
"step": 110
},
{
"epoch": 36.01,
"eval_accuracy": 0.6857142857142857,
"eval_loss": 1.0134854316711426,
"eval_runtime": 50.8022,
"eval_samples_per_second": 0.689,
"eval_steps_per_second": 0.177,
"step": 111
},
{
"epoch": 37.01,
"eval_accuracy": 0.7142857142857143,
"eval_loss": 0.9512158036231995,
"eval_runtime": 47.6931,
"eval_samples_per_second": 0.734,
"eval_steps_per_second": 0.189,
"step": 114
},
{
"epoch": 38.01,
"eval_accuracy": 0.7428571428571429,
"eval_loss": 0.6964335441589355,
"eval_runtime": 48.6009,
"eval_samples_per_second": 0.72,
"eval_steps_per_second": 0.185,
"step": 117
},
{
"epoch": 39.01,
"learning_rate": 3.535353535353535e-05,
"loss": 0.9314,
"step": 120
},
{
"epoch": 39.01,
"eval_accuracy": 0.6,
"eval_loss": 0.7565953135490417,
"eval_runtime": 48.8407,
"eval_samples_per_second": 0.717,
"eval_steps_per_second": 0.184,
"step": 120
},
{
"epoch": 40.01,
"eval_accuracy": 0.8,
"eval_loss": 0.6933528184890747,
"eval_runtime": 46.6051,
"eval_samples_per_second": 0.751,
"eval_steps_per_second": 0.193,
"step": 123
},
{
"epoch": 41.01,
"eval_accuracy": 0.7714285714285715,
"eval_loss": 0.7758246064186096,
"eval_runtime": 46.5497,
"eval_samples_per_second": 0.752,
"eval_steps_per_second": 0.193,
"step": 126
},
{
"epoch": 42.01,
"eval_accuracy": 0.5714285714285714,
"eval_loss": 0.8644936084747314,
"eval_runtime": 47.6569,
"eval_samples_per_second": 0.734,
"eval_steps_per_second": 0.189,
"step": 129
},
{
"epoch": 43.0,
"learning_rate": 3.3670033670033675e-05,
"loss": 0.9863,
"step": 130
},
{
"epoch": 43.01,
"eval_accuracy": 0.7714285714285715,
"eval_loss": 0.8204832673072815,
"eval_runtime": 53.1222,
"eval_samples_per_second": 0.659,
"eval_steps_per_second": 0.169,
"step": 132
},
{
"epoch": 44.01,
"eval_accuracy": 0.7714285714285715,
"eval_loss": 0.7429643273353577,
"eval_runtime": 47.3081,
"eval_samples_per_second": 0.74,
"eval_steps_per_second": 0.19,
"step": 135
},
{
"epoch": 45.01,
"eval_accuracy": 0.6857142857142857,
"eval_loss": 0.7228943705558777,
"eval_runtime": 45.8699,
"eval_samples_per_second": 0.763,
"eval_steps_per_second": 0.196,
"step": 138
},
{
"epoch": 46.01,
"learning_rate": 3.198653198653199e-05,
"loss": 0.6828,
"step": 140
},
{
"epoch": 46.01,
"eval_accuracy": 0.6571428571428571,
"eval_loss": 0.684984028339386,
"eval_runtime": 52.7837,
"eval_samples_per_second": 0.663,
"eval_steps_per_second": 0.171,
"step": 141
},
{
"epoch": 47.01,
"eval_accuracy": 0.7714285714285715,
"eval_loss": 0.6505874395370483,
"eval_runtime": 47.1631,
"eval_samples_per_second": 0.742,
"eval_steps_per_second": 0.191,
"step": 144
},
{
"epoch": 48.01,
"eval_accuracy": 0.7894736842105263,
"eval_loss": 0.6245588660240173,
"eval_runtime": 50.9021,
"eval_samples_per_second": 0.747,
"eval_steps_per_second": 0.196,
"step": 146
},
{
"epoch": 48.01,
"eval_accuracy": 0.75,
"eval_loss": 0.7047864198684692,
"eval_runtime": 43.3232,
"eval_samples_per_second": 0.739,
"eval_steps_per_second": 0.185,
"step": 146
}
],
"max_steps": 330,
"num_train_epochs": 9223372036854775807,
"total_flos": 6.579455730080809e+17,
"trial_name": null,
"trial_params": null
}