|
{ |
|
"best_metric": 0.7875, |
|
"best_model_checkpoint": "videomae-base-finetuned-gesturePhasev2/checkpoint-95", |
|
"epoch": 4.125, |
|
"eval_steps": 500, |
|
"global_step": 237, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 0.026595744680851064, |
|
"grad_norm": 9.288494110107422, |
|
"learning_rate": 6.578947368421053e-07, |
|
"loss": 1.4443, |
|
"step": 10 |
|
}, |
|
{ |
|
"epoch": 0.05319148936170213, |
|
"grad_norm": 10.334871292114258, |
|
"learning_rate": 1.3157894736842106e-06, |
|
"loss": 1.418, |
|
"step": 20 |
|
}, |
|
{ |
|
"epoch": 0.0797872340425532, |
|
"grad_norm": 7.731433391571045, |
|
"learning_rate": 1.973684210526316e-06, |
|
"loss": 1.3362, |
|
"step": 30 |
|
}, |
|
{ |
|
"epoch": 0.10638297872340426, |
|
"grad_norm": 10.242834091186523, |
|
"learning_rate": 2.631578947368421e-06, |
|
"loss": 1.1665, |
|
"step": 40 |
|
}, |
|
{ |
|
"epoch": 0.125, |
|
"eval_accuracy": 0.775, |
|
"eval_loss": 1.0642327070236206, |
|
"eval_runtime": 15.1556, |
|
"eval_samples_per_second": 10.557, |
|
"eval_steps_per_second": 1.32, |
|
"step": 47 |
|
}, |
|
{ |
|
"epoch": 1.0066489361702127, |
|
"grad_norm": 5.333619594573975, |
|
"learning_rate": 3.289473684210527e-06, |
|
"loss": 1.0034, |
|
"step": 50 |
|
}, |
|
{ |
|
"epoch": 1.0332446808510638, |
|
"grad_norm": 4.666859149932861, |
|
"learning_rate": 3.947368421052632e-06, |
|
"loss": 0.8562, |
|
"step": 60 |
|
}, |
|
{ |
|
"epoch": 1.059840425531915, |
|
"grad_norm": 4.381842136383057, |
|
"learning_rate": 4.605263157894737e-06, |
|
"loss": 0.7196, |
|
"step": 70 |
|
}, |
|
{ |
|
"epoch": 1.086436170212766, |
|
"grad_norm": 4.5117340087890625, |
|
"learning_rate": 4.997807075247147e-06, |
|
"loss": 0.7522, |
|
"step": 80 |
|
}, |
|
{ |
|
"epoch": 1.113031914893617, |
|
"grad_norm": 3.7782816886901855, |
|
"learning_rate": 4.973180832407471e-06, |
|
"loss": 0.7316, |
|
"step": 90 |
|
}, |
|
{ |
|
"epoch": 1.1263297872340425, |
|
"eval_accuracy": 0.7875, |
|
"eval_loss": 0.7825992703437805, |
|
"eval_runtime": 11.6767, |
|
"eval_samples_per_second": 13.703, |
|
"eval_steps_per_second": 1.713, |
|
"step": 95 |
|
}, |
|
{ |
|
"epoch": 2.0132978723404253, |
|
"grad_norm": 3.1058461666107178, |
|
"learning_rate": 4.921457902821578e-06, |
|
"loss": 0.785, |
|
"step": 100 |
|
}, |
|
{ |
|
"epoch": 2.0398936170212765, |
|
"grad_norm": 3.0555734634399414, |
|
"learning_rate": 4.84320497372973e-06, |
|
"loss": 0.7795, |
|
"step": 110 |
|
}, |
|
{ |
|
"epoch": 2.0664893617021276, |
|
"grad_norm": 3.8933866024017334, |
|
"learning_rate": 4.7392794005985324e-06, |
|
"loss": 0.774, |
|
"step": 120 |
|
}, |
|
{ |
|
"epoch": 2.0930851063829787, |
|
"grad_norm": 4.3550591468811035, |
|
"learning_rate": 4.610819813755038e-06, |
|
"loss": 0.7218, |
|
"step": 130 |
|
}, |
|
{ |
|
"epoch": 2.11968085106383, |
|
"grad_norm": 4.537750720977783, |
|
"learning_rate": 4.4592336433146e-06, |
|
"loss": 0.7259, |
|
"step": 140 |
|
}, |
|
{ |
|
"epoch": 2.125, |
|
"eval_accuracy": 0.7875, |
|
"eval_loss": 0.8042387962341309, |
|
"eval_runtime": 10.5863, |
|
"eval_samples_per_second": 15.114, |
|
"eval_steps_per_second": 1.889, |
|
"step": 142 |
|
}, |
|
{ |
|
"epoch": 3.0199468085106385, |
|
"grad_norm": 3.3319995403289795, |
|
"learning_rate": 4.286181699082008e-06, |
|
"loss": 0.6222, |
|
"step": 150 |
|
}, |
|
{ |
|
"epoch": 3.046542553191489, |
|
"grad_norm": 4.209911823272705, |
|
"learning_rate": 4.093559974371725e-06, |
|
"loss": 0.7533, |
|
"step": 160 |
|
}, |
|
{ |
|
"epoch": 3.0731382978723403, |
|
"grad_norm": 2.9892210960388184, |
|
"learning_rate": 3.88347887310836e-06, |
|
"loss": 0.8408, |
|
"step": 170 |
|
}, |
|
{ |
|
"epoch": 3.0997340425531914, |
|
"grad_norm": 4.7717814445495605, |
|
"learning_rate": 3.658240087799655e-06, |
|
"loss": 0.7287, |
|
"step": 180 |
|
}, |
|
{ |
|
"epoch": 3.1263297872340425, |
|
"grad_norm": 5.496540546417236, |
|
"learning_rate": 3.4203113817116955e-06, |
|
"loss": 0.6643, |
|
"step": 190 |
|
}, |
|
{ |
|
"epoch": 3.1263297872340425, |
|
"eval_accuracy": 0.7875, |
|
"eval_loss": 0.8022773861885071, |
|
"eval_runtime": 10.4825, |
|
"eval_samples_per_second": 15.264, |
|
"eval_steps_per_second": 1.908, |
|
"step": 190 |
|
}, |
|
{ |
|
"epoch": 4.026595744680851, |
|
"grad_norm": 3.0813848972320557, |
|
"learning_rate": 3.1722995515381644e-06, |
|
"loss": 0.6386, |
|
"step": 200 |
|
}, |
|
{ |
|
"epoch": 4.053191489361702, |
|
"grad_norm": 3.0726428031921387, |
|
"learning_rate": 2.9169218667902562e-06, |
|
"loss": 0.6708, |
|
"step": 210 |
|
}, |
|
{ |
|
"epoch": 4.079787234042553, |
|
"grad_norm": 5.47495174407959, |
|
"learning_rate": 2.6569762988232838e-06, |
|
"loss": 0.8216, |
|
"step": 220 |
|
}, |
|
{ |
|
"epoch": 4.1063829787234045, |
|
"grad_norm": 3.801624059677124, |
|
"learning_rate": 2.3953108656770018e-06, |
|
"loss": 0.761, |
|
"step": 230 |
|
}, |
|
{ |
|
"epoch": 4.125, |
|
"eval_accuracy": 0.7875, |
|
"eval_loss": 0.8077355623245239, |
|
"eval_runtime": 16.5222, |
|
"eval_samples_per_second": 9.684, |
|
"eval_steps_per_second": 1.21, |
|
"step": 237 |
|
}, |
|
{ |
|
"epoch": 4.125, |
|
"step": 237, |
|
"total_flos": 4.691516857081528e+18, |
|
"train_loss": 0.8600665486814604, |
|
"train_runtime": 867.0351, |
|
"train_samples_per_second": 6.939, |
|
"train_steps_per_second": 0.434 |
|
}, |
|
{ |
|
"epoch": 4.125, |
|
"eval_accuracy": 0.7633136094674556, |
|
"eval_loss": 0.8172227144241333, |
|
"eval_runtime": 60.5871, |
|
"eval_samples_per_second": 2.789, |
|
"eval_steps_per_second": 0.363, |
|
"step": 237 |
|
}, |
|
{ |
|
"epoch": 4.125, |
|
"eval_accuracy": 0.7633136094674556, |
|
"eval_loss": 0.8172227144241333, |
|
"eval_runtime": 11.0103, |
|
"eval_samples_per_second": 15.349, |
|
"eval_steps_per_second": 1.998, |
|
"step": 237 |
|
} |
|
], |
|
"logging_steps": 10, |
|
"max_steps": 376, |
|
"num_input_tokens_seen": 0, |
|
"num_train_epochs": 9223372036854775807, |
|
"save_steps": 500, |
|
"stateful_callbacks": { |
|
"EarlyStoppingCallback": { |
|
"args": { |
|
"early_stopping_patience": 3, |
|
"early_stopping_threshold": 0.0 |
|
}, |
|
"attributes": { |
|
"early_stopping_patience_counter": 0 |
|
} |
|
}, |
|
"TrainerControl": { |
|
"args": { |
|
"should_epoch_stop": false, |
|
"should_evaluate": false, |
|
"should_log": false, |
|
"should_save": true, |
|
"should_training_stop": true |
|
}, |
|
"attributes": {} |
|
} |
|
}, |
|
"total_flos": 4.691516857081528e+18, |
|
"train_batch_size": 8, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|