sam1120's picture
Training in progress, step 40
7532c20
raw
history blame
No virus
7.62 kB
{
"best_metric": 0.5335736274719238,
"best_model_checkpoint": "/robodata/smodak/Projects/nspl/scripts/terrainseg/training/models/safety-utcustom-train-SF-RGBD-b5/checkpoint-40",
"epoch": 3.6363636363636362,
"global_step": 40,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.09,
"learning_rate": 7.272727272727273e-08,
"loss": 0.8005,
"step": 1
},
{
"epoch": 0.18,
"learning_rate": 1.4545454545454545e-07,
"loss": 0.7952,
"step": 2
},
{
"epoch": 0.27,
"learning_rate": 2.1818181818181815e-07,
"loss": 0.7806,
"step": 3
},
{
"epoch": 0.36,
"learning_rate": 2.909090909090909e-07,
"loss": 0.7985,
"step": 4
},
{
"epoch": 0.45,
"learning_rate": 3.636363636363636e-07,
"loss": 0.7916,
"step": 5
},
{
"epoch": 0.55,
"learning_rate": 4.363636363636363e-07,
"loss": 0.7885,
"step": 6
},
{
"epoch": 0.64,
"learning_rate": 5.090909090909091e-07,
"loss": 0.7869,
"step": 7
},
{
"epoch": 0.73,
"learning_rate": 5.818181818181818e-07,
"loss": 0.7871,
"step": 8
},
{
"epoch": 0.82,
"learning_rate": 6.545454545454546e-07,
"loss": 0.7895,
"step": 9
},
{
"epoch": 0.91,
"learning_rate": 7.272727272727272e-07,
"loss": 0.789,
"step": 10
},
{
"epoch": 0.91,
"eval_accuracy_safe": 0.020290978060994367,
"eval_accuracy_unlabeled": NaN,
"eval_accuracy_unsafe": 0.8956518586322223,
"eval_iou_safe": 0.009542102362547317,
"eval_iou_unlabeled": 0.0,
"eval_iou_unsafe": 0.872225496966486,
"eval_loss": 0.9554787278175354,
"eval_mean_accuracy": 0.4579714183466083,
"eval_mean_iou": 0.29392253310967775,
"eval_overall_accuracy": 0.8697951017920651,
"eval_runtime": 10.4712,
"eval_samples_per_second": 6.399,
"eval_steps_per_second": 0.478,
"step": 10
},
{
"epoch": 1.0,
"learning_rate": 8e-07,
"loss": 0.7808,
"step": 11
},
{
"epoch": 1.09,
"learning_rate": 8.727272727272726e-07,
"loss": 0.7854,
"step": 12
},
{
"epoch": 1.18,
"learning_rate": 9.454545454545454e-07,
"loss": 0.7698,
"step": 13
},
{
"epoch": 1.27,
"learning_rate": 1.0181818181818181e-06,
"loss": 0.7788,
"step": 14
},
{
"epoch": 1.36,
"learning_rate": 1.0909090909090908e-06,
"loss": 0.7783,
"step": 15
},
{
"epoch": 1.45,
"learning_rate": 1.1636363636363636e-06,
"loss": 0.7696,
"step": 16
},
{
"epoch": 1.55,
"learning_rate": 1.2363636363636363e-06,
"loss": 0.7638,
"step": 17
},
{
"epoch": 1.64,
"learning_rate": 1.3090909090909091e-06,
"loss": 0.7611,
"step": 18
},
{
"epoch": 1.73,
"learning_rate": 1.3818181818181818e-06,
"loss": 0.7597,
"step": 19
},
{
"epoch": 1.82,
"learning_rate": 1.4545454545454544e-06,
"loss": 0.7579,
"step": 20
},
{
"epoch": 1.82,
"eval_accuracy_safe": 0.011667264197131082,
"eval_accuracy_unlabeled": NaN,
"eval_accuracy_unsafe": 0.9614483463212281,
"eval_iou_safe": 0.006852036536648151,
"eval_iou_unlabeled": 0.0,
"eval_iou_unsafe": 0.9338335778122896,
"eval_loss": 0.8321800827980042,
"eval_mean_accuracy": 0.4865578052591796,
"eval_mean_iou": 0.3135618714496459,
"eval_overall_accuracy": 0.9333933360541045,
"eval_runtime": 11.8686,
"eval_samples_per_second": 5.645,
"eval_steps_per_second": 0.421,
"step": 20
},
{
"epoch": 1.91,
"learning_rate": 1.5272727272727273e-06,
"loss": 0.7626,
"step": 21
},
{
"epoch": 2.0,
"learning_rate": 1.6e-06,
"loss": 0.7399,
"step": 22
},
{
"epoch": 2.09,
"learning_rate": 1.6727272727272726e-06,
"loss": 0.7658,
"step": 23
},
{
"epoch": 2.18,
"learning_rate": 1.7454545454545452e-06,
"loss": 0.7404,
"step": 24
},
{
"epoch": 2.27,
"learning_rate": 1.818181818181818e-06,
"loss": 0.742,
"step": 25
},
{
"epoch": 2.36,
"learning_rate": 1.8909090909090907e-06,
"loss": 0.721,
"step": 26
},
{
"epoch": 2.45,
"learning_rate": 1.9636363636363636e-06,
"loss": 0.7222,
"step": 27
},
{
"epoch": 2.55,
"learning_rate": 2.0363636363636362e-06,
"loss": 0.7358,
"step": 28
},
{
"epoch": 2.64,
"learning_rate": 2.109090909090909e-06,
"loss": 0.7427,
"step": 29
},
{
"epoch": 2.73,
"learning_rate": 2.1818181818181815e-06,
"loss": 0.7103,
"step": 30
},
{
"epoch": 2.73,
"eval_accuracy_safe": 0.005111776747198353,
"eval_accuracy_unlabeled": NaN,
"eval_accuracy_unsafe": 0.9893036287919527,
"eval_iou_safe": 0.004283838202726343,
"eval_iou_unlabeled": 0.0,
"eval_iou_unsafe": 0.9604181920132638,
"eval_loss": 0.6728952527046204,
"eval_mean_accuracy": 0.4972077027695755,
"eval_mean_iou": 0.32156734340533005,
"eval_overall_accuracy": 0.96023217955632,
"eval_runtime": 12.232,
"eval_samples_per_second": 5.477,
"eval_steps_per_second": 0.409,
"step": 30
},
{
"epoch": 2.82,
"learning_rate": 2.254545454545454e-06,
"loss": 0.7102,
"step": 31
},
{
"epoch": 2.91,
"learning_rate": 2.3272727272727272e-06,
"loss": 0.7035,
"step": 32
},
{
"epoch": 3.0,
"learning_rate": 2.4e-06,
"loss": 0.6845,
"step": 33
},
{
"epoch": 3.09,
"learning_rate": 2.4727272727272725e-06,
"loss": 0.6932,
"step": 34
},
{
"epoch": 3.18,
"learning_rate": 2.545454545454545e-06,
"loss": 0.6848,
"step": 35
},
{
"epoch": 3.27,
"learning_rate": 2.6181818181818183e-06,
"loss": 0.6816,
"step": 36
},
{
"epoch": 3.36,
"learning_rate": 2.690909090909091e-06,
"loss": 0.6617,
"step": 37
},
{
"epoch": 3.45,
"learning_rate": 2.7636363636363635e-06,
"loss": 0.6924,
"step": 38
},
{
"epoch": 3.55,
"learning_rate": 2.836363636363636e-06,
"loss": 0.6775,
"step": 39
},
{
"epoch": 3.64,
"learning_rate": 2.909090909090909e-06,
"loss": 0.676,
"step": 40
},
{
"epoch": 3.64,
"eval_accuracy_safe": 0.0021453271190165035,
"eval_accuracy_unlabeled": NaN,
"eval_accuracy_unsafe": 0.9968958945126286,
"eval_iou_safe": 0.0020376330502982305,
"eval_iou_unlabeled": 0.0,
"eval_iou_unsafe": 0.9675401930395611,
"eval_loss": 0.5335736274719238,
"eval_mean_accuracy": 0.49952061081582255,
"eval_mean_iou": 0.32319260869661975,
"eval_overall_accuracy": 0.9675125577556554,
"eval_runtime": 10.8655,
"eval_samples_per_second": 6.166,
"eval_steps_per_second": 0.46,
"step": 40
}
],
"max_steps": 1100,
"num_train_epochs": 100,
"total_flos": 4.5271179966755635e+17,
"trial_name": null,
"trial_params": null
}