diff --git "a/multi_base.log" "b/multi_base.log" new file mode 100644--- /dev/null +++ "b/multi_base.log" @@ -0,0 +1,7713 @@ +2023/10/26 05:13:26 - mmengine - INFO - Iter(train) [ 500/640000] base_lr: 2.0000e-04 lr: 2.0000e-05 eta: 8 days, 9:26:36 time: 1.1340 data_time: 0.0212 memory: 21517 grad_norm: 5.5991 loss: 3.1054 caption_loss_cls: 5.5010 grounding_loss_reg: 6.5788 detection_loss_cls: 0.2814 detection_loss_reg: 0.6083 semantic_segmentation_loss_cls: 0.1106 instance_segmentation_loss_cls: 0.2234 instance_segmentation_loss_reg: 0.5892 instance_segmentation_loss_poly: 2.0360 +2023/10/26 05:22:31 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231026_050054 +2023/10/26 05:22:31 - mmengine - INFO - Iter(train) [ 1000/640000] base_lr: 2.0000e-04 lr: 2.0000e-05 eta: 8 days, 5:22:44 time: 1.1120 data_time: 0.0200 memory: 21517 grad_norm: 4.3168 loss: 2.8875 caption_loss_cls: 4.8561 grounding_loss_reg: 6.3818 detection_loss_cls: 0.2063 detection_loss_reg: 0.5791 semantic_segmentation_loss_cls: 0.0739 instance_segmentation_loss_cls: 0.1814 instance_segmentation_loss_reg: 0.5638 instance_segmentation_loss_poly: 1.8633 +2023/10/26 05:22:31 - mmengine - INFO - Saving checkpoint at 1000 iterations +2023/10/26 05:31:55 - mmengine - INFO - Iter(train) [ 1500/640000] base_lr: 2.0000e-04 lr: 2.0000e-05 eta: 8 days, 6:12:42 time: 1.1176 data_time: 0.0288 memory: 21517 grad_norm: 3.7978 loss: 2.7619 caption_loss_cls: 4.4849 grounding_loss_reg: 6.2725 detection_loss_cls: 0.1745 detection_loss_reg: 0.5707 semantic_segmentation_loss_cls: 0.0609 instance_segmentation_loss_cls: 0.1671 instance_segmentation_loss_reg: 0.5663 instance_segmentation_loss_poly: 1.8181 +2023/10/26 05:40:50 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231026_050054 +2023/10/26 05:40:50 - mmengine - INFO - Iter(train) [ 2000/640000] base_lr: 2.0000e-04 lr: 2.0000e-05 eta: 8 days, 3:56:27 time: 1.1056 data_time: 0.0273 memory: 21517 grad_norm: 3.5229 loss: 2.6887 caption_loss_cls: 4.2528 grounding_loss_reg: 6.1836 detection_loss_cls: 0.1584 detection_loss_reg: 0.5526 semantic_segmentation_loss_cls: 0.0526 instance_segmentation_loss_cls: 0.1525 instance_segmentation_loss_reg: 0.5543 instance_segmentation_loss_poly: 1.7487 +2023/10/26 05:40:50 - mmengine - INFO - Saving checkpoint at 2000 iterations +2023/10/26 05:50:20 - mmengine - INFO - Iter(train) [ 2500/640000] base_lr: 1.9999e-04 lr: 1.9999e-05 eta: 8 days, 4:58:28 time: 1.1123 data_time: 0.0316 memory: 21517 grad_norm: 3.3178 loss: 2.6274 caption_loss_cls: 4.0955 grounding_loss_reg: 6.1206 detection_loss_cls: 0.1483 detection_loss_reg: 0.5479 semantic_segmentation_loss_cls: 0.0479 instance_segmentation_loss_cls: 0.1423 instance_segmentation_loss_reg: 0.5537 instance_segmentation_loss_poly: 1.7187 +2023/10/26 05:59:41 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231026_050054 +2023/10/26 05:59:41 - mmengine - INFO - Iter(train) [ 3000/640000] base_lr: 1.9999e-04 lr: 1.9999e-05 eta: 8 days, 5:07:54 time: 1.1141 data_time: 0.0296 memory: 21517 grad_norm: 3.1785 loss: 2.5769 caption_loss_cls: 4.0079 grounding_loss_reg: 6.0320 detection_loss_cls: 0.1402 detection_loss_reg: 0.5379 semantic_segmentation_loss_cls: 0.0439 instance_segmentation_loss_cls: 0.1332 instance_segmentation_loss_reg: 0.5380 instance_segmentation_loss_poly: 1.6623 +2023/10/26 05:59:41 - mmengine - INFO - Saving checkpoint at 3000 iterations +2023/10/26 06:09:23 - mmengine - INFO - Iter(train) [ 3500/640000] base_lr: 1.9999e-04 lr: 1.9999e-05 eta: 8 days, 6:11:47 time: 1.1210 data_time: 0.0320 memory: 21517 grad_norm: 3.0528 loss: 2.5137 caption_loss_cls: 3.9124 grounding_loss_reg: 5.9768 detection_loss_cls: 0.1325 detection_loss_reg: 0.5231 semantic_segmentation_loss_cls: 0.0408 instance_segmentation_loss_cls: 0.1244 instance_segmentation_loss_reg: 0.5191 instance_segmentation_loss_poly: 1.6022 +2023/10/26 06:18:47 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231026_050054 +2023/10/26 06:18:47 - mmengine - INFO - Iter(train) [ 4000/640000] base_lr: 1.9998e-04 lr: 1.9998e-05 eta: 8 days, 6:14:05 time: 1.1221 data_time: 0.0306 memory: 21517 grad_norm: 2.9794 loss: 2.4900 caption_loss_cls: 3.8467 grounding_loss_reg: 5.9149 detection_loss_cls: 0.1280 detection_loss_reg: 0.5175 semantic_segmentation_loss_cls: 0.0388 instance_segmentation_loss_cls: 0.1195 instance_segmentation_loss_reg: 0.5127 instance_segmentation_loss_poly: 1.5688 +2023/10/26 06:18:48 - mmengine - INFO - Saving checkpoint at 4000 iterations +2023/10/26 06:28:21 - mmengine - INFO - Iter(train) [ 4500/640000] base_lr: 1.9998e-04 lr: 1.9998e-05 eta: 8 days, 6:33:32 time: 1.1237 data_time: 0.0340 memory: 21517 grad_norm: 2.5882 loss: 2.3972 caption_loss_cls: 3.7954 grounding_loss_reg: 5.8655 detection_loss_cls: 0.1239 detection_loss_reg: 0.5138 semantic_segmentation_loss_cls: 0.0372 instance_segmentation_loss_cls: 0.1160 instance_segmentation_loss_reg: 0.5098 instance_segmentation_loss_poly: 1.5546 +2023/10/26 06:36:27 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231026_050054 +2023/10/26 06:36:27 - mmengine - INFO - Iter(train) [ 5000/640000] base_lr: 1.9997e-04 lr: 1.9997e-05 eta: 8 days, 3:42:29 time: 1.1089 data_time: 0.0336 memory: 21517 grad_norm: 2.5527 loss: 2.3700 caption_loss_cls: 3.7297 grounding_loss_reg: 5.8116 detection_loss_cls: 0.1205 detection_loss_reg: 0.5104 semantic_segmentation_loss_cls: 0.0359 instance_segmentation_loss_cls: 0.1143 instance_segmentation_loss_reg: 0.5067 instance_segmentation_loss_poly: 1.5381 +2023/10/26 06:36:27 - mmengine - INFO - Saving checkpoint at 5000 iterations +2023/10/26 06:46:06 - mmengine - INFO - Iter(train) [ 5500/640000] base_lr: 1.9996e-04 lr: 1.9997e-05 eta: 8 days, 4:21:13 time: 1.1128 data_time: 0.0337 memory: 21517 grad_norm: 2.5007 loss: 2.3274 caption_loss_cls: 3.6909 grounding_loss_reg: 5.7682 detection_loss_cls: 0.1171 detection_loss_reg: 0.5067 semantic_segmentation_loss_cls: 0.0346 instance_segmentation_loss_cls: 0.1117 instance_segmentation_loss_reg: 0.5036 instance_segmentation_loss_poly: 1.5209 +2023/10/26 06:55:38 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231026_050054 +2023/10/26 06:55:38 - mmengine - INFO - Iter(train) [ 6000/640000] base_lr: 1.9996e-04 lr: 1.9996e-05 eta: 8 days, 4:36:42 time: 1.1218 data_time: 0.0332 memory: 21517 grad_norm: 2.4366 loss: 2.2657 caption_loss_cls: 3.6534 grounding_loss_reg: 5.7284 detection_loss_cls: 0.1130 detection_loss_reg: 0.5024 semantic_segmentation_loss_cls: 0.0335 instance_segmentation_loss_cls: 0.1094 instance_segmentation_loss_reg: 0.5012 instance_segmentation_loss_poly: 1.5051 +2023/10/26 06:55:38 - mmengine - INFO - Saving checkpoint at 6000 iterations +2023/10/26 07:05:24 - mmengine - INFO - Iter(train) [ 6500/640000] base_lr: 1.9995e-04 lr: 1.9995e-05 eta: 8 days, 5:12:34 time: 1.1259 data_time: 0.0331 memory: 21517 grad_norm: 2.4336 loss: 2.2452 caption_loss_cls: 3.6207 grounding_loss_reg: 5.6897 detection_loss_cls: 0.1099 detection_loss_reg: 0.4966 semantic_segmentation_loss_cls: 0.0325 instance_segmentation_loss_cls: 0.1068 instance_segmentation_loss_reg: 0.4978 instance_segmentation_loss_poly: 1.4858 +2023/10/26 07:14:48 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231026_050054 +2023/10/26 07:14:48 - mmengine - INFO - Iter(train) [ 7000/640000] base_lr: 1.9994e-04 lr: 1.9995e-05 eta: 8 days, 5:09:47 time: 1.1267 data_time: 0.0350 memory: 21517 grad_norm: 2.4345 loss: 2.2262 caption_loss_cls: 3.6032 grounding_loss_reg: 5.6489 detection_loss_cls: 0.1077 detection_loss_reg: 0.4925 semantic_segmentation_loss_cls: 0.0317 instance_segmentation_loss_cls: 0.1044 instance_segmentation_loss_reg: 0.4926 instance_segmentation_loss_poly: 1.4691 +2023/10/26 07:14:48 - mmengine - INFO - Saving checkpoint at 7000 iterations +2023/10/26 07:23:19 - mmengine - INFO - Iter(train) [ 7500/640000] base_lr: 1.9993e-04 lr: 1.9994e-05 eta: 8 days, 3:50:13 time: 1.1091 data_time: 0.0346 memory: 21517 grad_norm: 2.4975 loss: 2.2388 caption_loss_cls: 3.5716 grounding_loss_reg: 5.5987 detection_loss_cls: 0.1061 detection_loss_reg: 0.4884 semantic_segmentation_loss_cls: 0.0309 instance_segmentation_loss_cls: 0.1026 instance_segmentation_loss_reg: 0.4877 instance_segmentation_loss_poly: 1.4546 +2023/10/26 07:32:02 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231026_050054 +2023/10/26 07:32:02 - mmengine - INFO - Iter(train) [ 8000/640000] base_lr: 1.9992e-04 lr: 1.9993e-05 eta: 8 days, 2:55:14 time: 1.0985 data_time: 0.0343 memory: 21517 grad_norm: 2.5334 loss: 2.2306 caption_loss_cls: 3.5461 grounding_loss_reg: 5.5585 detection_loss_cls: 0.1045 detection_loss_reg: 0.4855 semantic_segmentation_loss_cls: 0.0303 instance_segmentation_loss_cls: 0.1008 instance_segmentation_loss_reg: 0.4850 instance_segmentation_loss_poly: 1.4423 +2023/10/26 07:32:02 - mmengine - INFO - Saving checkpoint at 8000 iterations +2023/10/26 07:40:58 - mmengine - INFO - Iter(train) [ 8500/640000] base_lr: 1.9991e-04 lr: 1.9992e-05 eta: 8 days, 2:22:18 time: 1.0892 data_time: 0.0341 memory: 21517 grad_norm: 2.5620 loss: 2.2099 caption_loss_cls: 3.5159 grounding_loss_reg: 5.5211 detection_loss_cls: 0.1032 detection_loss_reg: 0.4830 semantic_segmentation_loss_cls: 0.0298 instance_segmentation_loss_cls: 0.0991 instance_segmentation_loss_reg: 0.4819 instance_segmentation_loss_poly: 1.4297 +2023/10/26 07:50:04 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231026_050054 +2023/10/26 07:50:04 - mmengine - INFO - Iter(train) [ 9000/640000] base_lr: 1.9990e-04 lr: 1.9991e-05 eta: 8 days, 2:04:14 time: 1.1043 data_time: 0.0346 memory: 21517 grad_norm: 2.5349 loss: 2.1561 caption_loss_cls: 3.4783 grounding_loss_reg: 5.4866 detection_loss_cls: 0.1017 detection_loss_reg: 0.4805 semantic_segmentation_loss_cls: 0.0291 instance_segmentation_loss_cls: 0.0974 instance_segmentation_loss_reg: 0.4778 instance_segmentation_loss_poly: 1.4154 +2023/10/26 07:50:04 - mmengine - INFO - Saving checkpoint at 9000 iterations +2023/10/26 07:59:20 - mmengine - INFO - Iter(train) [ 9500/640000] base_lr: 1.9989e-04 lr: 1.9990e-05 eta: 8 days, 1:57:58 time: 1.0985 data_time: 0.0346 memory: 21517 grad_norm: 2.5608 loss: 2.1369 caption_loss_cls: 3.4503 grounding_loss_reg: 5.4495 detection_loss_cls: 0.1006 detection_loss_reg: 0.4808 semantic_segmentation_loss_cls: 0.0286 instance_segmentation_loss_cls: 0.0965 instance_segmentation_loss_reg: 0.4780 instance_segmentation_loss_poly: 1.4107 +2023/10/26 08:08:21 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231026_050054 +2023/10/26 08:08:21 - mmengine - INFO - Iter(train) [ 10000/640000] base_lr: 1.9988e-04 lr: 1.9989e-05 eta: 8 days, 1:34:18 time: 1.0907 data_time: 0.0347 memory: 21517 grad_norm: 2.6280 loss: 2.1603 caption_loss_cls: 3.4301 grounding_loss_reg: 5.4153 detection_loss_cls: 0.0992 detection_loss_reg: 0.4788 semantic_segmentation_loss_cls: 0.0282 instance_segmentation_loss_cls: 0.0953 instance_segmentation_loss_reg: 0.4765 instance_segmentation_loss_poly: 1.4044 +2023/10/26 08:08:21 - mmengine - INFO - Saving checkpoint at 10000 iterations +2023/10/26 08:17:47 - mmengine - INFO - Iter(train) [ 10500/640000] base_lr: 1.9987e-04 lr: 1.9988e-05 eta: 8 days, 1:38:27 time: 1.0858 data_time: 0.0345 memory: 21517 grad_norm: 2.6563 loss: 2.1425 caption_loss_cls: 3.4123 grounding_loss_reg: 5.3693 detection_loss_cls: 0.0976 detection_loss_reg: 0.4751 semantic_segmentation_loss_cls: 0.0278 instance_segmentation_loss_cls: 0.0940 instance_segmentation_loss_reg: 0.4738 instance_segmentation_loss_poly: 1.3930 +2023/10/26 08:26:27 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231026_050054 +2023/10/26 08:26:27 - mmengine - INFO - Iter(train) [ 11000/640000] base_lr: 1.9986e-04 lr: 1.9987e-05 eta: 8 days, 0:57:10 time: 1.0747 data_time: 0.0324 memory: 21517 grad_norm: 2.6842 loss: 2.1326 caption_loss_cls: 3.3942 grounding_loss_reg: 5.3389 detection_loss_cls: 0.0965 detection_loss_reg: 0.4746 semantic_segmentation_loss_cls: 0.0274 instance_segmentation_loss_cls: 0.0931 instance_segmentation_loss_reg: 0.4719 instance_segmentation_loss_poly: 1.3858 +2023/10/26 08:26:27 - mmengine - INFO - Saving checkpoint at 11000 iterations +2023/10/26 08:35:37 - mmengine - INFO - Iter(train) [ 11500/640000] base_lr: 1.9984e-04 lr: 1.9986e-05 eta: 8 days, 0:45:41 time: 1.0844 data_time: 0.0329 memory: 21517 grad_norm: 2.6786 loss: 2.1197 caption_loss_cls: 3.3737 grounding_loss_reg: 5.3065 detection_loss_cls: 0.0955 detection_loss_reg: 0.4734 semantic_segmentation_loss_cls: 0.0271 instance_segmentation_loss_cls: 0.0923 instance_segmentation_loss_reg: 0.4719 instance_segmentation_loss_poly: 1.3842 +2023/10/26 08:44:52 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231026_050054 +2023/10/26 08:44:52 - mmengine - INFO - Iter(train) [ 12000/640000] base_lr: 1.9983e-04 lr: 1.9984e-05 eta: 8 days, 0:39:29 time: 1.0926 data_time: 0.0331 memory: 21517 grad_norm: 2.6445 loss: 2.0815 caption_loss_cls: 3.3595 grounding_loss_reg: 5.2802 detection_loss_cls: 0.0945 detection_loss_reg: 0.4747 semantic_segmentation_loss_cls: 0.0267 instance_segmentation_loss_cls: 0.0919 instance_segmentation_loss_reg: 0.4732 instance_segmentation_loss_poly: 1.3827 +2023/10/26 08:44:52 - mmengine - INFO - Saving checkpoint at 12000 iterations +2023/10/26 08:54:41 - mmengine - INFO - Iter(train) [ 12500/640000] base_lr: 1.9981e-04 lr: 1.9983e-05 eta: 8 days, 1:00:36 time: 1.1057 data_time: 0.0333 memory: 21517 grad_norm: 2.6224 loss: 2.0501 caption_loss_cls: 3.3482 grounding_loss_reg: 5.2539 detection_loss_cls: 0.0934 detection_loss_reg: 0.4736 semantic_segmentation_loss_cls: 0.0264 instance_segmentation_loss_cls: 0.0911 instance_segmentation_loss_reg: 0.4710 instance_segmentation_loss_poly: 1.3759 +2023/10/26 09:03:55 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231026_050054 +2023/10/26 09:03:55 - mmengine - INFO - Iter(train) [ 13000/640000] base_lr: 1.9980e-04 lr: 1.9982e-05 eta: 8 days, 0:51:35 time: 1.1076 data_time: 0.0334 memory: 21517 grad_norm: 2.6281 loss: 2.0437 caption_loss_cls: 3.3322 grounding_loss_reg: 5.2280 detection_loss_cls: 0.0926 detection_loss_reg: 0.4718 semantic_segmentation_loss_cls: 0.0261 instance_segmentation_loss_cls: 0.0905 instance_segmentation_loss_reg: 0.4700 instance_segmentation_loss_poly: 1.3696 +2023/10/26 09:03:55 - mmengine - INFO - Saving checkpoint at 13000 iterations +2023/10/26 09:13:31 - mmengine - INFO - Iter(train) [ 13500/640000] base_lr: 1.9978e-04 lr: 1.9980e-05 eta: 8 days, 1:00:11 time: 1.1127 data_time: 0.0336 memory: 21517 grad_norm: 2.6274 loss: 2.0367 caption_loss_cls: 3.3200 grounding_loss_reg: 5.2029 detection_loss_cls: 0.0916 detection_loss_reg: 0.4704 semantic_segmentation_loss_cls: 0.0259 instance_segmentation_loss_cls: 0.0898 instance_segmentation_loss_reg: 0.4686 instance_segmentation_loss_poly: 1.3620 +2023/10/26 09:22:41 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231026_050054 +2023/10/26 09:22:41 - mmengine - INFO - Iter(train) [ 14000/640000] base_lr: 1.9977e-04 lr: 1.9979e-05 eta: 8 days, 0:47:32 time: 1.1152 data_time: 0.0336 memory: 21517 grad_norm: 2.6036 loss: 2.0043 caption_loss_cls: 3.3086 grounding_loss_reg: 5.1780 detection_loss_cls: 0.0908 detection_loss_reg: 0.4692 semantic_segmentation_loss_cls: 0.0256 instance_segmentation_loss_cls: 0.0895 instance_segmentation_loss_reg: 0.4696 instance_segmentation_loss_poly: 1.3594 +2023/10/26 09:22:41 - mmengine - INFO - Saving checkpoint at 14000 iterations +2023/10/26 09:32:17 - mmengine - INFO - Iter(train) [ 14500/640000] base_lr: 1.9975e-04 lr: 1.9977e-05 eta: 8 days, 0:53:21 time: 1.1174 data_time: 0.0337 memory: 21517 grad_norm: 2.5713 loss: 1.9798 caption_loss_cls: 3.2996 grounding_loss_reg: 5.1579 detection_loss_cls: 0.0900 detection_loss_reg: 0.4684 semantic_segmentation_loss_cls: 0.0253 instance_segmentation_loss_cls: 0.0890 instance_segmentation_loss_reg: 0.4686 instance_segmentation_loss_poly: 1.3550 +2023/10/26 09:41:15 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231026_050054 +2023/10/26 09:41:15 - mmengine - INFO - Iter(train) [ 15000/640000] base_lr: 1.9973e-04 lr: 1.9976e-05 eta: 8 days, 0:32:26 time: 1.1219 data_time: 0.0340 memory: 21517 grad_norm: 2.5729 loss: 1.9683 caption_loss_cls: 3.2858 grounding_loss_reg: 5.1337 detection_loss_cls: 0.0893 detection_loss_reg: 0.4670 semantic_segmentation_loss_cls: 0.0250 instance_segmentation_loss_cls: 0.0884 instance_segmentation_loss_reg: 0.4679 instance_segmentation_loss_poly: 1.3509 +2023/10/26 09:41:15 - mmengine - INFO - Saving checkpoint at 15000 iterations +2023/10/26 09:50:49 - mmengine - INFO - Iter(train) [ 15500/640000] base_lr: 1.9971e-04 lr: 1.9974e-05 eta: 8 days, 0:36:08 time: 1.1280 data_time: 0.0342 memory: 21517 grad_norm: 2.5852 loss: 1.9580 caption_loss_cls: 3.2742 grounding_loss_reg: 5.1088 detection_loss_cls: 0.0884 detection_loss_reg: 0.4654 semantic_segmentation_loss_cls: 0.0248 instance_segmentation_loss_cls: 0.0877 instance_segmentation_loss_reg: 0.4664 instance_segmentation_loss_poly: 1.3430 +2023/10/26 10:00:10 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231026_050054 +2023/10/26 10:00:10 - mmengine - INFO - Iter(train) [ 16000/640000] base_lr: 1.9969e-04 lr: 1.9972e-05 eta: 8 days, 0:30:41 time: 1.1293 data_time: 0.0341 memory: 21517 grad_norm: 2.6069 loss: 1.9475 caption_loss_cls: 3.2624 grounding_loss_reg: 5.0850 detection_loss_cls: 0.0878 detection_loss_reg: 0.4644 semantic_segmentation_loss_cls: 0.0246 instance_segmentation_loss_cls: 0.0871 instance_segmentation_loss_reg: 0.4645 instance_segmentation_loss_poly: 1.3365 +2023/10/26 10:00:10 - mmengine - INFO - Saving checkpoint at 16000 iterations +2023/10/26 10:09:18 - mmengine - INFO - Iter(train) [ 16500/640000] base_lr: 1.9968e-04 lr: 1.9970e-05 eta: 8 days, 0:16:53 time: 1.1193 data_time: 0.0340 memory: 21517 grad_norm: 2.6388 loss: 1.9509 caption_loss_cls: 3.2474 grounding_loss_reg: 5.0630 detection_loss_cls: 0.0872 detection_loss_reg: 0.4633 semantic_segmentation_loss_cls: 0.0244 instance_segmentation_loss_cls: 0.0867 instance_segmentation_loss_reg: 0.4642 instance_segmentation_loss_poly: 1.3331 +2023/10/26 10:18:11 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231026_050054 +2023/10/26 10:18:11 - mmengine - INFO - Iter(train) [ 17000/640000] base_lr: 1.9966e-04 lr: 1.9969e-05 eta: 7 days, 23:54:26 time: 1.1142 data_time: 0.0336 memory: 21517 grad_norm: 2.6402 loss: 1.9339 caption_loss_cls: 3.2380 grounding_loss_reg: 5.0411 detection_loss_cls: 0.0864 detection_loss_reg: 0.4620 semantic_segmentation_loss_cls: 0.0242 instance_segmentation_loss_cls: 0.0864 instance_segmentation_loss_reg: 0.4639 instance_segmentation_loss_poly: 1.3302 +2023/10/26 10:18:11 - mmengine - INFO - Saving checkpoint at 17000 iterations +2023/10/26 10:27:26 - mmengine - INFO - Iter(train) [ 17500/640000] base_lr: 1.9963e-04 lr: 1.9967e-05 eta: 7 days, 23:45:09 time: 1.1086 data_time: 0.0332 memory: 21517 grad_norm: 2.6385 loss: 1.9094 caption_loss_cls: 3.2261 grounding_loss_reg: 5.0214 detection_loss_cls: 0.0857 detection_loss_reg: 0.4598 semantic_segmentation_loss_cls: 0.0240 instance_segmentation_loss_cls: 0.0858 instance_segmentation_loss_reg: 0.4618 instance_segmentation_loss_poly: 1.3247 +2023/10/26 10:36:29 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231026_050054 +2023/10/26 10:36:29 - mmengine - INFO - Iter(train) [ 18000/640000] base_lr: 1.9961e-04 lr: 1.9965e-05 eta: 7 days, 23:29:17 time: 1.1068 data_time: 0.0331 memory: 21517 grad_norm: 2.6660 loss: 1.9079 caption_loss_cls: 3.2125 grounding_loss_reg: 4.9994 detection_loss_cls: 0.0851 detection_loss_reg: 0.4588 semantic_segmentation_loss_cls: 0.0238 instance_segmentation_loss_cls: 0.0854 instance_segmentation_loss_reg: 0.4614 instance_segmentation_loss_poly: 1.3211 +2023/10/26 10:36:29 - mmengine - INFO - Saving checkpoint at 18000 iterations +2023/10/26 10:46:02 - mmengine - INFO - Iter(train) [ 18500/640000] base_lr: 1.9959e-04 lr: 1.9963e-05 eta: 7 days, 23:30:55 time: 1.1064 data_time: 0.0332 memory: 21517 grad_norm: 2.6899 loss: 1.9115 caption_loss_cls: 3.2048 grounding_loss_reg: 4.9824 detection_loss_cls: 0.0844 detection_loss_reg: 0.4577 semantic_segmentation_loss_cls: 0.0236 instance_segmentation_loss_cls: 0.0850 instance_segmentation_loss_reg: 0.4609 instance_segmentation_loss_poly: 1.3180 +2023/10/26 10:55:21 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231026_050054 +2023/10/26 10:55:21 - mmengine - INFO - Iter(train) [ 19000/640000] base_lr: 1.9957e-04 lr: 1.9961e-05 eta: 7 days, 23:23:42 time: 1.1114 data_time: 0.0333 memory: 21517 grad_norm: 2.6835 loss: 1.8967 caption_loss_cls: 3.1993 grounding_loss_reg: 4.9628 detection_loss_cls: 0.0839 detection_loss_reg: 0.4571 semantic_segmentation_loss_cls: 0.0235 instance_segmentation_loss_cls: 0.0845 instance_segmentation_loss_reg: 0.4599 instance_segmentation_loss_poly: 1.3141 +2023/10/26 10:55:21 - mmengine - INFO - Saving checkpoint at 19000 iterations +2023/10/26 11:04:20 - mmengine - INFO - Iter(train) [ 19500/640000] base_lr: 1.9955e-04 lr: 1.9959e-05 eta: 7 days, 23:06:26 time: 1.1029 data_time: 0.0327 memory: 21517 grad_norm: 2.6725 loss: 1.8740 caption_loss_cls: 3.1904 grounding_loss_reg: 4.9404 detection_loss_cls: 0.0834 detection_loss_reg: 0.4560 semantic_segmentation_loss_cls: 0.0233 instance_segmentation_loss_cls: 0.0840 instance_segmentation_loss_reg: 0.4589 instance_segmentation_loss_poly: 1.3104 +2023/10/26 11:13:37 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231026_050054 +2023/10/26 11:13:37 - mmengine - INFO - Iter(train) [ 20000/640000] base_lr: 1.9952e-04 lr: 1.9957e-05 eta: 7 days, 22:58:06 time: 1.1017 data_time: 0.0326 memory: 21517 grad_norm: 2.6593 loss: 1.8637 caption_loss_cls: 3.1630 grounding_loss_reg: 4.8851 detection_loss_cls: 0.0828 detection_loss_reg: 0.4543 semantic_segmentation_loss_cls: 0.0232 instance_segmentation_loss_cls: 0.0834 instance_segmentation_loss_reg: 0.4570 instance_segmentation_loss_poly: 1.3043 +2023/10/26 11:13:37 - mmengine - INFO - Saving checkpoint at 20000 iterations +2023/10/26 11:22:15 - mmengine - INFO - Evaluating bbox... +2023/10/26 11:23:11 - mmengine - INFO - bbox_mAP_copypaste: 0.203 0.347 0.214 0.119 0.252 0.248 +2023/10/26 11:23:11 - mmengine - INFO - Evaluating segm... +2023/10/26 11:24:23 - mmengine - INFO - segm_mAP_copypaste: 0.111 0.252 0.084 0.044 0.144 0.179 +2023/10/26 11:29:30 - mmengine - INFO - per class results: +2023/10/26 11:29:30 - mmengine - INFO - ++---------------------+-------+-------+ +| Class | IoU | Acc | ++---------------------+-------+-------+ +| wall | 69.2 | 83.86 | +| building | 77.91 | 90.92 | +| sky | 91.85 | 97.35 | +| floor | 74.69 | 89.61 | +| tree | 66.41 | 84.65 | +| ceiling | 78.11 | 93.45 | +| road | 74.83 | 81.87 | +| bed | 79.71 | 91.26 | +| windowpane | 49.6 | 64.66 | +| grass | 63.45 | 79.59 | +| cabinet | 49.23 | 58.34 | +| sidewalk | 52.59 | 76.13 | +| person | 72.9 | 88.81 | +| earth | 33.21 | 45.33 | +| door | 31.06 | 47.2 | +| table | 41.32 | 58.57 | +| mountain | 49.27 | 79.24 | +| plant | 42.14 | 48.38 | +| curtain | 55.42 | 87.97 | +| chair | 44.35 | 62.33 | +| car | 74.48 | 85.98 | +| water | 45.48 | 64.14 | +| painting | 57.73 | 71.5 | +| sofa | 52.33 | 66.39 | +| shelf | 28.34 | 40.76 | +| house | 33.77 | 50.25 | +| sea | 54.87 | 83.46 | +| mirror | 45.44 | 53.22 | +| rug | 46.05 | 48.44 | +| field | 22.62 | 34.76 | +| armchair | 24.62 | 31.91 | +| seat | 39.63 | 66.08 | +| fence | 24.57 | 30.44 | +| desk | 24.75 | 53.46 | +| rock | 26.18 | 33.88 | +| wardrobe | 36.91 | 41.1 | +| lamp | 42.81 | 61.99 | +| bathtub | 48.8 | 73.28 | +| railing | 29.28 | 40.01 | +| cushion | 36.24 | 47.01 | +| base | 2.07 | 2.11 | +| box | 14.17 | 17.3 | +| column | 39.31 | 49.72 | +| signboard | 25.9 | 31.24 | +| chest of drawers | 28.45 | 51.74 | +| counter | 20.96 | 26.25 | +| sand | 20.95 | 24.34 | +| sink | 46.81 | 54.42 | +| skyscraper | 46.47 | 60.06 | +| fireplace | 52.22 | 66.62 | +| refrigerator | 44.58 | 48.11 | +| grandstand | 36.32 | 39.99 | +| path | 11.67 | 13.6 | +| stairs | 32.21 | 48.51 | +| runway | 64.15 | 74.83 | +| case | 30.35 | 54.41 | +| pool table | 85.63 | 93.09 | +| pillow | 39.41 | 56.89 | +| screen door | 35.68 | 59.01 | +| stairway | 18.16 | 20.61 | +| river | 7.05 | 8.36 | +| bridge | 29.28 | 47.31 | +| bookcase | 30.06 | 42.62 | +| blind | 9.4 | 9.92 | +| coffee table | 41.66 | 48.65 | +| toilet | 60.75 | 87.77 | +| flower | 20.58 | 24.46 | +| book | 39.9 | 54.81 | +| hill | 0.0 | 0.0 | +| bench | 29.24 | 35.86 | +| countertop | 33.9 | 50.1 | +| stove | 45.02 | 67.7 | +| palm | 39.3 | 54.89 | +| kitchen island | 8.3 | 8.78 | +| computer | 54.08 | 73.86 | +| swivel chair | 24.39 | 29.73 | +| boat | 39.63 | 44.06 | +| bar | 9.9 | 10.39 | +| arcade machine | 25.29 | 75.37 | +| hovel | 0.31 | 0.31 | +| bus | 71.37 | 79.5 | +| towel | 36.73 | 41.51 | +| light | 36.9 | 50.73 | +| truck | 17.48 | 22.66 | +| tower | 30.71 | 54.55 | +| chandelier | 48.16 | 68.54 | +| awning | 16.08 | 17.58 | +| streetlight | 11.69 | 13.19 | +| booth | 20.04 | 29.91 | +| television receiver | 42.46 | 62.12 | +| airplane | 49.31 | 63.87 | +| dirt track | 0.0 | 0.0 | +| apparel | 18.39 | 27.92 | +| pole | 14.26 | 26.76 | +| land | 0.0 | 0.0 | +| bannister | 0.47 | 0.6 | +| escalator | 21.18 | 23.25 | +| ottoman | 23.79 | 35.37 | +| bottle | 17.03 | 23.66 | +| buffet | 34.21 | 44.51 | +| poster | 15.92 | 50.59 | +| stage | 3.57 | 5.46 | +| van | 19.01 | 23.96 | +| ship | 6.81 | 8.51 | +| fountain | 0.97 | 0.99 | +| conveyer belt | 30.1 | 87.06 | +| canopy | 0.38 | 0.44 | +| washer | 45.74 | 50.61 | +| plaything | 14.57 | 48.31 | +| swimming pool | 27.73 | 76.96 | +| stool | 12.46 | 13.46 | +| barrel | 1.82 | 2.94 | +| basket | 8.45 | 9.98 | +| waterfall | 48.76 | 52.43 | +| tent | 66.84 | 93.27 | +| bag | 2.25 | 2.34 | +| minibike | 54.52 | 66.97 | +| cradle | 67.03 | 85.86 | +| oven | 6.28 | 6.77 | +| ball | 44.68 | 61.99 | +| food | 44.39 | 50.45 | +| step | 3.01 | 3.48 | +| tank | 32.48 | 33.75 | +| trade name | 13.77 | 14.86 | +| microwave | 29.25 | 33.2 | +| pot | 28.09 | 33.76 | +| animal | 51.39 | 60.24 | +| bicycle | 42.43 | 59.45 | +| lake | 3.15 | 4.08 | +| dishwasher | 15.34 | 18.28 | +| screen | 52.88 | 80.8 | +| blanket | 0.0 | 0.0 | +| sculpture | 12.59 | 17.16 | +| hood | 24.0 | 25.22 | +| sconce | 16.46 | 20.25 | +| vase | 16.13 | 18.48 | +| traffic light | 15.33 | 17.97 | +| tray | 0.98 | 1.15 | +| ashcan | 9.46 | 9.63 | +| fan | 37.6 | 48.62 | +| pier | 36.67 | 45.21 | +| crt screen | 0.0 | 0.0 | +| plate | 17.43 | 18.73 | +| monitor | 1.5 | 1.5 | +| bulletin board | 0.0 | 0.0 | +| shower | 0.0 | 0.0 | +| radiator | 19.19 | 21.88 | +| glass | 6.86 | 7.06 | +| clock | 12.09 | 16.56 | +| flag | 15.36 | 16.27 | ++---------------------+-------+-------+ +2023/10/26 11:29:47 - mmengine - INFO - Iter(val) [209/209] coco/bbox_mAP: 0.2030 coco/bbox_mAP_50: 0.3470 coco/bbox_mAP_75: 0.2140 coco/bbox_mAP_s: 0.1190 coco/bbox_mAP_m: 0.2520 coco/bbox_mAP_l: 0.2480 coco/segm_mAP: 0.1110 coco/segm_mAP_50: 0.2520 coco/segm_mAP_75: 0.0840 coco/segm_mAP_s: 0.0440 coco/segm_mAP_m: 0.1440 coco/segm_mAP_l: 0.1790 Bleu_1: 0.6437 Bleu_2: 0.4587 Bleu_3: 0.3137 Bleu_4: 0.2121 METEOR: 0.2022 ROUGE_L: 0.4725 CIDEr: 0.6465 SPICE: 0.1355 aAcc: 76.4600 mIoU: 31.8800 mAcc: 42.4600 visual-grounding/miou: 0.4986 visual-grounding/acc: 0.5614 data_time: 0.0102 time: 0.5281 +2023/10/26 11:39:12 - mmengine - INFO - Iter(train) [ 20500/640000] base_lr: 1.9950e-04 lr: 1.9954e-05 eta: 7 days, 22:55:24 time: 1.1065 data_time: 0.0302 memory: 21518 grad_norm: 2.6548 loss: 1.8551 caption_loss_cls: 3.1226 grounding_loss_reg: 4.8267 detection_loss_cls: 0.0782 detection_loss_reg: 0.4504 semantic_segmentation_loss_cls: 0.0209 instance_segmentation_loss_cls: 0.0804 instance_segmentation_loss_reg: 0.4541 instance_segmentation_loss_poly: 1.2872 +2023/10/26 11:48:27 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231026_050054 +2023/10/26 11:48:27 - mmengine - INFO - Iter(train) [ 21000/640000] base_lr: 1.9947e-04 lr: 1.9952e-05 eta: 7 days, 22:46:33 time: 1.1120 data_time: 0.0305 memory: 21517 grad_norm: 2.6382 loss: 1.8455 caption_loss_cls: 3.0935 grounding_loss_reg: 4.7845 detection_loss_cls: 0.0764 detection_loss_reg: 0.4480 semantic_segmentation_loss_cls: 0.0202 instance_segmentation_loss_cls: 0.0784 instance_segmentation_loss_reg: 0.4514 instance_segmentation_loss_poly: 1.2747 +2023/10/26 11:48:27 - mmengine - INFO - Saving checkpoint at 21000 iterations +2023/10/26 11:57:17 - mmengine - INFO - Iter(train) [ 21500/640000] base_lr: 1.9945e-04 lr: 1.9950e-05 eta: 7 days, 22:25:24 time: 1.1059 data_time: 0.0306 memory: 21517 grad_norm: 2.6773 loss: 1.8699 caption_loss_cls: 3.0687 grounding_loss_reg: 4.7364 detection_loss_cls: 0.0749 detection_loss_reg: 0.4451 semantic_segmentation_loss_cls: 0.0198 instance_segmentation_loss_cls: 0.0768 instance_segmentation_loss_reg: 0.4484 instance_segmentation_loss_poly: 1.2630 +2023/10/26 12:06:42 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231026_050054 +2023/10/26 12:06:42 - mmengine - INFO - Iter(train) [ 22000/640000] base_lr: 1.9942e-04 lr: 1.9948e-05 eta: 7 days, 22:20:57 time: 1.1113 data_time: 0.0310 memory: 21517 grad_norm: 2.6644 loss: 1.8677 caption_loss_cls: 3.0469 grounding_loss_reg: 4.6969 detection_loss_cls: 0.0738 detection_loss_reg: 0.4428 semantic_segmentation_loss_cls: 0.0195 instance_segmentation_loss_cls: 0.0755 instance_segmentation_loss_reg: 0.4455 instance_segmentation_loss_poly: 1.2518 +2023/10/26 12:06:42 - mmengine - INFO - Saving checkpoint at 22000 iterations +2023/10/26 12:16:07 - mmengine - INFO - Iter(train) [ 22500/640000] base_lr: 1.9940e-04 lr: 1.9945e-05 eta: 7 days, 22:16:35 time: 1.1091 data_time: 0.0311 memory: 21517 grad_norm: 2.6925 loss: 1.8691 caption_loss_cls: 3.0316 grounding_loss_reg: 4.6543 detection_loss_cls: 0.0728 detection_loss_reg: 0.4410 semantic_segmentation_loss_cls: 0.0193 instance_segmentation_loss_cls: 0.0746 instance_segmentation_loss_reg: 0.4433 instance_segmentation_loss_poly: 1.2432 +2023/10/26 12:25:38 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231026_050054 +2023/10/26 12:25:38 - mmengine - INFO - Iter(train) [ 23000/640000] base_lr: 1.9937e-04 lr: 1.9943e-05 eta: 7 days, 22:14:55 time: 1.1124 data_time: 0.0314 memory: 21517 grad_norm: 2.6769 loss: 1.8589 caption_loss_cls: 3.0152 grounding_loss_reg: 4.6217 detection_loss_cls: 0.0716 detection_loss_reg: 0.4385 semantic_segmentation_loss_cls: 0.0191 instance_segmentation_loss_cls: 0.0739 instance_segmentation_loss_reg: 0.4419 instance_segmentation_loss_poly: 1.2356 +2023/10/26 12:25:38 - mmengine - INFO - Saving checkpoint at 23000 iterations +2023/10/26 12:35:18 - mmengine - INFO - Iter(train) [ 23500/640000] base_lr: 1.9934e-04 lr: 1.9940e-05 eta: 7 days, 22:16:33 time: 1.1225 data_time: 0.0321 memory: 21517 grad_norm: 2.6594 loss: 1.8580 caption_loss_cls: 3.0025 grounding_loss_reg: 4.5876 detection_loss_cls: 0.0710 detection_loss_reg: 0.4367 semantic_segmentation_loss_cls: 0.0189 instance_segmentation_loss_cls: 0.0734 instance_segmentation_loss_reg: 0.4416 instance_segmentation_loss_poly: 1.2304 +2023/10/26 12:44:36 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231026_050054 +2023/10/26 12:44:36 - mmengine - INFO - Iter(train) [ 24000/640000] base_lr: 1.9931e-04 lr: 1.9938e-05 eta: 7 days, 22:08:06 time: 1.1228 data_time: 0.0339 memory: 21517 grad_norm: 2.6972 loss: 1.8764 caption_loss_cls: 2.9886 grounding_loss_reg: 4.5511 detection_loss_cls: 0.0705 detection_loss_reg: 0.4363 semantic_segmentation_loss_cls: 0.0187 instance_segmentation_loss_cls: 0.0727 instance_segmentation_loss_reg: 0.4395 instance_segmentation_loss_poly: 1.2241 +2023/10/26 12:44:36 - mmengine - INFO - Saving checkpoint at 24000 iterations +2023/10/26 12:54:30 - mmengine - INFO - Iter(train) [ 24500/640000] base_lr: 1.9928e-04 lr: 1.9935e-05 eta: 7 days, 22:15:09 time: 1.1296 data_time: 0.0366 memory: 21517 grad_norm: 2.6491 loss: 1.8438 caption_loss_cls: 2.9772 grounding_loss_reg: 4.5258 detection_loss_cls: 0.0699 detection_loss_reg: 0.4346 semantic_segmentation_loss_cls: 0.0185 instance_segmentation_loss_cls: 0.0719 instance_segmentation_loss_reg: 0.4371 instance_segmentation_loss_poly: 1.2151 +2023/10/26 13:04:21 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231026_050054 +2023/10/26 13:04:21 - mmengine - INFO - Iter(train) [ 25000/640000] base_lr: 1.9926e-04 lr: 1.9932e-05 eta: 7 days, 22:19:55 time: 1.1384 data_time: 0.0369 memory: 21517 grad_norm: 2.6388 loss: 1.8309 caption_loss_cls: 2.9672 grounding_loss_reg: 4.4982 detection_loss_cls: 0.0690 detection_loss_reg: 0.4322 semantic_segmentation_loss_cls: 0.0184 instance_segmentation_loss_cls: 0.0710 instance_segmentation_loss_reg: 0.4348 instance_segmentation_loss_poly: 1.2077 +2023/10/26 13:04:21 - mmengine - INFO - Saving checkpoint at 25000 iterations +2023/10/26 13:13:47 - mmengine - INFO - Iter(train) [ 25500/640000] base_lr: 1.9923e-04 lr: 1.9930e-05 eta: 7 days, 22:14:10 time: 1.1474 data_time: 0.0371 memory: 21517 grad_norm: 2.6206 loss: 1.8115 caption_loss_cls: 2.9591 grounding_loss_reg: 4.4667 detection_loss_cls: 0.0682 detection_loss_reg: 0.4298 semantic_segmentation_loss_cls: 0.0183 instance_segmentation_loss_cls: 0.0702 instance_segmentation_loss_reg: 0.4325 instance_segmentation_loss_poly: 1.1999 +2023/10/26 13:23:32 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231026_050054 +2023/10/26 13:23:32 - mmengine - INFO - Iter(train) [ 26000/640000] base_lr: 1.9919e-04 lr: 1.9927e-05 eta: 7 days, 22:15:44 time: 1.1525 data_time: 0.0370 memory: 21517 grad_norm: 2.5793 loss: 1.7860 caption_loss_cls: 2.9472 grounding_loss_reg: 4.4419 detection_loss_cls: 0.0677 detection_loss_reg: 0.4288 semantic_segmentation_loss_cls: 0.0181 instance_segmentation_loss_cls: 0.0701 instance_segmentation_loss_reg: 0.4326 instance_segmentation_loss_poly: 1.1985 +2023/10/26 13:23:32 - mmengine - INFO - Saving checkpoint at 26000 iterations +2023/10/26 13:32:51 - mmengine - INFO - Iter(train) [ 26500/640000] base_lr: 1.9916e-04 lr: 1.9924e-05 eta: 7 days, 22:07:02 time: 1.1510 data_time: 0.0369 memory: 21517 grad_norm: 2.5350 loss: 1.7599 caption_loss_cls: 2.9358 grounding_loss_reg: 4.4155 detection_loss_cls: 0.0674 detection_loss_reg: 0.4274 semantic_segmentation_loss_cls: 0.0180 instance_segmentation_loss_cls: 0.0696 instance_segmentation_loss_reg: 0.4318 instance_segmentation_loss_poly: 1.1955 +2023/10/26 13:41:59 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231026_050054 +2023/10/26 13:41:59 - mmengine - INFO - Iter(train) [ 27000/640000] base_lr: 1.9913e-04 lr: 1.9921e-05 eta: 7 days, 21:53:58 time: 1.1451 data_time: 0.0366 memory: 21517 grad_norm: 2.5690 loss: 1.7664 caption_loss_cls: 2.9220 grounding_loss_reg: 4.3882 detection_loss_cls: 0.0673 detection_loss_reg: 0.4281 semantic_segmentation_loss_cls: 0.0179 instance_segmentation_loss_cls: 0.0694 instance_segmentation_loss_reg: 0.4317 instance_segmentation_loss_poly: 1.1931 +2023/10/26 13:41:59 - mmengine - INFO - Saving checkpoint at 27000 iterations +2023/10/26 13:51:27 - mmengine - INFO - Iter(train) [ 27500/640000] base_lr: 1.9910e-04 lr: 1.9918e-05 eta: 7 days, 21:48:26 time: 1.1421 data_time: 0.0363 memory: 21517 grad_norm: 2.5696 loss: 1.7553 caption_loss_cls: 2.9137 grounding_loss_reg: 4.3644 detection_loss_cls: 0.0666 detection_loss_reg: 0.4269 semantic_segmentation_loss_cls: 0.0178 instance_segmentation_loss_cls: 0.0691 instance_segmentation_loss_reg: 0.4318 instance_segmentation_loss_poly: 1.1912 +2023/10/26 14:00:44 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231026_050054 +2023/10/26 14:00:44 - mmengine - INFO - Iter(train) [ 28000/640000] base_lr: 1.9907e-04 lr: 1.9915e-05 eta: 7 days, 21:38:47 time: 1.1419 data_time: 0.0347 memory: 21517 grad_norm: 2.5469 loss: 1.7409 caption_loss_cls: 2.9033 grounding_loss_reg: 4.3421 detection_loss_cls: 0.0662 detection_loss_reg: 0.4269 semantic_segmentation_loss_cls: 0.0177 instance_segmentation_loss_cls: 0.0689 instance_segmentation_loss_reg: 0.4316 instance_segmentation_loss_poly: 1.1900 +2023/10/26 14:00:44 - mmengine - INFO - Saving checkpoint at 28000 iterations +2023/10/26 14:10:08 - mmengine - INFO - Iter(train) [ 28500/640000] base_lr: 1.9903e-04 lr: 1.9912e-05 eta: 7 days, 21:31:50 time: 1.1343 data_time: 0.0345 memory: 21517 grad_norm: 2.5907 loss: 1.7622 caption_loss_cls: 2.8976 grounding_loss_reg: 4.3204 detection_loss_cls: 0.0659 detection_loss_reg: 0.4271 semantic_segmentation_loss_cls: 0.0176 instance_segmentation_loss_cls: 0.0686 instance_segmentation_loss_reg: 0.4310 instance_segmentation_loss_poly: 1.1867 +2023/10/26 14:18:41 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231026_050054 +2023/10/26 14:18:41 - mmengine - INFO - Iter(train) [ 29000/640000] base_lr: 1.9900e-04 lr: 1.9909e-05 eta: 7 days, 21:06:52 time: 1.1150 data_time: 0.0340 memory: 21517 grad_norm: 2.6497 loss: 1.7907 caption_loss_cls: 2.8901 grounding_loss_reg: 4.2979 detection_loss_cls: 0.0654 detection_loss_reg: 0.4264 semantic_segmentation_loss_cls: 0.0176 instance_segmentation_loss_cls: 0.0684 instance_segmentation_loss_reg: 0.4310 instance_segmentation_loss_poly: 1.1854 +2023/10/26 14:18:41 - mmengine - INFO - Saving checkpoint at 29000 iterations +2023/10/26 14:28:02 - mmengine - INFO - Iter(train) [ 29500/640000] base_lr: 1.9896e-04 lr: 1.9906e-05 eta: 7 days, 20:58:56 time: 1.1138 data_time: 0.0342 memory: 21517 grad_norm: 2.6650 loss: 1.7919 caption_loss_cls: 2.8880 grounding_loss_reg: 4.2742 detection_loss_cls: 0.0649 detection_loss_reg: 0.4246 semantic_segmentation_loss_cls: 0.0175 instance_segmentation_loss_cls: 0.0679 instance_segmentation_loss_reg: 0.4283 instance_segmentation_loss_poly: 1.1785 +2023/10/26 14:37:03 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231026_050054 +2023/10/26 14:37:03 - mmengine - INFO - Iter(train) [ 30000/640000] base_lr: 1.9893e-04 lr: 1.9903e-05 eta: 7 days, 20:44:07 time: 1.1028 data_time: 0.0340 memory: 21517 grad_norm: 2.7182 loss: 1.8062 caption_loss_cls: 2.8800 grounding_loss_reg: 4.2552 detection_loss_cls: 0.0644 detection_loss_reg: 0.4230 semantic_segmentation_loss_cls: 0.0174 instance_segmentation_loss_cls: 0.0678 instance_segmentation_loss_reg: 0.4286 instance_segmentation_loss_poly: 1.1775 +2023/10/26 14:37:03 - mmengine - INFO - Saving checkpoint at 30000 iterations +2023/10/26 14:46:36 - mmengine - INFO - Iter(train) [ 30500/640000] base_lr: 1.9889e-04 lr: 1.9899e-05 eta: 7 days, 20:40:02 time: 1.1061 data_time: 0.0341 memory: 21517 grad_norm: 2.7295 loss: 1.8156 caption_loss_cls: 2.8737 grounding_loss_reg: 4.2395 detection_loss_cls: 0.0641 detection_loss_reg: 0.4226 semantic_segmentation_loss_cls: 0.0173 instance_segmentation_loss_cls: 0.0676 instance_segmentation_loss_reg: 0.4285 instance_segmentation_loss_poly: 1.1763 +2023/10/26 14:56:07 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231026_050054 +2023/10/26 14:56:07 - mmengine - INFO - Iter(train) [ 31000/640000] base_lr: 1.9886e-04 lr: 1.9896e-05 eta: 7 days, 20:35:15 time: 1.1119 data_time: 0.0343 memory: 21517 grad_norm: 2.6998 loss: 1.8074 caption_loss_cls: 2.8674 grounding_loss_reg: 4.2212 detection_loss_cls: 0.0639 detection_loss_reg: 0.4220 semantic_segmentation_loss_cls: 0.0172 instance_segmentation_loss_cls: 0.0673 instance_segmentation_loss_reg: 0.4269 instance_segmentation_loss_poly: 1.1717 +2023/10/26 14:56:07 - mmengine - INFO - Saving checkpoint at 31000 iterations +2023/10/26 15:05:29 - mmengine - INFO - Iter(train) [ 31500/640000] base_lr: 1.9882e-04 lr: 1.9893e-05 eta: 7 days, 20:27:21 time: 1.1104 data_time: 0.0341 memory: 21517 grad_norm: 2.6829 loss: 1.7885 caption_loss_cls: 2.8587 grounding_loss_reg: 4.2043 detection_loss_cls: 0.0636 detection_loss_reg: 0.4203 semantic_segmentation_loss_cls: 0.0172 instance_segmentation_loss_cls: 0.0669 instance_segmentation_loss_reg: 0.4245 instance_segmentation_loss_poly: 1.1648 +2023/10/26 15:15:14 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231026_050054 +2023/10/26 15:15:14 - mmengine - INFO - Iter(train) [ 32000/640000] base_lr: 1.9878e-04 lr: 1.9889e-05 eta: 7 days, 20:26:53 time: 1.1175 data_time: 0.0343 memory: 21517 grad_norm: 2.6922 loss: 1.7804 caption_loss_cls: 2.8525 grounding_loss_reg: 4.1856 detection_loss_cls: 0.0631 detection_loss_reg: 0.4172 semantic_segmentation_loss_cls: 0.0171 instance_segmentation_loss_cls: 0.0665 instance_segmentation_loss_reg: 0.4227 instance_segmentation_loss_poly: 1.1587 +2023/10/26 15:15:14 - mmengine - INFO - Saving checkpoint at 32000 iterations +2023/10/26 15:24:58 - mmengine - INFO - Iter(train) [ 32500/640000] base_lr: 1.9874e-04 lr: 1.9886e-05 eta: 7 days, 20:25:50 time: 1.1225 data_time: 0.0345 memory: 21517 grad_norm: 2.6673 loss: 1.7657 caption_loss_cls: 2.8488 grounding_loss_reg: 4.1687 detection_loss_cls: 0.0629 detection_loss_reg: 0.4167 semantic_segmentation_loss_cls: 0.0170 instance_segmentation_loss_cls: 0.0661 instance_segmentation_loss_reg: 0.4228 instance_segmentation_loss_poly: 1.1569 +2023/10/26 15:34:02 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231026_050054 +2023/10/26 15:34:02 - mmengine - INFO - Iter(train) [ 33000/640000] base_lr: 1.9870e-04 lr: 1.9882e-05 eta: 7 days, 20:12:09 time: 1.1302 data_time: 0.0346 memory: 21517 grad_norm: 2.6392 loss: 1.7410 caption_loss_cls: 2.8416 grounding_loss_reg: 4.1530 detection_loss_cls: 0.0626 detection_loss_reg: 0.4164 semantic_segmentation_loss_cls: 0.0169 instance_segmentation_loss_cls: 0.0657 instance_segmentation_loss_reg: 0.4217 instance_segmentation_loss_poly: 1.1538 +2023/10/26 15:34:02 - mmengine - INFO - Saving checkpoint at 33000 iterations +2023/10/26 15:43:07 - mmengine - INFO - Iter(train) [ 33500/640000] base_lr: 1.9866e-04 lr: 1.9879e-05 eta: 7 days, 19:58:52 time: 1.1262 data_time: 0.0343 memory: 21517 grad_norm: 2.6483 loss: 1.7425 caption_loss_cls: 2.8385 grounding_loss_reg: 4.1388 detection_loss_cls: 0.0624 detection_loss_reg: 0.4154 semantic_segmentation_loss_cls: 0.0168 instance_segmentation_loss_cls: 0.0653 instance_segmentation_loss_reg: 0.4203 instance_segmentation_loss_poly: 1.1500 +2023/10/26 15:52:21 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231026_050054 +2023/10/26 15:52:21 - mmengine - INFO - Iter(train) [ 34000/640000] base_lr: 1.9862e-04 lr: 1.9875e-05 eta: 7 days, 19:48:09 time: 1.1292 data_time: 0.0345 memory: 21517 grad_norm: 2.6381 loss: 1.7400 caption_loss_cls: 2.8293 grounding_loss_reg: 4.1237 detection_loss_cls: 0.0622 detection_loss_reg: 0.4146 semantic_segmentation_loss_cls: 0.0168 instance_segmentation_loss_cls: 0.0647 instance_segmentation_loss_reg: 0.4186 instance_segmentation_loss_poly: 1.1471 +2023/10/26 15:52:21 - mmengine - INFO - Saving checkpoint at 34000 iterations +2023/10/26 16:01:53 - mmengine - INFO - Iter(train) [ 34500/640000] base_lr: 1.9858e-04 lr: 1.9871e-05 eta: 7 days, 19:43:08 time: 1.1292 data_time: 0.0345 memory: 21517 grad_norm: 2.6430 loss: 1.7377 caption_loss_cls: 2.8192 grounding_loss_reg: 4.1069 detection_loss_cls: 0.0618 detection_loss_reg: 0.4129 semantic_segmentation_loss_cls: 0.0168 instance_segmentation_loss_cls: 0.0643 instance_segmentation_loss_reg: 0.4175 instance_segmentation_loss_poly: 1.1428 +2023/10/26 16:10:58 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231026_050054 +2023/10/26 16:10:58 - mmengine - INFO - Iter(train) [ 35000/640000] base_lr: 1.9854e-04 lr: 1.9868e-05 eta: 7 days, 19:29:57 time: 1.1226 data_time: 0.0344 memory: 21517 grad_norm: 2.6481 loss: 1.7309 caption_loss_cls: 2.8166 grounding_loss_reg: 4.0912 detection_loss_cls: 0.0615 detection_loss_reg: 0.4116 semantic_segmentation_loss_cls: 0.0168 instance_segmentation_loss_cls: 0.0642 instance_segmentation_loss_reg: 0.4169 instance_segmentation_loss_poly: 1.1413 +2023/10/26 16:10:58 - mmengine - INFO - Saving checkpoint at 35000 iterations +2023/10/26 16:20:15 - mmengine - INFO - Iter(train) [ 35500/640000] base_lr: 1.9850e-04 lr: 1.9864e-05 eta: 7 days, 19:20:36 time: 1.1216 data_time: 0.0343 memory: 21517 grad_norm: 2.6680 loss: 1.7394 caption_loss_cls: 2.8123 grounding_loss_reg: 4.0770 detection_loss_cls: 0.0616 detection_loss_reg: 0.4121 semantic_segmentation_loss_cls: 0.0167 instance_segmentation_loss_cls: 0.0639 instance_segmentation_loss_reg: 0.4159 instance_segmentation_loss_poly: 1.1388 +2023/10/26 16:29:32 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231026_050054 +2023/10/26 16:29:32 - mmengine - INFO - Iter(train) [ 36000/640000] base_lr: 1.9846e-04 lr: 1.9860e-05 eta: 7 days, 19:10:50 time: 1.1143 data_time: 0.0342 memory: 21517 grad_norm: 2.6515 loss: 1.7290 caption_loss_cls: 2.8051 grounding_loss_reg: 4.0629 detection_loss_cls: 0.0612 detection_loss_reg: 0.4110 semantic_segmentation_loss_cls: 0.0166 instance_segmentation_loss_cls: 0.0636 instance_segmentation_loss_reg: 0.4152 instance_segmentation_loss_poly: 1.1367 +2023/10/26 16:29:32 - mmengine - INFO - Saving checkpoint at 36000 iterations +2023/10/26 16:39:09 - mmengine - INFO - Iter(train) [ 36500/640000] base_lr: 1.9842e-04 lr: 1.9856e-05 eta: 7 days, 19:07:03 time: 1.1127 data_time: 0.0342 memory: 21517 grad_norm: 2.6749 loss: 1.7388 caption_loss_cls: 2.8020 grounding_loss_reg: 4.0467 detection_loss_cls: 0.0610 detection_loss_reg: 0.4104 semantic_segmentation_loss_cls: 0.0166 instance_segmentation_loss_cls: 0.0632 instance_segmentation_loss_reg: 0.4140 instance_segmentation_loss_poly: 1.1346 +2023/10/26 16:48:37 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231026_050054 +2023/10/26 16:48:37 - mmengine - INFO - Iter(train) [ 37000/640000] base_lr: 1.9837e-04 lr: 1.9852e-05 eta: 7 days, 19:00:24 time: 1.1186 data_time: 0.0346 memory: 21517 grad_norm: 2.6756 loss: 1.7441 caption_loss_cls: 2.7995 grounding_loss_reg: 4.0350 detection_loss_cls: 0.0608 detection_loss_reg: 0.4102 semantic_segmentation_loss_cls: 0.0165 instance_segmentation_loss_cls: 0.0630 instance_segmentation_loss_reg: 0.4141 instance_segmentation_loss_poly: 1.1342 +2023/10/26 16:48:37 - mmengine - INFO - Saving checkpoint at 37000 iterations +2023/10/26 16:57:15 - mmengine - INFO - Iter(train) [ 37500/640000] base_lr: 1.9833e-04 lr: 1.9848e-05 eta: 7 days, 18:40:14 time: 1.1118 data_time: 0.0345 memory: 21517 grad_norm: 2.6849 loss: 1.7510 caption_loss_cls: 2.7979 grounding_loss_reg: 4.0190 detection_loss_cls: 0.0606 detection_loss_reg: 0.4095 semantic_segmentation_loss_cls: 0.0165 instance_segmentation_loss_cls: 0.0626 instance_segmentation_loss_reg: 0.4130 instance_segmentation_loss_poly: 1.1312 +2023/10/26 17:06:57 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231026_050054 +2023/10/26 17:06:57 - mmengine - INFO - Iter(train) [ 38000/640000] base_lr: 1.9828e-04 lr: 1.9844e-05 eta: 7 days, 18:37:15 time: 1.1190 data_time: 0.0346 memory: 21517 grad_norm: 2.6661 loss: 1.7471 caption_loss_cls: 2.7996 grounding_loss_reg: 4.0083 detection_loss_cls: 0.0605 detection_loss_reg: 0.4103 semantic_segmentation_loss_cls: 0.0164 instance_segmentation_loss_cls: 0.0623 instance_segmentation_loss_reg: 0.4122 instance_segmentation_loss_poly: 1.1293 +2023/10/26 17:06:57 - mmengine - INFO - Saving checkpoint at 38000 iterations +2023/10/26 17:16:47 - mmengine - INFO - Iter(train) [ 38500/640000] base_lr: 1.9824e-04 lr: 1.9840e-05 eta: 7 days, 18:36:23 time: 1.1234 data_time: 0.0348 memory: 21517 grad_norm: 2.6505 loss: 1.7388 caption_loss_cls: 2.7987 grounding_loss_reg: 3.9969 detection_loss_cls: 0.0603 detection_loss_reg: 0.4092 semantic_segmentation_loss_cls: 0.0163 instance_segmentation_loss_cls: 0.0622 instance_segmentation_loss_reg: 0.4118 instance_segmentation_loss_poly: 1.1266 +2023/10/26 17:25:55 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231026_050054 +2023/10/26 17:25:55 - mmengine - INFO - Iter(train) [ 39000/640000] base_lr: 1.9819e-04 lr: 1.9836e-05 eta: 7 days, 18:24:15 time: 1.1241 data_time: 0.0348 memory: 21517 grad_norm: 2.6542 loss: 1.7303 caption_loss_cls: 2.7933 grounding_loss_reg: 3.9839 detection_loss_cls: 0.0602 detection_loss_reg: 0.4087 semantic_segmentation_loss_cls: 0.0163 instance_segmentation_loss_cls: 0.0621 instance_segmentation_loss_reg: 0.4114 instance_segmentation_loss_poly: 1.1253 +2023/10/26 17:25:55 - mmengine - INFO - Saving checkpoint at 39000 iterations +2023/10/26 17:35:08 - mmengine - INFO - Iter(train) [ 39500/640000] base_lr: 1.9814e-04 lr: 1.9831e-05 eta: 7 days, 18:13:36 time: 1.1230 data_time: 0.0351 memory: 21517 grad_norm: 2.6662 loss: 1.7354 caption_loss_cls: 2.7834 grounding_loss_reg: 3.9739 detection_loss_cls: 0.0599 detection_loss_reg: 0.4081 semantic_segmentation_loss_cls: 0.0162 instance_segmentation_loss_cls: 0.0620 instance_segmentation_loss_reg: 0.4119 instance_segmentation_loss_poly: 1.1260 +2023/10/26 17:44:10 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231026_050054 +2023/10/26 17:44:10 - mmengine - INFO - Iter(train) [ 40000/640000] base_lr: 1.9810e-04 lr: 1.9827e-05 eta: 7 days, 18:00:22 time: 1.1196 data_time: 0.0349 memory: 21517 grad_norm: 2.6778 loss: 1.7378 caption_loss_cls: 2.7816 grounding_loss_reg: 3.9615 detection_loss_cls: 0.0597 detection_loss_reg: 0.4077 semantic_segmentation_loss_cls: 0.0162 instance_segmentation_loss_cls: 0.0617 instance_segmentation_loss_reg: 0.4111 instance_segmentation_loss_poly: 1.1230 +2023/10/26 17:44:10 - mmengine - INFO - Saving checkpoint at 40000 iterations +2023/10/26 17:52:55 - mmengine - INFO - Evaluating bbox... +2023/10/26 17:53:51 - mmengine - INFO - bbox_mAP_copypaste: 0.265 0.423 0.286 0.155 0.312 0.338 +2023/10/26 17:53:51 - mmengine - INFO - Evaluating segm... +2023/10/26 17:55:02 - mmengine - INFO - segm_mAP_copypaste: 0.161 0.335 0.139 0.069 0.198 0.253 +2023/10/26 17:59:24 - mmengine - INFO - per class results: +2023/10/26 17:59:24 - mmengine - INFO - ++---------------------+-------+-------+ +| Class | IoU | Acc | ++---------------------+-------+-------+ +| wall | 72.87 | 85.29 | +| building | 78.66 | 89.28 | +| sky | 92.64 | 97.03 | +| floor | 77.05 | 89.09 | +| tree | 69.97 | 81.55 | +| ceiling | 80.46 | 89.99 | +| road | 79.98 | 85.89 | +| bed | 80.04 | 90.49 | +| windowpane | 54.89 | 74.77 | +| grass | 64.38 | 90.82 | +| cabinet | 53.51 | 70.48 | +| sidewalk | 57.62 | 80.61 | +| person | 75.55 | 88.33 | +| earth | 34.44 | 47.9 | +| door | 35.83 | 50.49 | +| table | 45.2 | 73.23 | +| mountain | 52.58 | 67.26 | +| plant | 46.6 | 59.65 | +| curtain | 65.46 | 77.33 | +| chair | 43.74 | 58.55 | +| car | 76.97 | 90.96 | +| water | 49.22 | 66.22 | +| painting | 63.81 | 82.24 | +| sofa | 51.49 | 61.12 | +| shelf | 30.06 | 43.2 | +| house | 46.4 | 75.41 | +| sea | 45.45 | 65.65 | +| mirror | 49.31 | 58.06 | +| rug | 47.96 | 50.83 | +| field | 18.14 | 23.66 | +| armchair | 30.9 | 52.62 | +| seat | 45.85 | 78.42 | +| fence | 30.35 | 52.2 | +| desk | 24.01 | 47.05 | +| rock | 31.12 | 47.63 | +| wardrobe | 45.66 | 78.1 | +| lamp | 47.43 | 62.02 | +| bathtub | 52.0 | 58.07 | +| railing | 26.0 | 40.77 | +| cushion | 40.99 | 54.2 | +| base | 17.03 | 51.77 | +| box | 15.74 | 20.98 | +| column | 46.67 | 56.67 | +| signboard | 31.28 | 47.56 | +| chest of drawers | 26.26 | 33.79 | +| counter | 23.42 | 33.57 | +| sand | 29.67 | 43.91 | +| sink | 51.51 | 59.32 | +| skyscraper | 48.44 | 61.26 | +| fireplace | 52.72 | 64.05 | +| refrigerator | 59.41 | 65.37 | +| grandstand | 39.9 | 56.78 | +| path | 11.93 | 15.55 | +| stairs | 22.3 | 25.06 | +| runway | 67.36 | 85.69 | +| case | 27.18 | 45.47 | +| pool table | 86.42 | 91.36 | +| pillow | 37.94 | 45.19 | +| screen door | 43.28 | 54.28 | +| stairway | 26.52 | 29.24 | +| river | 18.43 | 32.67 | +| bridge | 32.09 | 74.16 | +| bookcase | 29.46 | 47.03 | +| blind | 8.72 | 8.84 | +| coffee table | 49.58 | 70.57 | +| toilet | 74.32 | 82.39 | +| flower | 22.15 | 37.15 | +| book | 38.26 | 59.8 | +| hill | 6.39 | 12.91 | +| bench | 38.29 | 50.24 | +| countertop | 40.94 | 64.33 | +| stove | 53.03 | 64.41 | +| palm | 37.99 | 50.72 | +| kitchen island | 16.0 | 21.47 | +| computer | 51.05 | 58.48 | +| swivel chair | 34.65 | 46.98 | +| boat | 62.11 | 67.05 | +| bar | 31.21 | 38.62 | +| arcade machine | 35.71 | 46.99 | +| hovel | 6.57 | 8.14 | +| bus | 75.39 | 92.95 | +| towel | 43.4 | 51.92 | +| light | 35.6 | 43.67 | +| truck | 20.44 | 33.55 | +| tower | 29.02 | 39.2 | +| chandelier | 49.95 | 59.55 | +| awning | 20.09 | 29.21 | +| streetlight | 19.59 | 26.21 | +| booth | 27.26 | 49.05 | +| television receiver | 56.86 | 67.31 | +| airplane | 45.82 | 61.57 | +| dirt track | 0.0 | 0.0 | +| apparel | 8.74 | 10.31 | +| pole | 19.67 | 33.5 | +| land | 0.66 | 0.72 | +| bannister | 1.36 | 1.58 | +| escalator | 15.67 | 19.08 | +| ottoman | 23.24 | 26.86 | +| bottle | 15.24 | 17.13 | +| buffet | 33.47 | 39.11 | +| poster | 9.55 | 10.68 | +| stage | 7.71 | 10.88 | +| van | 9.12 | 9.87 | +| ship | 4.52 | 5.06 | +| fountain | 0.21 | 0.24 | +| conveyer belt | 48.42 | 68.11 | +| canopy | 21.39 | 46.38 | +| washer | 39.44 | 60.58 | +| plaything | 14.23 | 15.96 | +| swimming pool | 5.62 | 6.07 | +| stool | 22.99 | 27.08 | +| barrel | 9.46 | 47.57 | +| basket | 14.13 | 20.15 | +| waterfall | 41.39 | 42.25 | +| tent | 78.76 | 97.21 | +| bag | 4.21 | 4.44 | +| minibike | 60.87 | 71.69 | +| cradle | 60.22 | 74.1 | +| oven | 28.27 | 41.41 | +| ball | 43.92 | 58.48 | +| food | 46.98 | 57.16 | +| step | 6.66 | 7.26 | +| tank | 30.85 | 33.73 | +| trade name | 5.81 | 5.9 | +| microwave | 31.15 | 37.81 | +| pot | 32.37 | 37.87 | +| animal | 56.92 | 59.43 | +| bicycle | 47.84 | 68.15 | +| lake | 0.0 | 0.0 | +| dishwasher | 33.36 | 40.96 | +| screen | 56.39 | 88.27 | +| blanket | 0.81 | 0.84 | +| sculpture | 30.3 | 39.46 | +| hood | 35.29 | 41.48 | +| sconce | 11.38 | 12.14 | +| vase | 28.88 | 36.01 | +| traffic light | 19.47 | 26.88 | +| tray | 2.16 | 3.57 | +| ashcan | 27.29 | 33.2 | +| fan | 39.34 | 56.99 | +| pier | 49.36 | 76.58 | +| crt screen | 1.05 | 1.18 | +| plate | 35.69 | 41.77 | +| monitor | 35.85 | 65.95 | +| bulletin board | 11.93 | 12.92 | +| shower | 0.0 | 0.0 | +| radiator | 33.19 | 40.87 | +| glass | 6.61 | 6.76 | +| clock | 10.36 | 11.42 | +| flag | 21.07 | 22.65 | ++---------------------+-------+-------+ +2023/10/26 17:59:39 - mmengine - INFO - Iter(val) [209/209] coco/bbox_mAP: 0.2650 coco/bbox_mAP_50: 0.4230 coco/bbox_mAP_75: 0.2860 coco/bbox_mAP_s: 0.1550 coco/bbox_mAP_m: 0.3120 coco/bbox_mAP_l: 0.3380 coco/segm_mAP: 0.1610 coco/segm_mAP_50: 0.3350 coco/segm_mAP_75: 0.1390 coco/segm_mAP_s: 0.0690 coco/segm_mAP_m: 0.1980 coco/segm_mAP_l: 0.2530 Bleu_1: 0.6709 Bleu_2: 0.4927 Bleu_3: 0.3517 Bleu_4: 0.2501 METEOR: 0.2175 ROUGE_L: 0.4909 CIDEr: 0.7580 SPICE: 0.1537 aAcc: 78.2200 mIoU: 35.8700 mAcc: 47.0300 visual-grounding/miou: 0.6013 visual-grounding/acc: 0.6905 data_time: 0.0047 time: 0.5215 +2023/10/26 18:08:16 - mmengine - INFO - Iter(train) [ 40500/640000] base_lr: 1.9805e-04 lr: 1.9823e-05 eta: 7 days, 17:41:21 time: 1.1048 data_time: 0.0315 memory: 21517 grad_norm: 2.6884 loss: 1.7335 caption_loss_cls: 2.7780 grounding_loss_reg: 3.9503 detection_loss_cls: 0.0595 detection_loss_reg: 0.4065 semantic_segmentation_loss_cls: 0.0161 instance_segmentation_loss_cls: 0.0615 instance_segmentation_loss_reg: 0.4106 instance_segmentation_loss_poly: 1.1212 +2023/10/26 18:17:17 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231026_050054 +2023/10/26 18:17:17 - mmengine - INFO - Iter(train) [ 41000/640000] base_lr: 1.9800e-04 lr: 1.9818e-05 eta: 7 days, 17:27:56 time: 1.0979 data_time: 0.0312 memory: 21517 grad_norm: 2.6678 loss: 1.7268 caption_loss_cls: 2.7727 grounding_loss_reg: 3.9434 detection_loss_cls: 0.0593 detection_loss_reg: 0.4067 semantic_segmentation_loss_cls: 0.0160 instance_segmentation_loss_cls: 0.0613 instance_segmentation_loss_reg: 0.4100 instance_segmentation_loss_poly: 1.1190 +2023/10/26 18:17:17 - mmengine - INFO - Saving checkpoint at 41000 iterations +2023/10/26 18:26:21 - mmengine - INFO - Iter(train) [ 41500/640000] base_lr: 1.9795e-04 lr: 1.9814e-05 eta: 7 days, 17:15:31 time: 1.1046 data_time: 0.0314 memory: 21517 grad_norm: 2.6506 loss: 1.7110 caption_loss_cls: 2.7707 grounding_loss_reg: 3.9312 detection_loss_cls: 0.0590 detection_loss_reg: 0.4061 semantic_segmentation_loss_cls: 0.0160 instance_segmentation_loss_cls: 0.0610 instance_segmentation_loss_reg: 0.4088 instance_segmentation_loss_poly: 1.1157 +2023/10/26 18:35:16 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231026_050054 +2023/10/26 18:35:16 - mmengine - INFO - Iter(train) [ 42000/640000] base_lr: 1.9790e-04 lr: 1.9809e-05 eta: 7 days, 17:00:55 time: 1.0929 data_time: 0.0310 memory: 21517 grad_norm: 2.6835 loss: 1.7207 caption_loss_cls: 2.7738 grounding_loss_reg: 3.9242 detection_loss_cls: 0.0587 detection_loss_reg: 0.4051 semantic_segmentation_loss_cls: 0.0160 instance_segmentation_loss_cls: 0.0608 instance_segmentation_loss_reg: 0.4074 instance_segmentation_loss_poly: 1.1126 +2023/10/26 18:35:16 - mmengine - INFO - Saving checkpoint at 42000 iterations +2023/10/26 18:44:27 - mmengine - INFO - Iter(train) [ 42500/640000] base_lr: 1.9785e-04 lr: 1.9805e-05 eta: 7 days, 16:50:14 time: 1.0830 data_time: 0.0308 memory: 21517 grad_norm: 2.7258 loss: 1.7338 caption_loss_cls: 2.7661 grounding_loss_reg: 3.9116 detection_loss_cls: 0.0586 detection_loss_reg: 0.4047 semantic_segmentation_loss_cls: 0.0159 instance_segmentation_loss_cls: 0.0606 instance_segmentation_loss_reg: 0.4068 instance_segmentation_loss_poly: 1.1100 +2023/10/26 18:54:08 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231026_050054 +2023/10/26 18:54:08 - mmengine - INFO - Iter(train) [ 43000/640000] base_lr: 1.9780e-04 lr: 1.9800e-05 eta: 7 days, 16:46:35 time: 1.0915 data_time: 0.0310 memory: 21517 grad_norm: 2.7129 loss: 1.7308 caption_loss_cls: 2.7641 grounding_loss_reg: 3.8989 detection_loss_cls: 0.0585 detection_loss_reg: 0.4044 semantic_segmentation_loss_cls: 0.0159 instance_segmentation_loss_cls: 0.0607 instance_segmentation_loss_reg: 0.4078 instance_segmentation_loss_poly: 1.1100 +2023/10/26 18:54:08 - mmengine - INFO - Saving checkpoint at 43000 iterations +2023/10/26 19:03:32 - mmengine - INFO - Iter(train) [ 43500/640000] base_lr: 1.9775e-04 lr: 1.9796e-05 eta: 7 days, 16:38:48 time: 1.0941 data_time: 0.0311 memory: 21517 grad_norm: 2.7200 loss: 1.7353 caption_loss_cls: 2.7595 grounding_loss_reg: 3.8888 detection_loss_cls: 0.0583 detection_loss_reg: 0.4043 semantic_segmentation_loss_cls: 0.0158 instance_segmentation_loss_cls: 0.0604 instance_segmentation_loss_reg: 0.4065 instance_segmentation_loss_poly: 1.1072 +2023/10/26 19:12:44 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231026_050054 +2023/10/26 19:12:44 - mmengine - INFO - Iter(train) [ 44000/640000] base_lr: 1.9770e-04 lr: 1.9791e-05 eta: 7 days, 16:28:19 time: 1.0965 data_time: 0.0313 memory: 21517 grad_norm: 2.7214 loss: 1.7405 caption_loss_cls: 2.7545 grounding_loss_reg: 3.8778 detection_loss_cls: 0.0581 detection_loss_reg: 0.4039 semantic_segmentation_loss_cls: 0.0158 instance_segmentation_loss_cls: 0.0606 instance_segmentation_loss_reg: 0.4079 instance_segmentation_loss_poly: 1.1072 +2023/10/26 19:12:44 - mmengine - INFO - Saving checkpoint at 44000 iterations +2023/10/26 19:22:21 - mmengine - INFO - Iter(train) [ 44500/640000] base_lr: 1.9765e-04 lr: 1.9786e-05 eta: 7 days, 16:23:26 time: 1.1111 data_time: 0.0346 memory: 21517 grad_norm: 2.7040 loss: 1.7349 caption_loss_cls: 2.7500 grounding_loss_reg: 3.8672 detection_loss_cls: 0.0580 detection_loss_reg: 0.4040 semantic_segmentation_loss_cls: 0.0157 instance_segmentation_loss_cls: 0.0607 instance_segmentation_loss_reg: 0.4094 instance_segmentation_loss_poly: 1.1098 +2023/10/26 19:31:32 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231026_050054 +2023/10/26 19:31:32 - mmengine - INFO - Iter(train) [ 45000/640000] base_lr: 1.9759e-04 lr: 1.9781e-05 eta: 7 days, 16:12:48 time: 1.1137 data_time: 0.0347 memory: 21517 grad_norm: 2.7331 loss: 1.7394 caption_loss_cls: 2.7462 grounding_loss_reg: 3.8567 detection_loss_cls: 0.0580 detection_loss_reg: 0.4050 semantic_segmentation_loss_cls: 0.0157 instance_segmentation_loss_cls: 0.0605 instance_segmentation_loss_reg: 0.4095 instance_segmentation_loss_poly: 1.1083 +2023/10/26 19:31:32 - mmengine - INFO - Saving checkpoint at 45000 iterations +2023/10/26 19:41:05 - mmengine - INFO - Iter(train) [ 45500/640000] base_lr: 1.9754e-04 lr: 1.9776e-05 eta: 7 days, 16:06:51 time: 1.1208 data_time: 0.0350 memory: 21517 grad_norm: 2.6948 loss: 1.7329 caption_loss_cls: 2.7458 grounding_loss_reg: 3.8486 detection_loss_cls: 0.0580 detection_loss_reg: 0.4058 semantic_segmentation_loss_cls: 0.0157 instance_segmentation_loss_cls: 0.0604 instance_segmentation_loss_reg: 0.4091 instance_segmentation_loss_poly: 1.1071 +2023/10/26 19:50:50 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231026_050054 +2023/10/26 19:50:50 - mmengine - INFO - Iter(train) [ 46000/640000] base_lr: 1.9749e-04 lr: 1.9772e-05 eta: 7 days, 16:03:38 time: 1.1335 data_time: 0.0356 memory: 21517 grad_norm: 2.6573 loss: 1.7137 caption_loss_cls: 2.7443 grounding_loss_reg: 3.8442 detection_loss_cls: 0.0578 detection_loss_reg: 0.4055 semantic_segmentation_loss_cls: 0.0156 instance_segmentation_loss_cls: 0.0602 instance_segmentation_loss_reg: 0.4078 instance_segmentation_loss_poly: 1.1040 +2023/10/26 19:50:50 - mmengine - INFO - Saving checkpoint at 46000 iterations +2023/10/26 20:00:22 - mmengine - INFO - Iter(train) [ 46500/640000] base_lr: 1.9743e-04 lr: 1.9767e-05 eta: 7 days, 15:57:15 time: 1.1387 data_time: 0.0355 memory: 21517 grad_norm: 2.6317 loss: 1.6912 caption_loss_cls: 2.7445 grounding_loss_reg: 3.8320 detection_loss_cls: 0.0575 detection_loss_reg: 0.4049 semantic_segmentation_loss_cls: 0.0156 instance_segmentation_loss_cls: 0.0600 instance_segmentation_loss_reg: 0.4067 instance_segmentation_loss_poly: 1.1001 +2023/10/26 20:10:02 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231026_050054 +2023/10/26 20:10:02 - mmengine - INFO - Iter(train) [ 47000/640000] base_lr: 1.9738e-04 lr: 1.9762e-05 eta: 7 days, 15:52:43 time: 1.1385 data_time: 0.0355 memory: 21517 grad_norm: 2.5834 loss: 1.6757 caption_loss_cls: 2.7422 grounding_loss_reg: 3.8262 detection_loss_cls: 0.0573 detection_loss_reg: 0.4029 semantic_segmentation_loss_cls: 0.0155 instance_segmentation_loss_cls: 0.0598 instance_segmentation_loss_reg: 0.4059 instance_segmentation_loss_poly: 1.0985 +2023/10/26 20:10:02 - mmengine - INFO - Saving checkpoint at 47000 iterations +2023/10/26 20:19:31 - mmengine - INFO - Iter(train) [ 47500/640000] base_lr: 1.9732e-04 lr: 1.9756e-05 eta: 7 days, 15:45:32 time: 1.1397 data_time: 0.0357 memory: 21517 grad_norm: 2.5806 loss: 1.6765 caption_loss_cls: 2.7385 grounding_loss_reg: 3.8163 detection_loss_cls: 0.0571 detection_loss_reg: 0.4023 semantic_segmentation_loss_cls: 0.0155 instance_segmentation_loss_cls: 0.0598 instance_segmentation_loss_reg: 0.4059 instance_segmentation_loss_poly: 1.0969 +2023/10/26 20:29:06 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231026_050054 +2023/10/26 20:29:06 - mmengine - INFO - Iter(train) [ 48000/640000] base_lr: 1.9726e-04 lr: 1.9751e-05 eta: 7 days, 15:39:36 time: 1.1454 data_time: 0.0370 memory: 21517 grad_norm: 2.5612 loss: 1.6699 caption_loss_cls: 2.7364 grounding_loss_reg: 3.8080 detection_loss_cls: 0.0569 detection_loss_reg: 0.4018 semantic_segmentation_loss_cls: 0.0155 instance_segmentation_loss_cls: 0.0597 instance_segmentation_loss_reg: 0.4053 instance_segmentation_loss_poly: 1.0959 +2023/10/26 20:29:06 - mmengine - INFO - Saving checkpoint at 48000 iterations +2023/10/26 20:38:37 - mmengine - INFO - Iter(train) [ 48500/640000] base_lr: 1.9721e-04 lr: 1.9746e-05 eta: 7 days, 15:33:01 time: 1.1441 data_time: 0.0369 memory: 21517 grad_norm: 2.5535 loss: 1.6665 caption_loss_cls: 2.7292 grounding_loss_reg: 3.8013 detection_loss_cls: 0.0568 detection_loss_reg: 0.4008 semantic_segmentation_loss_cls: 0.0154 instance_segmentation_loss_cls: 0.0595 instance_segmentation_loss_reg: 0.4045 instance_segmentation_loss_poly: 1.0937 +2023/10/26 20:48:04 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231026_050054 +2023/10/26 20:48:04 - mmengine - INFO - Iter(train) [ 49000/640000] base_lr: 1.9715e-04 lr: 1.9741e-05 eta: 7 days, 15:25:15 time: 1.1478 data_time: 0.0368 memory: 21517 grad_norm: 2.5136 loss: 1.6427 caption_loss_cls: 2.7275 grounding_loss_reg: 3.7946 detection_loss_cls: 0.0565 detection_loss_reg: 0.4000 semantic_segmentation_loss_cls: 0.0153 instance_segmentation_loss_cls: 0.0593 instance_segmentation_loss_reg: 0.4041 instance_segmentation_loss_poly: 1.0923 +2023/10/26 20:48:04 - mmengine - INFO - Saving checkpoint at 49000 iterations +2023/10/26 20:57:32 - mmengine - INFO - Iter(train) [ 49500/640000] base_lr: 1.9709e-04 lr: 1.9736e-05 eta: 7 days, 15:17:51 time: 1.1468 data_time: 0.0366 memory: 21517 grad_norm: 2.5232 loss: 1.6356 caption_loss_cls: 2.7259 grounding_loss_reg: 3.7845 detection_loss_cls: 0.0565 detection_loss_reg: 0.4008 semantic_segmentation_loss_cls: 0.0153 instance_segmentation_loss_cls: 0.0591 instance_segmentation_loss_reg: 0.4034 instance_segmentation_loss_poly: 1.0897 +2023/10/26 21:06:56 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231026_050054 +2023/10/26 21:06:56 - mmengine - INFO - Iter(train) [ 50000/640000] base_lr: 1.9703e-04 lr: 1.9730e-05 eta: 7 days, 15:09:37 time: 1.1414 data_time: 0.0363 memory: 21517 grad_norm: 2.5555 loss: 1.6375 caption_loss_cls: 2.7259 grounding_loss_reg: 3.7786 detection_loss_cls: 0.0562 detection_loss_reg: 0.3995 semantic_segmentation_loss_cls: 0.0153 instance_segmentation_loss_cls: 0.0586 instance_segmentation_loss_reg: 0.4014 instance_segmentation_loss_poly: 1.0846 +2023/10/26 21:06:56 - mmengine - INFO - Saving checkpoint at 50000 iterations +2023/10/26 21:16:19 - mmengine - INFO - Iter(train) [ 50500/640000] base_lr: 1.9697e-04 lr: 1.9725e-05 eta: 7 days, 15:01:00 time: 1.1391 data_time: 0.0363 memory: 21517 grad_norm: 2.5454 loss: 1.6430 caption_loss_cls: 2.7228 grounding_loss_reg: 3.7678 detection_loss_cls: 0.0561 detection_loss_reg: 0.3987 semantic_segmentation_loss_cls: 0.0152 instance_segmentation_loss_cls: 0.0586 instance_segmentation_loss_reg: 0.4027 instance_segmentation_loss_poly: 1.0866 +2023/10/26 21:25:16 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231026_050054 +2023/10/26 21:25:16 - mmengine - INFO - Iter(train) [ 51000/640000] base_lr: 1.9691e-04 lr: 1.9719e-05 eta: 7 days, 14:47:35 time: 1.1284 data_time: 0.0361 memory: 21517 grad_norm: 2.6108 loss: 1.6607 caption_loss_cls: 2.7220 grounding_loss_reg: 3.7583 detection_loss_cls: 0.0558 detection_loss_reg: 0.3981 semantic_segmentation_loss_cls: 0.0152 instance_segmentation_loss_cls: 0.0585 instance_segmentation_loss_reg: 0.4032 instance_segmentation_loss_poly: 1.0868 +2023/10/26 21:25:16 - mmengine - INFO - Saving checkpoint at 51000 iterations +2023/10/26 21:34:43 - mmengine - INFO - Iter(train) [ 51500/640000] base_lr: 1.9685e-04 lr: 1.9714e-05 eta: 7 days, 14:39:43 time: 1.1278 data_time: 0.0358 memory: 21517 grad_norm: 2.5885 loss: 1.6401 caption_loss_cls: 2.7221 grounding_loss_reg: 3.7508 detection_loss_cls: 0.0557 detection_loss_reg: 0.3982 semantic_segmentation_loss_cls: 0.0151 instance_segmentation_loss_cls: 0.0585 instance_segmentation_loss_reg: 0.4032 instance_segmentation_loss_poly: 1.0867 +2023/10/26 21:44:01 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231026_050054 +2023/10/26 21:44:01 - mmengine - INFO - Iter(train) [ 52000/640000] base_lr: 1.9679e-04 lr: 1.9708e-05 eta: 7 days, 14:30:16 time: 1.1236 data_time: 0.0347 memory: 21517 grad_norm: 2.5972 loss: 1.6423 caption_loss_cls: 2.7212 grounding_loss_reg: 3.7431 detection_loss_cls: 0.0558 detection_loss_reg: 0.3987 semantic_segmentation_loss_cls: 0.0151 instance_segmentation_loss_cls: 0.0582 instance_segmentation_loss_reg: 0.4016 instance_segmentation_loss_poly: 1.0838 +2023/10/26 21:44:01 - mmengine - INFO - Saving checkpoint at 52000 iterations +2023/10/26 21:52:51 - mmengine - INFO - Iter(train) [ 52500/640000] base_lr: 1.9673e-04 lr: 1.9703e-05 eta: 7 days, 14:15:37 time: 1.1132 data_time: 0.0343 memory: 21517 grad_norm: 2.6278 loss: 1.6514 caption_loss_cls: 2.7171 grounding_loss_reg: 3.7393 detection_loss_cls: 0.0557 detection_loss_reg: 0.3987 semantic_segmentation_loss_cls: 0.0151 instance_segmentation_loss_cls: 0.0580 instance_segmentation_loss_reg: 0.4010 instance_segmentation_loss_poly: 1.0821 +2023/10/26 22:02:42 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231026_050054 +2023/10/26 22:02:42 - mmengine - INFO - Iter(train) [ 53000/640000] base_lr: 1.9667e-04 lr: 1.9697e-05 eta: 7 days, 14:12:17 time: 1.1193 data_time: 0.0347 memory: 21517 grad_norm: 2.6255 loss: 1.6567 caption_loss_cls: 2.7131 grounding_loss_reg: 3.7344 detection_loss_cls: 0.0553 detection_loss_reg: 0.3971 semantic_segmentation_loss_cls: 0.0150 instance_segmentation_loss_cls: 0.0581 instance_segmentation_loss_reg: 0.4020 instance_segmentation_loss_poly: 1.0851 +2023/10/26 22:02:42 - mmengine - INFO - Saving checkpoint at 53000 iterations +2023/10/26 22:11:59 - mmengine - INFO - Iter(train) [ 53500/640000] base_lr: 1.9661e-04 lr: 1.9691e-05 eta: 7 days, 14:02:48 time: 1.1167 data_time: 0.0348 memory: 21517 grad_norm: 2.6355 loss: 1.6622 caption_loss_cls: 2.7084 grounding_loss_reg: 3.7237 detection_loss_cls: 0.0552 detection_loss_reg: 0.3966 semantic_segmentation_loss_cls: 0.0150 instance_segmentation_loss_cls: 0.0579 instance_segmentation_loss_reg: 0.4010 instance_segmentation_loss_poly: 1.0822 +2023/10/26 22:21:18 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231026_050054 +2023/10/26 22:21:18 - mmengine - INFO - Iter(train) [ 54000/640000] base_lr: 1.9654e-04 lr: 1.9686e-05 eta: 7 days, 13:53:33 time: 1.1154 data_time: 0.0348 memory: 21517 grad_norm: 2.6163 loss: 1.6598 caption_loss_cls: 2.7100 grounding_loss_reg: 3.7184 detection_loss_cls: 0.0551 detection_loss_reg: 0.3972 semantic_segmentation_loss_cls: 0.0150 instance_segmentation_loss_cls: 0.0577 instance_segmentation_loss_reg: 0.4002 instance_segmentation_loss_poly: 1.0805 +2023/10/26 22:21:18 - mmengine - INFO - Saving checkpoint at 54000 iterations +2023/10/26 22:30:20 - mmengine - INFO - Iter(train) [ 54500/640000] base_lr: 1.9648e-04 lr: 1.9680e-05 eta: 7 days, 13:41:13 time: 1.1103 data_time: 0.0345 memory: 21517 grad_norm: 2.6288 loss: 1.6549 caption_loss_cls: 2.7080 grounding_loss_reg: 3.7110 detection_loss_cls: 0.0550 detection_loss_reg: 0.3971 semantic_segmentation_loss_cls: 0.0149 instance_segmentation_loss_cls: 0.0577 instance_segmentation_loss_reg: 0.4005 instance_segmentation_loss_poly: 1.0813 +2023/10/26 22:39:37 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231026_050054 +2023/10/26 22:39:37 - mmengine - INFO - Iter(train) [ 55000/640000] base_lr: 1.9641e-04 lr: 1.9674e-05 eta: 7 days, 13:31:35 time: 1.1151 data_time: 0.0348 memory: 21517 grad_norm: 2.6158 loss: 1.6586 caption_loss_cls: 2.7039 grounding_loss_reg: 3.7049 detection_loss_cls: 0.0548 detection_loss_reg: 0.3971 semantic_segmentation_loss_cls: 0.0149 instance_segmentation_loss_cls: 0.0576 instance_segmentation_loss_reg: 0.4013 instance_segmentation_loss_poly: 1.0826 +2023/10/26 22:39:37 - mmengine - INFO - Saving checkpoint at 55000 iterations +2023/10/26 22:48:46 - mmengine - INFO - Iter(train) [ 55500/640000] base_lr: 1.9635e-04 lr: 1.9668e-05 eta: 7 days, 13:20:31 time: 1.1107 data_time: 0.0348 memory: 21517 grad_norm: 2.6327 loss: 1.6704 caption_loss_cls: 2.7029 grounding_loss_reg: 3.6989 detection_loss_cls: 0.0548 detection_loss_reg: 0.3970 semantic_segmentation_loss_cls: 0.0148 instance_segmentation_loss_cls: 0.0575 instance_segmentation_loss_reg: 0.4009 instance_segmentation_loss_poly: 1.0810 +2023/10/26 22:57:51 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231026_050054 +2023/10/26 22:57:51 - mmengine - INFO - Iter(train) [ 56000/640000] base_lr: 1.9628e-04 lr: 1.9662e-05 eta: 7 days, 13:08:55 time: 1.1075 data_time: 0.0369 memory: 21517 grad_norm: 2.6663 loss: 1.6805 caption_loss_cls: 2.7020 grounding_loss_reg: 3.6946 detection_loss_cls: 0.0548 detection_loss_reg: 0.3975 semantic_segmentation_loss_cls: 0.0148 instance_segmentation_loss_cls: 0.0575 instance_segmentation_loss_reg: 0.4013 instance_segmentation_loss_poly: 1.0820 +2023/10/26 22:57:51 - mmengine - INFO - Saving checkpoint at 56000 iterations +2023/10/26 23:07:21 - mmengine - INFO - Iter(train) [ 56500/640000] base_lr: 1.9622e-04 lr: 1.9656e-05 eta: 7 days, 13:01:33 time: 1.1174 data_time: 0.0371 memory: 21517 grad_norm: 2.6285 loss: 1.6653 caption_loss_cls: 2.7014 grounding_loss_reg: 3.6880 detection_loss_cls: 0.0547 detection_loss_reg: 0.3976 semantic_segmentation_loss_cls: 0.0147 instance_segmentation_loss_cls: 0.0575 instance_segmentation_loss_reg: 0.4006 instance_segmentation_loss_poly: 1.0802 +2023/10/26 23:16:25 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231026_050054 +2023/10/26 23:16:25 - mmengine - INFO - Iter(train) [ 57000/640000] base_lr: 1.9615e-04 lr: 1.9650e-05 eta: 7 days, 12:49:49 time: 1.1058 data_time: 0.0368 memory: 21517 grad_norm: 2.6751 loss: 1.6888 caption_loss_cls: 2.6978 grounding_loss_reg: 3.6823 detection_loss_cls: 0.0546 detection_loss_reg: 0.3976 semantic_segmentation_loss_cls: 0.0147 instance_segmentation_loss_cls: 0.0575 instance_segmentation_loss_reg: 0.4016 instance_segmentation_loss_poly: 1.0817 +2023/10/26 23:16:25 - mmengine - INFO - Saving checkpoint at 57000 iterations +2023/10/26 23:25:36 - mmengine - INFO - Iter(train) [ 57500/640000] base_lr: 1.9608e-04 lr: 1.9644e-05 eta: 7 days, 12:39:20 time: 1.1041 data_time: 0.0367 memory: 21517 grad_norm: 2.6638 loss: 1.6802 caption_loss_cls: 2.6928 grounding_loss_reg: 3.6787 detection_loss_cls: 0.0544 detection_loss_reg: 0.3965 semantic_segmentation_loss_cls: 0.0147 instance_segmentation_loss_cls: 0.0576 instance_segmentation_loss_reg: 0.4024 instance_segmentation_loss_poly: 1.0835 +2023/10/26 23:34:37 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231026_050054 +2023/10/26 23:34:37 - mmengine - INFO - Iter(train) [ 58000/640000] base_lr: 1.9601e-04 lr: 1.9638e-05 eta: 7 days, 12:27:03 time: 1.0995 data_time: 0.0365 memory: 21517 grad_norm: 2.6927 loss: 1.6807 caption_loss_cls: 2.6888 grounding_loss_reg: 3.6688 detection_loss_cls: 0.0545 detection_loss_reg: 0.3977 semantic_segmentation_loss_cls: 0.0146 instance_segmentation_loss_cls: 0.0575 instance_segmentation_loss_reg: 0.4019 instance_segmentation_loss_poly: 1.0814 +2023/10/26 23:34:37 - mmengine - INFO - Saving checkpoint at 58000 iterations +2023/10/26 23:44:35 - mmengine - INFO - Iter(train) [ 58500/640000] base_lr: 1.9595e-04 lr: 1.9631e-05 eta: 7 days, 12:24:22 time: 1.1135 data_time: 0.0372 memory: 21517 grad_norm: 2.6599 loss: 1.6771 caption_loss_cls: 2.6850 grounding_loss_reg: 3.6650 detection_loss_cls: 0.0546 detection_loss_reg: 0.3990 semantic_segmentation_loss_cls: 0.0146 instance_segmentation_loss_cls: 0.0574 instance_segmentation_loss_reg: 0.4024 instance_segmentation_loss_poly: 1.0826 +2023/10/26 23:53:52 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231026_050054 +2023/10/26 23:53:52 - mmengine - INFO - Iter(train) [ 59000/640000] base_lr: 1.9588e-04 lr: 1.9625e-05 eta: 7 days, 12:14:51 time: 1.1137 data_time: 0.0372 memory: 21517 grad_norm: 2.6576 loss: 1.6746 caption_loss_cls: 2.6894 grounding_loss_reg: 3.6573 detection_loss_cls: 0.0545 detection_loss_reg: 0.3982 semantic_segmentation_loss_cls: 0.0146 instance_segmentation_loss_cls: 0.0573 instance_segmentation_loss_reg: 0.4030 instance_segmentation_loss_poly: 1.0831 +2023/10/26 23:53:52 - mmengine - INFO - Saving checkpoint at 59000 iterations +2023/10/27 00:03:24 - mmengine - INFO - Iter(train) [ 59500/640000] base_lr: 1.9581e-04 lr: 1.9619e-05 eta: 7 days, 12:07:45 time: 1.1195 data_time: 0.0374 memory: 21517 grad_norm: 2.6430 loss: 1.6668 caption_loss_cls: 2.6867 grounding_loss_reg: 3.6492 detection_loss_cls: 0.0545 detection_loss_reg: 0.3989 semantic_segmentation_loss_cls: 0.0146 instance_segmentation_loss_cls: 0.0573 instance_segmentation_loss_reg: 0.4030 instance_segmentation_loss_poly: 1.0835 +2023/10/27 00:12:41 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231026_050054 +2023/10/27 00:12:41 - mmengine - INFO - Iter(train) [ 60000/640000] base_lr: 1.9574e-04 lr: 1.9612e-05 eta: 7 days, 11:58:11 time: 1.1224 data_time: 0.0352 memory: 21517 grad_norm: 2.6128 loss: 1.6516 caption_loss_cls: 2.6877 grounding_loss_reg: 3.6449 detection_loss_cls: 0.0543 detection_loss_reg: 0.3993 semantic_segmentation_loss_cls: 0.0145 instance_segmentation_loss_cls: 0.0571 instance_segmentation_loss_reg: 0.4019 instance_segmentation_loss_poly: 1.0811 +2023/10/27 00:12:41 - mmengine - INFO - Saving checkpoint at 60000 iterations +2023/10/27 00:21:35 - mmengine - INFO - Evaluating bbox... +2023/10/27 00:22:30 - mmengine - INFO - bbox_mAP_copypaste: 0.304 0.468 0.325 0.182 0.363 0.392 +2023/10/27 00:22:30 - mmengine - INFO - Evaluating segm... +2023/10/27 00:23:40 - mmengine - INFO - segm_mAP_copypaste: 0.191 0.379 0.175 0.078 0.234 0.307 +2023/10/27 00:29:13 - mmengine - INFO - per class results: +2023/10/27 00:29:13 - mmengine - INFO - ++---------------------+-------+-------+ +| Class | IoU | Acc | ++---------------------+-------+-------+ +| wall | 72.68 | 85.29 | +| building | 80.21 | 90.36 | +| sky | 91.8 | 97.93 | +| floor | 78.88 | 87.67 | +| tree | 68.39 | 84.72 | +| ceiling | 78.58 | 94.06 | +| road | 77.97 | 86.54 | +| bed | 83.38 | 93.24 | +| windowpane | 53.28 | 63.53 | +| grass | 60.81 | 71.56 | +| cabinet | 53.84 | 65.57 | +| sidewalk | 58.6 | 82.21 | +| person | 76.05 | 89.91 | +| earth | 24.84 | 28.97 | +| door | 37.98 | 45.18 | +| table | 47.1 | 72.02 | +| mountain | 46.73 | 53.79 | +| plant | 48.17 | 61.06 | +| curtain | 63.71 | 86.3 | +| chair | 43.62 | 55.49 | +| car | 79.84 | 90.98 | +| water | 29.63 | 33.58 | +| painting | 63.29 | 81.58 | +| sofa | 57.61 | 78.57 | +| shelf | 33.8 | 51.78 | +| house | 35.52 | 44.61 | +| sea | 51.71 | 88.24 | +| mirror | 45.4 | 75.26 | +| rug | 50.27 | 53.65 | +| field | 23.97 | 59.21 | +| armchair | 29.71 | 46.72 | +| seat | 55.42 | 64.8 | +| fence | 33.2 | 41.72 | +| desk | 34.48 | 50.1 | +| rock | 44.41 | 71.23 | +| wardrobe | 45.42 | 73.25 | +| lamp | 48.73 | 71.63 | +| bathtub | 58.4 | 85.06 | +| railing | 25.93 | 33.63 | +| cushion | 41.78 | 52.04 | +| base | 17.89 | 23.25 | +| box | 17.61 | 21.52 | +| column | 46.07 | 62.95 | +| signboard | 31.62 | 43.93 | +| chest of drawers | 38.78 | 58.76 | +| counter | 19.3 | 21.24 | +| sand | 27.97 | 42.69 | +| sink | 53.04 | 66.46 | +| skyscraper | 27.62 | 29.18 | +| fireplace | 56.02 | 70.04 | +| refrigerator | 58.35 | 83.22 | +| grandstand | 30.53 | 63.79 | +| path | 17.26 | 48.69 | +| stairs | 32.24 | 44.32 | +| runway | 75.41 | 93.87 | +| case | 36.92 | 54.6 | +| pool table | 87.43 | 94.27 | +| pillow | 48.4 | 67.97 | +| screen door | 58.48 | 71.82 | +| stairway | 20.13 | 21.87 | +| river | 11.08 | 13.86 | +| bridge | 27.91 | 86.71 | +| bookcase | 29.85 | 56.29 | +| blind | 27.99 | 41.1 | +| coffee table | 53.62 | 76.44 | +| toilet | 75.84 | 84.06 | +| flower | 28.55 | 42.19 | +| book | 37.64 | 68.7 | +| hill | 7.17 | 13.26 | +| bench | 32.5 | 49.38 | +| countertop | 44.58 | 51.91 | +| stove | 56.9 | 63.44 | +| palm | 38.42 | 47.91 | +| kitchen island | 27.77 | 48.38 | +| computer | 65.97 | 84.23 | +| swivel chair | 33.86 | 63.47 | +| boat | 37.73 | 50.44 | +| bar | 22.51 | 28.79 | +| arcade machine | 34.25 | 37.12 | +| hovel | 34.13 | 71.95 | +| bus | 69.39 | 94.13 | +| towel | 43.39 | 67.85 | +| light | 37.71 | 45.55 | +| truck | 27.11 | 41.94 | +| tower | 29.59 | 43.67 | +| chandelier | 44.74 | 52.5 | +| awning | 14.92 | 17.53 | +| streetlight | 19.4 | 25.55 | +| booth | 28.01 | 56.89 | +| television receiver | 55.31 | 78.18 | +| airplane | 53.39 | 61.42 | +| dirt track | 2.31 | 4.84 | +| apparel | 16.99 | 28.54 | +| pole | 16.74 | 47.24 | +| land | 0.0 | 0.0 | +| bannister | 3.07 | 4.36 | +| escalator | 0.72 | 0.73 | +| ottoman | 36.18 | 58.83 | +| bottle | 18.89 | 24.04 | +| buffet | 41.04 | 54.7 | +| poster | 14.74 | 17.11 | +| stage | 8.74 | 20.02 | +| van | 29.41 | 43.35 | +| ship | 54.43 | 95.31 | +| fountain | 14.64 | 18.74 | +| conveyer belt | 46.46 | 72.6 | +| canopy | 17.94 | 43.67 | +| washer | 49.72 | 54.02 | +| plaything | 16.9 | 22.91 | +| swimming pool | 31.55 | 37.13 | +| stool | 33.75 | 46.38 | +| barrel | 5.82 | 62.95 | +| basket | 16.58 | 20.55 | +| waterfall | 69.97 | 84.73 | +| tent | 29.83 | 30.83 | +| bag | 13.44 | 16.55 | +| minibike | 68.03 | 77.75 | +| cradle | 65.47 | 84.89 | +| oven | 28.9 | 36.81 | +| ball | 40.3 | 56.12 | +| food | 42.88 | 49.83 | +| step | 10.42 | 12.21 | +| tank | 23.2 | 27.48 | +| trade name | 1.18 | 1.19 | +| microwave | 36.72 | 44.63 | +| pot | 38.75 | 46.77 | +| animal | 54.15 | 56.96 | +| bicycle | 50.92 | 63.23 | +| lake | 14.26 | 66.88 | +| dishwasher | 44.08 | 60.25 | +| screen | 70.5 | 77.04 | +| blanket | 0.23 | 0.24 | +| sculpture | 39.06 | 53.08 | +| hood | 45.56 | 58.37 | +| sconce | 11.89 | 13.61 | +| vase | 28.69 | 37.49 | +| traffic light | 23.51 | 39.94 | +| tray | 3.87 | 4.97 | +| ashcan | 25.48 | 31.36 | +| fan | 38.02 | 47.34 | +| pier | 22.05 | 24.25 | +| crt screen | 8.96 | 9.78 | +| plate | 43.83 | 54.69 | +| monitor | 4.28 | 4.64 | +| bulletin board | 19.21 | 46.31 | +| shower | 0.0 | 0.0 | +| radiator | 36.32 | 42.31 | +| glass | 10.76 | 11.59 | +| clock | 19.63 | 23.92 | +| flag | 30.61 | 38.23 | ++---------------------+-------+-------+ +2023/10/27 00:29:36 - mmengine - INFO - Iter(val) [209/209] coco/bbox_mAP: 0.3040 coco/bbox_mAP_50: 0.4680 coco/bbox_mAP_75: 0.3250 coco/bbox_mAP_s: 0.1820 coco/bbox_mAP_m: 0.3630 coco/bbox_mAP_l: 0.3920 coco/segm_mAP: 0.1910 coco/segm_mAP_50: 0.3790 coco/segm_mAP_75: 0.1750 coco/segm_mAP_s: 0.0780 coco/segm_mAP_m: 0.2340 coco/segm_mAP_l: 0.3070 Bleu_1: 0.6767 Bleu_2: 0.4929 Bleu_3: 0.3499 Bleu_4: 0.2471 METEOR: 0.2288 ROUGE_L: 0.4960 CIDEr: 0.7871 SPICE: 0.1596 aAcc: 78.3000 mIoU: 37.8600 mAcc: 51.3800 visual-grounding/miou: 0.6562 visual-grounding/acc: 0.7413 data_time: 0.0195 time: 0.5361 +2023/10/27 00:39:07 - mmengine - INFO - Iter(train) [ 60500/640000] base_lr: 1.9567e-04 lr: 1.9606e-05 eta: 7 days, 11:51:50 time: 1.1243 data_time: 0.0349 memory: 21517 grad_norm: 2.6280 loss: 1.6528 caption_loss_cls: 2.6802 grounding_loss_reg: 3.6387 detection_loss_cls: 0.0543 detection_loss_reg: 0.3998 semantic_segmentation_loss_cls: 0.0145 instance_segmentation_loss_cls: 0.0571 instance_segmentation_loss_reg: 0.4018 instance_segmentation_loss_poly: 1.0802 +2023/10/27 00:48:40 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231026_050054 +2023/10/27 00:48:40 - mmengine - INFO - Iter(train) [ 61000/640000] base_lr: 1.9560e-04 lr: 1.9600e-05 eta: 7 days, 11:44:51 time: 1.1316 data_time: 0.0353 memory: 21517 grad_norm: 2.6011 loss: 1.6307 caption_loss_cls: 2.6769 grounding_loss_reg: 3.6300 detection_loss_cls: 0.0542 detection_loss_reg: 0.3994 semantic_segmentation_loss_cls: 0.0145 instance_segmentation_loss_cls: 0.0570 instance_segmentation_loss_reg: 0.4020 instance_segmentation_loss_poly: 1.0794 +2023/10/27 00:48:40 - mmengine - INFO - Saving checkpoint at 61000 iterations +2023/10/27 00:58:27 - mmengine - INFO - Iter(train) [ 61500/640000] base_lr: 1.9552e-04 lr: 1.9593e-05 eta: 7 days, 11:39:49 time: 1.1403 data_time: 0.0358 memory: 21517 grad_norm: 2.5929 loss: 1.6290 caption_loss_cls: 2.6718 grounding_loss_reg: 3.6256 detection_loss_cls: 0.0539 detection_loss_reg: 0.3983 semantic_segmentation_loss_cls: 0.0144 instance_segmentation_loss_cls: 0.0568 instance_segmentation_loss_reg: 0.4019 instance_segmentation_loss_poly: 1.0790 +2023/10/27 01:07:12 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231026_050054 +2023/10/27 01:07:12 - mmengine - INFO - Iter(train) [ 62000/640000] base_lr: 1.9545e-04 lr: 1.9586e-05 eta: 7 days, 11:25:19 time: 1.1366 data_time: 0.0357 memory: 21517 grad_norm: 2.5570 loss: 1.6246 caption_loss_cls: 2.6694 grounding_loss_reg: 3.6184 detection_loss_cls: 0.0541 detection_loss_reg: 0.3992 semantic_segmentation_loss_cls: 0.0144 instance_segmentation_loss_cls: 0.0567 instance_segmentation_loss_reg: 0.4013 instance_segmentation_loss_poly: 1.0778 +2023/10/27 01:07:12 - mmengine - INFO - Saving checkpoint at 62000 iterations +2023/10/27 01:16:33 - mmengine - INFO - Iter(train) [ 62500/640000] base_lr: 1.9538e-04 lr: 1.9580e-05 eta: 7 days, 11:16:21 time: 1.1273 data_time: 0.0352 memory: 21517 grad_norm: 2.5759 loss: 1.6224 caption_loss_cls: 2.6626 grounding_loss_reg: 3.6111 detection_loss_cls: 0.0539 detection_loss_reg: 0.3986 semantic_segmentation_loss_cls: 0.0143 instance_segmentation_loss_cls: 0.0564 instance_segmentation_loss_reg: 0.4005 instance_segmentation_loss_poly: 1.0769 +2023/10/27 01:26:21 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231026_050054 +2023/10/27 01:26:21 - mmengine - INFO - Iter(train) [ 63000/640000] base_lr: 1.9530e-04 lr: 1.9573e-05 eta: 7 days, 11:11:29 time: 1.1350 data_time: 0.0387 memory: 21517 grad_norm: 2.5815 loss: 1.6162 caption_loss_cls: 2.6583 grounding_loss_reg: 3.6061 detection_loss_cls: 0.0537 detection_loss_reg: 0.3977 semantic_segmentation_loss_cls: 0.0143 instance_segmentation_loss_cls: 0.0564 instance_segmentation_loss_reg: 0.4011 instance_segmentation_loss_poly: 1.0779 +2023/10/27 01:26:21 - mmengine - INFO - Saving checkpoint at 63000 iterations +2023/10/27 01:35:54 - mmengine - INFO - Iter(train) [ 63500/640000] base_lr: 1.9523e-04 lr: 1.9566e-05 eta: 7 days, 11:04:17 time: 1.1353 data_time: 0.0390 memory: 21517 grad_norm: 2.5978 loss: 1.6211 caption_loss_cls: 2.6559 grounding_loss_reg: 3.6022 detection_loss_cls: 0.0535 detection_loss_reg: 0.3962 semantic_segmentation_loss_cls: 0.0143 instance_segmentation_loss_cls: 0.0561 instance_segmentation_loss_reg: 0.4002 instance_segmentation_loss_poly: 1.0761 +2023/10/27 01:45:26 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231026_050054 +2023/10/27 01:45:26 - mmengine - INFO - Iter(train) [ 64000/640000] base_lr: 1.9515e-04 lr: 1.9560e-05 eta: 7 days, 10:56:50 time: 1.1389 data_time: 0.0392 memory: 21517 grad_norm: 2.5958 loss: 1.6141 caption_loss_cls: 2.6500 grounding_loss_reg: 3.5978 detection_loss_cls: 0.0534 detection_loss_reg: 0.3968 semantic_segmentation_loss_cls: 0.0143 instance_segmentation_loss_cls: 0.0558 instance_segmentation_loss_reg: 0.3976 instance_segmentation_loss_poly: 1.0700 +2023/10/27 01:45:26 - mmengine - INFO - Saving checkpoint at 64000 iterations +2023/10/27 01:54:58 - mmengine - INFO - Iter(train) [ 64500/640000] base_lr: 1.9508e-04 lr: 1.9553e-05 eta: 7 days, 10:49:27 time: 1.1377 data_time: 0.0395 memory: 21517 grad_norm: 2.5730 loss: 1.6009 caption_loss_cls: 2.6484 grounding_loss_reg: 3.5945 detection_loss_cls: 0.0532 detection_loss_reg: 0.3962 semantic_segmentation_loss_cls: 0.0142 instance_segmentation_loss_cls: 0.0558 instance_segmentation_loss_reg: 0.3976 instance_segmentation_loss_poly: 1.0702 +2023/10/27 02:04:20 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231026_050054 +2023/10/27 02:04:20 - mmengine - INFO - Iter(train) [ 65000/640000] base_lr: 1.9500e-04 lr: 1.9546e-05 eta: 7 days, 10:40:25 time: 1.1347 data_time: 0.0393 memory: 21517 grad_norm: 2.5849 loss: 1.6053 caption_loss_cls: 2.6470 grounding_loss_reg: 3.5901 detection_loss_cls: 0.0529 detection_loss_reg: 0.3946 semantic_segmentation_loss_cls: 0.0142 instance_segmentation_loss_cls: 0.0556 instance_segmentation_loss_reg: 0.3965 instance_segmentation_loss_poly: 1.0677 +2023/10/27 02:04:20 - mmengine - INFO - Saving checkpoint at 65000 iterations +2023/10/27 02:13:53 - mmengine - INFO - Iter(train) [ 65500/640000] base_lr: 1.9493e-04 lr: 1.9539e-05 eta: 7 days, 10:33:05 time: 1.1314 data_time: 0.0390 memory: 21517 grad_norm: 2.5805 loss: 1.5973 caption_loss_cls: 2.6430 grounding_loss_reg: 3.5870 detection_loss_cls: 0.0528 detection_loss_reg: 0.3938 semantic_segmentation_loss_cls: 0.0142 instance_segmentation_loss_cls: 0.0554 instance_segmentation_loss_reg: 0.3957 instance_segmentation_loss_poly: 1.0657 +2023/10/27 02:23:04 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231026_050054 +2023/10/27 02:23:04 - mmengine - INFO - Iter(train) [ 66000/640000] base_lr: 1.9485e-04 lr: 1.9532e-05 eta: 7 days, 10:22:33 time: 1.1377 data_time: 0.0391 memory: 21517 grad_norm: 2.5711 loss: 1.5842 caption_loss_cls: 2.6397 grounding_loss_reg: 3.5824 detection_loss_cls: 0.0527 detection_loss_reg: 0.3923 semantic_segmentation_loss_cls: 0.0141 instance_segmentation_loss_cls: 0.0552 instance_segmentation_loss_reg: 0.3948 instance_segmentation_loss_poly: 1.0639 +2023/10/27 02:23:04 - mmengine - INFO - Saving checkpoint at 66000 iterations +2023/10/27 02:32:18 - mmengine - INFO - Iter(train) [ 66500/640000] base_lr: 1.9477e-04 lr: 1.9525e-05 eta: 7 days, 10:12:27 time: 1.1360 data_time: 0.0390 memory: 21517 grad_norm: 2.5698 loss: 1.5817 caption_loss_cls: 2.6344 grounding_loss_reg: 3.5782 detection_loss_cls: 0.0526 detection_loss_reg: 0.3920 semantic_segmentation_loss_cls: 0.0141 instance_segmentation_loss_cls: 0.0550 instance_segmentation_loss_reg: 0.3941 instance_segmentation_loss_poly: 1.0616 +2023/10/27 02:41:29 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231026_050054 +2023/10/27 02:41:29 - mmengine - INFO - Iter(train) [ 67000/640000] base_lr: 1.9469e-04 lr: 1.9518e-05 eta: 7 days, 10:01:59 time: 1.1268 data_time: 0.0354 memory: 21517 grad_norm: 2.5497 loss: 1.5742 caption_loss_cls: 2.6306 grounding_loss_reg: 3.5743 detection_loss_cls: 0.0523 detection_loss_reg: 0.3912 semantic_segmentation_loss_cls: 0.0141 instance_segmentation_loss_cls: 0.0550 instance_segmentation_loss_reg: 0.3945 instance_segmentation_loss_poly: 1.0626 +2023/10/27 02:41:29 - mmengine - INFO - Saving checkpoint at 67000 iterations +2023/10/27 02:51:05 - mmengine - INFO - Iter(train) [ 67500/640000] base_lr: 1.9462e-04 lr: 1.9510e-05 eta: 7 days, 9:54:57 time: 1.1274 data_time: 0.0352 memory: 21517 grad_norm: 2.5455 loss: 1.5690 caption_loss_cls: 2.6235 grounding_loss_reg: 3.5695 detection_loss_cls: 0.0522 detection_loss_reg: 0.3904 semantic_segmentation_loss_cls: 0.0141 instance_segmentation_loss_cls: 0.0549 instance_segmentation_loss_reg: 0.3940 instance_segmentation_loss_poly: 1.0624 +2023/10/27 03:00:25 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231026_050054 +2023/10/27 03:00:25 - mmengine - INFO - Iter(train) [ 68000/640000] base_lr: 1.9454e-04 lr: 1.9503e-05 eta: 7 days, 9:45:40 time: 1.1245 data_time: 0.0351 memory: 21517 grad_norm: 2.5359 loss: 1.5635 caption_loss_cls: 2.6240 grounding_loss_reg: 3.5646 detection_loss_cls: 0.0521 detection_loss_reg: 0.3898 semantic_segmentation_loss_cls: 0.0141 instance_segmentation_loss_cls: 0.0547 instance_segmentation_loss_reg: 0.3937 instance_segmentation_loss_poly: 1.0616 +2023/10/27 03:00:25 - mmengine - INFO - Saving checkpoint at 68000 iterations +2023/10/27 03:09:58 - mmengine - INFO - Iter(train) [ 68500/640000] base_lr: 1.9446e-04 lr: 1.9496e-05 eta: 7 days, 9:38:17 time: 1.1248 data_time: 0.0353 memory: 21517 grad_norm: 2.5677 loss: 1.5834 caption_loss_cls: 2.6190 grounding_loss_reg: 3.5594 detection_loss_cls: 0.0520 detection_loss_reg: 0.3897 semantic_segmentation_loss_cls: 0.0140 instance_segmentation_loss_cls: 0.0548 instance_segmentation_loss_reg: 0.3947 instance_segmentation_loss_poly: 1.0632 +2023/10/27 03:19:29 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231026_050054 +2023/10/27 03:19:29 - mmengine - INFO - Iter(train) [ 69000/640000] base_lr: 1.9438e-04 lr: 1.9489e-05 eta: 7 days, 9:30:29 time: 1.1271 data_time: 0.0351 memory: 21517 grad_norm: 2.5355 loss: 1.5658 caption_loss_cls: 2.6147 grounding_loss_reg: 3.5532 detection_loss_cls: 0.0519 detection_loss_reg: 0.3903 semantic_segmentation_loss_cls: 0.0140 instance_segmentation_loss_cls: 0.0547 instance_segmentation_loss_reg: 0.3936 instance_segmentation_loss_poly: 1.0607 +2023/10/27 03:19:29 - mmengine - INFO - Saving checkpoint at 69000 iterations +2023/10/27 03:28:58 - mmengine - INFO - Iter(train) [ 69500/640000] base_lr: 1.9429e-04 lr: 1.9481e-05 eta: 7 days, 9:22:28 time: 1.1261 data_time: 0.0351 memory: 21517 grad_norm: 2.5451 loss: 1.5746 caption_loss_cls: 2.6127 grounding_loss_reg: 3.5503 detection_loss_cls: 0.0518 detection_loss_reg: 0.3893 semantic_segmentation_loss_cls: 0.0139 instance_segmentation_loss_cls: 0.0546 instance_segmentation_loss_reg: 0.3938 instance_segmentation_loss_poly: 1.0607 +2023/10/27 03:38:27 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231026_050054 +2023/10/27 03:38:27 - mmengine - INFO - Iter(train) [ 70000/640000] base_lr: 1.9421e-04 lr: 1.9474e-05 eta: 7 days, 9:14:22 time: 1.1305 data_time: 0.0355 memory: 21517 grad_norm: 2.5507 loss: 1.5816 caption_loss_cls: 2.6092 grounding_loss_reg: 3.5478 detection_loss_cls: 0.0519 detection_loss_reg: 0.3899 semantic_segmentation_loss_cls: 0.0139 instance_segmentation_loss_cls: 0.0548 instance_segmentation_loss_reg: 0.3946 instance_segmentation_loss_poly: 1.0620 +2023/10/27 03:38:27 - mmengine - INFO - Saving checkpoint at 70000 iterations +2023/10/27 03:47:26 - mmengine - INFO - Iter(train) [ 70500/640000] base_lr: 1.9413e-04 lr: 1.9466e-05 eta: 7 days, 9:02:17 time: 1.1268 data_time: 0.0354 memory: 21517 grad_norm: 2.5676 loss: 1.5902 caption_loss_cls: 2.6065 grounding_loss_reg: 3.5462 detection_loss_cls: 0.0519 detection_loss_reg: 0.3897 semantic_segmentation_loss_cls: 0.0139 instance_segmentation_loss_cls: 0.0545 instance_segmentation_loss_reg: 0.3930 instance_segmentation_loss_poly: 1.0589 +2023/10/27 03:56:51 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231026_050054 +2023/10/27 03:56:51 - mmengine - INFO - Iter(train) [ 71000/640000] base_lr: 1.9405e-04 lr: 1.9459e-05 eta: 7 days, 8:53:42 time: 1.1303 data_time: 0.0354 memory: 21517 grad_norm: 2.5861 loss: 1.5915 caption_loss_cls: 2.6024 grounding_loss_reg: 3.5437 detection_loss_cls: 0.0519 detection_loss_reg: 0.3903 semantic_segmentation_loss_cls: 0.0139 instance_segmentation_loss_cls: 0.0544 instance_segmentation_loss_reg: 0.3918 instance_segmentation_loss_poly: 1.0558 +2023/10/27 03:56:51 - mmengine - INFO - Saving checkpoint at 71000 iterations +2023/10/27 04:06:43 - mmengine - INFO - Iter(train) [ 71500/640000] base_lr: 1.9396e-04 lr: 1.9451e-05 eta: 7 days, 8:48:38 time: 1.1344 data_time: 0.0411 memory: 21517 grad_norm: 2.5689 loss: 1.5869 caption_loss_cls: 2.6027 grounding_loss_reg: 3.5383 detection_loss_cls: 0.0518 detection_loss_reg: 0.3899 semantic_segmentation_loss_cls: 0.0138 instance_segmentation_loss_cls: 0.0544 instance_segmentation_loss_reg: 0.3923 instance_segmentation_loss_poly: 1.0564 +2023/10/27 04:15:41 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231026_050054 +2023/10/27 04:15:41 - mmengine - INFO - Iter(train) [ 72000/640000] base_lr: 1.9388e-04 lr: 1.9444e-05 eta: 7 days, 8:36:29 time: 1.1291 data_time: 0.0411 memory: 21517 grad_norm: 2.5691 loss: 1.5931 caption_loss_cls: 2.6034 grounding_loss_reg: 3.5336 detection_loss_cls: 0.0516 detection_loss_reg: 0.3884 semantic_segmentation_loss_cls: 0.0138 instance_segmentation_loss_cls: 0.0547 instance_segmentation_loss_reg: 0.3941 instance_segmentation_loss_poly: 1.0596 +2023/10/27 04:15:41 - mmengine - INFO - Saving checkpoint at 72000 iterations +2023/10/27 04:25:08 - mmengine - INFO - Iter(train) [ 72500/640000] base_lr: 1.9380e-04 lr: 1.9436e-05 eta: 7 days, 8:28:07 time: 1.1275 data_time: 0.0412 memory: 21517 grad_norm: 2.5628 loss: 1.5893 caption_loss_cls: 2.6048 grounding_loss_reg: 3.5302 detection_loss_cls: 0.0517 detection_loss_reg: 0.3893 semantic_segmentation_loss_cls: 0.0138 instance_segmentation_loss_cls: 0.0545 instance_segmentation_loss_reg: 0.3926 instance_segmentation_loss_poly: 1.0566 +2023/10/27 04:34:35 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231026_050054 +2023/10/27 04:34:35 - mmengine - INFO - Iter(train) [ 73000/640000] base_lr: 1.9371e-04 lr: 1.9428e-05 eta: 7 days, 8:19:36 time: 1.1263 data_time: 0.0413 memory: 21517 grad_norm: 2.5672 loss: 1.6048 caption_loss_cls: 2.6063 grounding_loss_reg: 3.5269 detection_loss_cls: 0.0518 detection_loss_reg: 0.3900 semantic_segmentation_loss_cls: 0.0138 instance_segmentation_loss_cls: 0.0545 instance_segmentation_loss_reg: 0.3931 instance_segmentation_loss_poly: 1.0570 +2023/10/27 04:34:35 - mmengine - INFO - Saving checkpoint at 73000 iterations +2023/10/27 04:44:01 - mmengine - INFO - Iter(train) [ 73500/640000] base_lr: 1.9363e-04 lr: 1.9421e-05 eta: 7 days, 8:11:04 time: 1.1255 data_time: 0.0412 memory: 21517 grad_norm: 2.5480 loss: 1.5896 caption_loss_cls: 2.6015 grounding_loss_reg: 3.5213 detection_loss_cls: 0.0517 detection_loss_reg: 0.3896 semantic_segmentation_loss_cls: 0.0138 instance_segmentation_loss_cls: 0.0545 instance_segmentation_loss_reg: 0.3935 instance_segmentation_loss_poly: 1.0571 +2023/10/27 04:53:24 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231026_050054 +2023/10/27 04:53:24 - mmengine - INFO - Iter(train) [ 74000/640000] base_lr: 1.9354e-04 lr: 1.9413e-05 eta: 7 days, 8:02:12 time: 1.1242 data_time: 0.0411 memory: 21517 grad_norm: 2.5565 loss: 1.5978 caption_loss_cls: 2.6036 grounding_loss_reg: 3.5184 detection_loss_cls: 0.0515 detection_loss_reg: 0.3894 semantic_segmentation_loss_cls: 0.0137 instance_segmentation_loss_cls: 0.0545 instance_segmentation_loss_reg: 0.3941 instance_segmentation_loss_poly: 1.0589 +2023/10/27 04:53:24 - mmengine - INFO - Saving checkpoint at 74000 iterations +2023/10/28 20:39:08 - mmengine - INFO - Iter(train) [ 74500/640000] base_lr: 1.9345e-04 lr: 1.9405e-05 eta: 7 days, 10:52:21 time: 1.1318 data_time: 0.0379 memory: 21521 grad_norm: 2.5391 loss: 1.5888 caption_loss_cls: 2.6012 grounding_loss_reg: 3.5136 detection_loss_cls: 0.0514 detection_loss_reg: 0.3896 semantic_segmentation_loss_cls: 0.0137 instance_segmentation_loss_cls: 0.0542 instance_segmentation_loss_reg: 0.3929 instance_segmentation_loss_poly: 1.0563 +2023/10/28 20:48:12 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231028_202629 +2023/10/28 20:48:12 - mmengine - INFO - Iter(train) [ 75000/640000] base_lr: 1.9337e-04 lr: 1.9397e-05 eta: 7 days, 6:39:22 time: 1.1264 data_time: 0.0375 memory: 21521 grad_norm: 2.5527 loss: 1.5851 caption_loss_cls: 2.5974 grounding_loss_reg: 3.5113 detection_loss_cls: 0.0512 detection_loss_reg: 0.3887 semantic_segmentation_loss_cls: 0.0137 instance_segmentation_loss_cls: 0.0540 instance_segmentation_loss_reg: 0.3916 instance_segmentation_loss_poly: 1.0539 +2023/10/28 20:48:12 - mmengine - INFO - Saving checkpoint at 75000 iterations +2023/10/28 20:57:47 - mmengine - INFO - Iter(train) [ 75500/640000] base_lr: 1.9328e-04 lr: 1.9389e-05 eta: 7 days, 8:26:43 time: 1.1222 data_time: 0.0322 memory: 21521 grad_norm: 2.5480 loss: 1.5731 caption_loss_cls: 2.5965 grounding_loss_reg: 3.5087 detection_loss_cls: 0.0509 detection_loss_reg: 0.3870 semantic_segmentation_loss_cls: 0.0136 instance_segmentation_loss_cls: 0.0538 instance_segmentation_loss_reg: 0.3902 instance_segmentation_loss_poly: 1.0508 +2023/10/28 21:06:32 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231028_202629 +2023/10/28 21:06:32 - mmengine - INFO - Iter(train) [ 76000/640000] base_lr: 1.9319e-04 lr: 1.9381e-05 eta: 7 days, 5:19:03 time: 1.1187 data_time: 0.0317 memory: 21521 grad_norm: 2.5591 loss: 1.5725 caption_loss_cls: 2.5934 grounding_loss_reg: 3.5053 detection_loss_cls: 0.0508 detection_loss_reg: 0.3862 semantic_segmentation_loss_cls: 0.0136 instance_segmentation_loss_cls: 0.0535 instance_segmentation_loss_reg: 0.3904 instance_segmentation_loss_poly: 1.0515 +2023/10/28 21:06:32 - mmengine - INFO - Saving checkpoint at 76000 iterations +2023/10/28 21:16:00 - mmengine - INFO - Iter(train) [ 76500/640000] base_lr: 1.9310e-04 lr: 1.9373e-05 eta: 7 days, 6:05:45 time: 1.1190 data_time: 0.0313 memory: 21521 grad_norm: 2.5290 loss: 1.5566 caption_loss_cls: 2.5872 grounding_loss_reg: 3.5004 detection_loss_cls: 0.0508 detection_loss_reg: 0.3858 semantic_segmentation_loss_cls: 0.0136 instance_segmentation_loss_cls: 0.0531 instance_segmentation_loss_reg: 0.3892 instance_segmentation_loss_poly: 1.0485 +2023/10/28 21:25:22 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231028_202629 +2023/10/28 21:25:22 - mmengine - INFO - Iter(train) [ 77000/640000] base_lr: 1.9301e-04 lr: 1.9365e-05 eta: 7 days, 6:13:37 time: 1.1179 data_time: 0.0310 memory: 21521 grad_norm: 2.5572 loss: 1.5524 caption_loss_cls: 2.5865 grounding_loss_reg: 3.4968 detection_loss_cls: 0.0507 detection_loss_reg: 0.3851 semantic_segmentation_loss_cls: 0.0136 instance_segmentation_loss_cls: 0.0526 instance_segmentation_loss_reg: 0.3866 instance_segmentation_loss_poly: 1.0437 +2023/10/28 21:25:22 - mmengine - INFO - Saving checkpoint at 77000 iterations +2023/10/28 21:35:08 - mmengine - INFO - Iter(train) [ 77500/640000] base_lr: 1.9292e-04 lr: 1.9357e-05 eta: 7 days, 7:24:06 time: 1.1231 data_time: 0.0311 memory: 21521 grad_norm: 2.5595 loss: 1.5568 caption_loss_cls: 2.5869 grounding_loss_reg: 3.4930 detection_loss_cls: 0.0507 detection_loss_reg: 0.3842 semantic_segmentation_loss_cls: 0.0136 instance_segmentation_loss_cls: 0.0525 instance_segmentation_loss_reg: 0.3868 instance_segmentation_loss_poly: 1.0444 +2023/10/28 21:44:29 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231028_202629 +2023/10/28 21:44:29 - mmengine - INFO - Iter(train) [ 78000/640000] base_lr: 1.9283e-04 lr: 1.9348e-05 eta: 7 days, 7:13:45 time: 1.1225 data_time: 0.0308 memory: 21521 grad_norm: 2.5769 loss: 1.5542 caption_loss_cls: 2.5867 grounding_loss_reg: 3.4904 detection_loss_cls: 0.0505 detection_loss_reg: 0.3831 semantic_segmentation_loss_cls: 0.0136 instance_segmentation_loss_cls: 0.0523 instance_segmentation_loss_reg: 0.3860 instance_segmentation_loss_poly: 1.0435 +2023/10/28 21:44:29 - mmengine - INFO - Saving checkpoint at 78000 iterations +2023/10/28 21:54:09 - mmengine - INFO - Iter(train) [ 78500/640000] base_lr: 1.9274e-04 lr: 1.9340e-05 eta: 7 days, 7:42:53 time: 1.1251 data_time: 0.0342 memory: 21521 grad_norm: 2.5855 loss: 1.5590 caption_loss_cls: 2.5821 grounding_loss_reg: 3.4864 detection_loss_cls: 0.0504 detection_loss_reg: 0.3828 semantic_segmentation_loss_cls: 0.0135 instance_segmentation_loss_cls: 0.0521 instance_segmentation_loss_reg: 0.3850 instance_segmentation_loss_poly: 1.0411 +2023/10/28 22:02:17 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231028_202629 +2023/10/28 22:02:17 - mmengine - INFO - Iter(train) [ 79000/640000] base_lr: 1.9265e-04 lr: 1.9332e-05 eta: 7 days, 5:12:56 time: 1.1112 data_time: 0.0339 memory: 21521 grad_norm: 2.6263 loss: 1.5808 caption_loss_cls: 2.5742 grounding_loss_reg: 3.4839 detection_loss_cls: 0.0503 detection_loss_reg: 0.3823 semantic_segmentation_loss_cls: 0.0135 instance_segmentation_loss_cls: 0.0520 instance_segmentation_loss_reg: 0.3847 instance_segmentation_loss_poly: 1.0401 +2023/10/28 22:02:17 - mmengine - INFO - Saving checkpoint at 79000 iterations +2023/10/28 22:11:55 - mmengine - INFO - Iter(train) [ 79500/640000] base_lr: 1.9256e-04 lr: 1.9323e-05 eta: 7 days, 5:40:22 time: 1.1118 data_time: 0.0333 memory: 21521 grad_norm: 2.6339 loss: 1.5909 caption_loss_cls: 2.5750 grounding_loss_reg: 3.4837 detection_loss_cls: 0.0500 detection_loss_reg: 0.3803 semantic_segmentation_loss_cls: 0.0135 instance_segmentation_loss_cls: 0.0519 instance_segmentation_loss_reg: 0.3843 instance_segmentation_loss_poly: 1.0389 +2023/10/28 22:21:32 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231028_202629 +2023/10/28 22:21:32 - mmengine - INFO - Iter(train) [ 80000/640000] base_lr: 1.9246e-04 lr: 1.9315e-05 eta: 7 days, 6:00:32 time: 1.1248 data_time: 0.0334 memory: 21521 grad_norm: 2.5893 loss: 1.5677 caption_loss_cls: 2.5741 grounding_loss_reg: 3.4821 detection_loss_cls: 0.0501 detection_loss_reg: 0.3809 semantic_segmentation_loss_cls: 0.0135 instance_segmentation_loss_cls: 0.0518 instance_segmentation_loss_reg: 0.3842 instance_segmentation_loss_poly: 1.0377 +2023/10/28 22:21:32 - mmengine - INFO - Saving checkpoint at 80000 iterations +2023/10/28 22:30:06 - mmengine - INFO - Evaluating bbox... +2023/10/28 22:31:02 - mmengine - INFO - bbox_mAP_copypaste: 0.333 0.496 0.364 0.199 0.386 0.437 +2023/10/28 22:31:02 - mmengine - INFO - Evaluating segm... +2023/10/28 22:32:12 - mmengine - INFO - segm_mAP_copypaste: 0.198 0.397 0.178 0.086 0.235 0.321 +2023/10/28 22:37:03 - mmengine - INFO - per class results: +2023/10/28 22:37:03 - mmengine - INFO - ++---------------------+-------+-------+ +| Class | IoU | Acc | ++---------------------+-------+-------+ +| wall | 73.09 | 87.28 | +| building | 79.66 | 92.27 | +| sky | 92.51 | 95.72 | +| floor | 77.64 | 86.07 | +| tree | 69.21 | 82.21 | +| ceiling | 79.42 | 88.4 | +| road | 79.64 | 83.38 | +| bed | 83.78 | 93.1 | +| windowpane | 54.84 | 63.36 | +| grass | 62.81 | 73.18 | +| cabinet | 55.31 | 65.16 | +| sidewalk | 57.48 | 81.93 | +| person | 75.66 | 88.17 | +| earth | 31.78 | 43.08 | +| door | 40.53 | 62.58 | +| table | 51.2 | 70.89 | +| mountain | 51.78 | 73.32 | +| plant | 45.78 | 59.34 | +| curtain | 65.56 | 72.59 | +| chair | 46.96 | 64.62 | +| car | 76.3 | 89.62 | +| water | 50.83 | 68.13 | +| painting | 65.58 | 83.72 | +| sofa | 59.42 | 78.19 | +| shelf | 33.42 | 49.05 | +| house | 40.84 | 57.88 | +| sea | 56.35 | 86.76 | +| mirror | 51.32 | 57.03 | +| rug | 58.03 | 63.36 | +| field | 27.92 | 63.28 | +| armchair | 35.83 | 58.75 | +| seat | 57.03 | 76.05 | +| fence | 32.63 | 58.95 | +| desk | 31.91 | 62.6 | +| rock | 34.07 | 47.83 | +| wardrobe | 42.18 | 49.94 | +| lamp | 45.3 | 55.17 | +| bathtub | 57.2 | 68.15 | +| railing | 25.44 | 32.57 | +| cushion | 30.54 | 33.47 | +| base | 18.35 | 32.04 | +| box | 11.07 | 12.44 | +| column | 35.44 | 76.51 | +| signboard | 29.57 | 35.17 | +| chest of drawers | 36.59 | 55.18 | +| counter | 29.07 | 51.92 | +| sand | 40.26 | 45.09 | +| sink | 52.29 | 78.83 | +| skyscraper | 29.37 | 31.33 | +| fireplace | 49.29 | 85.62 | +| refrigerator | 62.71 | 84.85 | +| grandstand | 43.29 | 49.26 | +| path | 23.73 | 38.69 | +| stairs | 20.68 | 25.21 | +| runway | 80.24 | 85.74 | +| case | 31.16 | 35.87 | +| pool table | 89.58 | 93.41 | +| pillow | 45.97 | 70.05 | +| screen door | 21.32 | 22.79 | +| stairway | 21.64 | 31.65 | +| river | 16.67 | 26.76 | +| bridge | 50.51 | 70.7 | +| bookcase | 24.07 | 65.5 | +| blind | 28.86 | 53.6 | +| coffee table | 56.68 | 76.84 | +| toilet | 76.68 | 88.62 | +| flower | 23.32 | 32.44 | +| book | 31.39 | 39.33 | +| hill | 2.29 | 3.01 | +| bench | 37.1 | 52.29 | +| countertop | 34.49 | 36.22 | +| stove | 54.64 | 81.7 | +| palm | 45.91 | 67.09 | +| kitchen island | 33.61 | 76.46 | +| computer | 62.98 | 83.01 | +| swivel chair | 27.74 | 34.89 | +| boat | 48.29 | 56.19 | +| bar | 31.7 | 45.97 | +| arcade machine | 44.03 | 62.41 | +| hovel | 22.82 | 28.39 | +| bus | 64.88 | 93.49 | +| towel | 48.35 | 61.42 | +| light | 34.17 | 38.46 | +| truck | 23.46 | 59.51 | +| tower | 28.62 | 34.99 | +| chandelier | 56.66 | 80.55 | +| awning | 5.44 | 5.68 | +| streetlight | 18.1 | 24.09 | +| booth | 48.76 | 58.3 | +| television receiver | 56.6 | 60.04 | +| airplane | 56.99 | 64.94 | +| dirt track | 0.0 | 0.0 | +| apparel | 29.44 | 42.77 | +| pole | 7.36 | 8.2 | +| land | 0.03 | 0.03 | +| bannister | 2.45 | 2.73 | +| escalator | 42.23 | 77.37 | +| ottoman | 29.98 | 64.08 | +| bottle | 19.67 | 25.06 | +| buffet | 27.77 | 33.48 | +| poster | 12.48 | 16.94 | +| stage | 12.3 | 21.21 | +| van | 26.17 | 30.15 | +| ship | 46.85 | 97.16 | +| fountain | 9.73 | 10.64 | +| conveyer belt | 74.72 | 83.73 | +| canopy | 23.66 | 45.05 | +| washer | 48.44 | 70.55 | +| plaything | 23.78 | 35.13 | +| swimming pool | 25.35 | 27.82 | +| stool | 34.97 | 46.13 | +| barrel | 4.49 | 59.94 | +| basket | 20.78 | 30.18 | +| waterfall | 26.01 | 27.89 | +| tent | 78.81 | 97.88 | +| bag | 12.02 | 14.27 | +| minibike | 56.14 | 66.04 | +| cradle | 65.49 | 87.82 | +| oven | 19.01 | 30.02 | +| ball | 42.01 | 48.82 | +| food | 49.61 | 65.21 | +| step | 10.69 | 13.13 | +| tank | 38.77 | 41.44 | +| trade name | 24.03 | 28.46 | +| microwave | 34.7 | 37.94 | +| pot | 33.53 | 37.42 | +| animal | 54.71 | 60.79 | +| bicycle | 48.46 | 63.74 | +| lake | 1.4 | 1.73 | +| dishwasher | 22.68 | 23.13 | +| screen | 73.9 | 85.13 | +| blanket | 0.36 | 0.37 | +| sculpture | 25.55 | 37.01 | +| hood | 42.56 | 62.02 | +| sconce | 23.76 | 56.18 | +| vase | 30.96 | 42.97 | +| traffic light | 25.15 | 44.91 | +| tray | 5.55 | 9.06 | +| ashcan | 27.37 | 46.44 | +| fan | 40.2 | 64.01 | +| pier | 35.41 | 61.69 | +| crt screen | 4.48 | 9.01 | +| plate | 42.58 | 53.94 | +| monitor | 9.2 | 11.84 | +| bulletin board | 18.69 | 27.91 | +| shower | 0.32 | 0.37 | +| radiator | 47.31 | 53.19 | +| glass | 3.41 | 3.5 | +| clock | 11.29 | 11.66 | +| flag | 21.45 | 22.21 | ++---------------------+-------+-------+ +2023/10/28 22:37:20 - mmengine - INFO - Iter(val) [209/209] coco/bbox_mAP: 0.3330 coco/bbox_mAP_50: 0.4960 coco/bbox_mAP_75: 0.3640 coco/bbox_mAP_s: 0.1990 coco/bbox_mAP_m: 0.3860 coco/bbox_mAP_l: 0.4370 coco/segm_mAP: 0.1980 coco/segm_mAP_50: 0.3970 coco/segm_mAP_75: 0.1780 coco/segm_mAP_s: 0.0860 coco/segm_mAP_m: 0.2350 coco/segm_mAP_l: 0.3210 Bleu_1: 0.6841 Bleu_2: 0.5007 Bleu_3: 0.3573 Bleu_4: 0.2519 METEOR: 0.2284 ROUGE_L: 0.4991 CIDEr: 0.7897 SPICE: 0.1608 aAcc: 78.8300 mIoU: 38.5600 mAcc: 51.6600 visual-grounding/miou: 0.6834 visual-grounding/acc: 0.7722 data_time: 0.0098 time: 0.5294 +2023/10/28 22:46:44 - mmengine - INFO - Iter(train) [ 80500/640000] base_lr: 1.9237e-04 lr: 1.9306e-05 eta: 7 days, 6:00:07 time: 1.1242 data_time: 0.0307 memory: 21522 grad_norm: 2.6290 loss: 1.5819 caption_loss_cls: 2.5773 grounding_loss_reg: 3.4776 detection_loss_cls: 0.0500 detection_loss_reg: 0.3806 semantic_segmentation_loss_cls: 0.0135 instance_segmentation_loss_cls: 0.0516 instance_segmentation_loss_reg: 0.3841 instance_segmentation_loss_poly: 1.0385 +2023/10/28 22:55:50 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231028_202629 +2023/10/28 22:55:50 - mmengine - INFO - Iter(train) [ 81000/640000] base_lr: 1.9228e-04 lr: 1.9298e-05 eta: 7 days, 5:33:20 time: 1.1204 data_time: 0.0308 memory: 21522 grad_norm: 2.6283 loss: 1.5837 caption_loss_cls: 2.5758 grounding_loss_reg: 3.4733 detection_loss_cls: 0.0499 detection_loss_reg: 0.3802 semantic_segmentation_loss_cls: 0.0135 instance_segmentation_loss_cls: 0.0515 instance_segmentation_loss_reg: 0.3839 instance_segmentation_loss_poly: 1.0377 +2023/10/28 22:55:50 - mmengine - INFO - Saving checkpoint at 81000 iterations +2023/10/28 23:04:22 - mmengine - INFO - Iter(train) [ 81500/640000] base_lr: 1.9218e-04 lr: 1.9289e-05 eta: 7 days, 4:25:34 time: 1.1017 data_time: 0.0303 memory: 21522 grad_norm: 2.6867 loss: 1.5961 caption_loss_cls: 2.5668 grounding_loss_reg: 3.4708 detection_loss_cls: 0.0498 detection_loss_reg: 0.3795 semantic_segmentation_loss_cls: 0.0135 instance_segmentation_loss_cls: 0.0513 instance_segmentation_loss_reg: 0.3830 instance_segmentation_loss_poly: 1.0368 +2023/10/28 23:13:04 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231028_202629 +2023/10/28 23:13:04 - mmengine - INFO - Iter(train) [ 82000/640000] base_lr: 1.9209e-04 lr: 1.9281e-05 eta: 7 days, 3:36:36 time: 1.0919 data_time: 0.0301 memory: 21522 grad_norm: 2.7089 loss: 1.6089 caption_loss_cls: 2.5711 grounding_loss_reg: 3.4673 detection_loss_cls: 0.0499 detection_loss_reg: 0.3795 semantic_segmentation_loss_cls: 0.0134 instance_segmentation_loss_cls: 0.0511 instance_segmentation_loss_reg: 0.3822 instance_segmentation_loss_poly: 1.0351 +2023/10/28 23:13:04 - mmengine - INFO - Saving checkpoint at 82000 iterations +2023/10/28 23:21:54 - mmengine - INFO - Iter(train) [ 82500/640000] base_lr: 1.9199e-04 lr: 1.9272e-05 eta: 7 days, 3:01:35 time: 1.0794 data_time: 0.0299 memory: 21522 grad_norm: 2.7334 loss: 1.6245 caption_loss_cls: 2.5736 grounding_loss_reg: 3.4647 detection_loss_cls: 0.0500 detection_loss_reg: 0.3797 semantic_segmentation_loss_cls: 0.0134 instance_segmentation_loss_cls: 0.0510 instance_segmentation_loss_reg: 0.3831 instance_segmentation_loss_poly: 1.0376 +2023/10/28 23:31:18 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231028_202629 +2023/10/28 23:31:18 - mmengine - INFO - Iter(train) [ 83000/640000] base_lr: 1.9190e-04 lr: 1.9263e-05 eta: 7 days, 3:04:44 time: 1.0984 data_time: 0.0305 memory: 21522 grad_norm: 2.6822 loss: 1.6034 caption_loss_cls: 2.5728 grounding_loss_reg: 3.4619 detection_loss_cls: 0.0498 detection_loss_reg: 0.3790 semantic_segmentation_loss_cls: 0.0134 instance_segmentation_loss_cls: 0.0506 instance_segmentation_loss_reg: 0.3814 instance_segmentation_loss_poly: 1.0333 +2023/10/28 23:31:18 - mmengine - INFO - Saving checkpoint at 83000 iterations +2023/10/28 23:40:24 - mmengine - INFO - Iter(train) [ 83500/640000] base_lr: 1.9180e-04 lr: 1.9255e-05 eta: 7 days, 2:48:19 time: 1.0905 data_time: 0.0306 memory: 21522 grad_norm: 2.6917 loss: 1.6015 caption_loss_cls: 2.5708 grounding_loss_reg: 3.4606 detection_loss_cls: 0.0497 detection_loss_reg: 0.3797 semantic_segmentation_loss_cls: 0.0134 instance_segmentation_loss_cls: 0.0506 instance_segmentation_loss_reg: 0.3817 instance_segmentation_loss_poly: 1.0345 +2023/10/28 23:49:37 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231028_202629 +2023/10/28 23:49:37 - mmengine - INFO - Iter(train) [ 84000/640000] base_lr: 1.9170e-04 lr: 1.9246e-05 eta: 7 days, 2:39:47 time: 1.0846 data_time: 0.0318 memory: 21522 grad_norm: 2.7677 loss: 1.6269 caption_loss_cls: 2.5665 grounding_loss_reg: 3.4542 detection_loss_cls: 0.0496 detection_loss_reg: 0.3790 semantic_segmentation_loss_cls: 0.0133 instance_segmentation_loss_cls: 0.0505 instance_segmentation_loss_reg: 0.3825 instance_segmentation_loss_poly: 1.0371 +2023/10/28 23:49:37 - mmengine - INFO - Saving checkpoint at 84000 iterations +2023/10/28 23:59:05 - mmengine - INFO - Iter(train) [ 84500/640000] base_lr: 1.9161e-04 lr: 1.9237e-05 eta: 7 days, 2:43:55 time: 1.0851 data_time: 0.0346 memory: 21522 grad_norm: 2.7790 loss: 1.6280 caption_loss_cls: 2.5617 grounding_loss_reg: 3.4499 detection_loss_cls: 0.0495 detection_loss_reg: 0.3783 semantic_segmentation_loss_cls: 0.0133 instance_segmentation_loss_cls: 0.0505 instance_segmentation_loss_reg: 0.3824 instance_segmentation_loss_poly: 1.0365 +2023/10/29 00:07:42 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231028_202629 +2023/10/29 00:07:42 - mmengine - INFO - Iter(train) [ 85000/640000] base_lr: 1.9151e-04 lr: 1.9228e-05 eta: 7 days, 2:04:13 time: 1.0777 data_time: 0.0344 memory: 21522 grad_norm: 2.7953 loss: 1.6361 caption_loss_cls: 2.5591 grounding_loss_reg: 3.4497 detection_loss_cls: 0.0496 detection_loss_reg: 0.3794 semantic_segmentation_loss_cls: 0.0133 instance_segmentation_loss_cls: 0.0504 instance_segmentation_loss_reg: 0.3823 instance_segmentation_loss_poly: 1.0364 +2023/10/29 00:07:42 - mmengine - INFO - Saving checkpoint at 85000 iterations +2023/10/29 00:16:55 - mmengine - INFO - Iter(train) [ 85500/640000] base_lr: 1.9141e-04 lr: 1.9219e-05 eta: 7 days, 1:56:08 time: 1.0880 data_time: 0.0348 memory: 21522 grad_norm: 2.7906 loss: 1.6385 caption_loss_cls: 2.5582 grounding_loss_reg: 3.4469 detection_loss_cls: 0.0496 detection_loss_reg: 0.3788 semantic_segmentation_loss_cls: 0.0133 instance_segmentation_loss_cls: 0.0505 instance_segmentation_loss_reg: 0.3826 instance_segmentation_loss_poly: 1.0377 +2023/10/29 00:26:01 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231028_202629 +2023/10/29 00:26:01 - mmengine - INFO - Iter(train) [ 86000/640000] base_lr: 1.9131e-04 lr: 1.9210e-05 eta: 7 days, 1:42:55 time: 1.0942 data_time: 0.0349 memory: 21522 grad_norm: 2.7530 loss: 1.6097 caption_loss_cls: 2.5566 grounding_loss_reg: 3.4433 detection_loss_cls: 0.0494 detection_loss_reg: 0.3790 semantic_segmentation_loss_cls: 0.0133 instance_segmentation_loss_cls: 0.0505 instance_segmentation_loss_reg: 0.3828 instance_segmentation_loss_poly: 1.0389 +2023/10/29 00:26:01 - mmengine - INFO - Saving checkpoint at 86000 iterations +2023/10/29 00:35:40 - mmengine - INFO - Iter(train) [ 86500/640000] base_lr: 1.9121e-04 lr: 1.9201e-05 eta: 7 days, 1:53:32 time: 1.1063 data_time: 0.0350 memory: 21522 grad_norm: 2.7287 loss: 1.5801 caption_loss_cls: 2.5532 grounding_loss_reg: 3.4371 detection_loss_cls: 0.0493 detection_loss_reg: 0.3792 semantic_segmentation_loss_cls: 0.0132 instance_segmentation_loss_cls: 0.0504 instance_segmentation_loss_reg: 0.3825 instance_segmentation_loss_poly: 1.0382 +2023/10/29 00:44:50 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231028_202629 +2023/10/29 00:44:50 - mmengine - INFO - Iter(train) [ 87000/640000] base_lr: 1.9111e-04 lr: 1.9192e-05 eta: 7 days, 1:42:28 time: 1.1027 data_time: 0.0351 memory: 21522 grad_norm: 2.7316 loss: 1.5881 caption_loss_cls: 2.5532 grounding_loss_reg: 3.4372 detection_loss_cls: 0.0493 detection_loss_reg: 0.3792 semantic_segmentation_loss_cls: 0.0132 instance_segmentation_loss_cls: 0.0503 instance_segmentation_loss_reg: 0.3822 instance_segmentation_loss_poly: 1.0366 +2023/10/29 00:44:50 - mmengine - INFO - Saving checkpoint at 87000 iterations +2023/10/29 00:54:26 - mmengine - INFO - Iter(train) [ 87500/640000] base_lr: 1.9101e-04 lr: 1.9183e-05 eta: 7 days, 1:49:20 time: 1.1103 data_time: 0.0354 memory: 21522 grad_norm: 2.7117 loss: 1.5911 caption_loss_cls: 2.5534 grounding_loss_reg: 3.4351 detection_loss_cls: 0.0493 detection_loss_reg: 0.3801 semantic_segmentation_loss_cls: 0.0132 instance_segmentation_loss_cls: 0.0504 instance_segmentation_loss_reg: 0.3827 instance_segmentation_loss_poly: 1.0364 +2023/10/29 01:03:28 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231028_202629 +2023/10/29 01:03:28 - mmengine - INFO - Iter(train) [ 88000/640000] base_lr: 1.9091e-04 lr: 1.9173e-05 eta: 7 days, 1:33:06 time: 1.1077 data_time: 0.0342 memory: 21522 grad_norm: 2.6738 loss: 1.5731 caption_loss_cls: 2.5482 grounding_loss_reg: 3.4319 detection_loss_cls: 0.0493 detection_loss_reg: 0.3801 semantic_segmentation_loss_cls: 0.0131 instance_segmentation_loss_cls: 0.0503 instance_segmentation_loss_reg: 0.3829 instance_segmentation_loss_poly: 1.0357 +2023/10/29 01:03:28 - mmengine - INFO - Saving checkpoint at 88000 iterations +2023/10/29 01:13:02 - mmengine - INFO - Iter(train) [ 88500/640000] base_lr: 1.9080e-04 lr: 1.9164e-05 eta: 7 days, 1:36:43 time: 1.1090 data_time: 0.0341 memory: 21522 grad_norm: 2.6258 loss: 1.5518 caption_loss_cls: 2.5517 grounding_loss_reg: 3.4289 detection_loss_cls: 0.0491 detection_loss_reg: 0.3793 semantic_segmentation_loss_cls: 0.0132 instance_segmentation_loss_cls: 0.0501 instance_segmentation_loss_reg: 0.3812 instance_segmentation_loss_poly: 1.0322 +2023/10/29 01:22:03 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231028_202629 +2023/10/29 01:22:03 - mmengine - INFO - Iter(train) [ 89000/640000] base_lr: 1.9070e-04 lr: 1.9155e-05 eta: 7 days, 1:19:50 time: 1.1151 data_time: 0.0343 memory: 21522 grad_norm: 2.6252 loss: 1.5471 caption_loss_cls: 2.5500 grounding_loss_reg: 3.4255 detection_loss_cls: 0.0489 detection_loss_reg: 0.3790 semantic_segmentation_loss_cls: 0.0132 instance_segmentation_loss_cls: 0.0501 instance_segmentation_loss_reg: 0.3817 instance_segmentation_loss_poly: 1.0335 +2023/10/29 01:22:03 - mmengine - INFO - Saving checkpoint at 89000 iterations +2023/10/29 01:31:29 - mmengine - INFO - Iter(train) [ 89500/640000] base_lr: 1.9060e-04 lr: 1.9145e-05 eta: 7 days, 1:18:21 time: 1.1184 data_time: 0.0345 memory: 21522 grad_norm: 2.6319 loss: 1.5514 caption_loss_cls: 2.5499 grounding_loss_reg: 3.4237 detection_loss_cls: 0.0487 detection_loss_reg: 0.3777 semantic_segmentation_loss_cls: 0.0132 instance_segmentation_loss_cls: 0.0500 instance_segmentation_loss_reg: 0.3815 instance_segmentation_loss_poly: 1.0331 +2023/10/29 01:40:48 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231028_202629 +2023/10/29 01:40:48 - mmengine - INFO - Iter(train) [ 90000/640000] base_lr: 1.9050e-04 lr: 1.9136e-05 eta: 7 days, 1:11:51 time: 1.1214 data_time: 0.0347 memory: 21522 grad_norm: 2.6371 loss: 1.5605 caption_loss_cls: 2.5452 grounding_loss_reg: 3.4183 detection_loss_cls: 0.0488 detection_loss_reg: 0.3794 semantic_segmentation_loss_cls: 0.0132 instance_segmentation_loss_cls: 0.0501 instance_segmentation_loss_reg: 0.3822 instance_segmentation_loss_poly: 1.0349 +2023/10/29 01:40:48 - mmengine - INFO - Saving checkpoint at 90000 iterations +2023/10/29 01:49:48 - mmengine - INFO - Iter(train) [ 90500/640000] base_lr: 1.9039e-04 lr: 1.9126e-05 eta: 7 days, 0:55:17 time: 1.1119 data_time: 0.0349 memory: 21522 grad_norm: 2.6718 loss: 1.5846 caption_loss_cls: 2.5465 grounding_loss_reg: 3.4178 detection_loss_cls: 0.0487 detection_loss_reg: 0.3793 semantic_segmentation_loss_cls: 0.0132 instance_segmentation_loss_cls: 0.0501 instance_segmentation_loss_reg: 0.3825 instance_segmentation_loss_poly: 1.0359 +2023/10/29 01:58:30 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231028_202629 +2023/10/29 01:58:30 - mmengine - INFO - Iter(train) [ 91000/640000] base_lr: 1.9029e-04 lr: 1.9117e-05 eta: 7 days, 0:28:43 time: 1.1047 data_time: 0.0344 memory: 21522 grad_norm: 2.6726 loss: 1.5673 caption_loss_cls: 2.5424 grounding_loss_reg: 3.4149 detection_loss_cls: 0.0485 detection_loss_reg: 0.3785 semantic_segmentation_loss_cls: 0.0131 instance_segmentation_loss_cls: 0.0500 instance_segmentation_loss_reg: 0.3824 instance_segmentation_loss_poly: 1.0357 +2023/10/29 01:58:30 - mmengine - INFO - Saving checkpoint at 91000 iterations +2023/10/29 02:07:50 - mmengine - INFO - Iter(train) [ 91500/640000] base_lr: 1.9018e-04 lr: 1.9107e-05 eta: 7 days, 0:23:43 time: 1.1009 data_time: 0.0340 memory: 21522 grad_norm: 2.6582 loss: 1.5504 caption_loss_cls: 2.5392 grounding_loss_reg: 3.4127 detection_loss_cls: 0.0484 detection_loss_reg: 0.3776 semantic_segmentation_loss_cls: 0.0131 instance_segmentation_loss_cls: 0.0498 instance_segmentation_loss_reg: 0.3815 instance_segmentation_loss_poly: 1.0344 +2023/10/29 02:16:51 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231028_202629 +2023/10/29 02:16:51 - mmengine - INFO - Iter(train) [ 92000/640000] base_lr: 1.9008e-04 lr: 1.9098e-05 eta: 7 days, 0:08:47 time: 1.1006 data_time: 0.0340 memory: 21522 grad_norm: 2.6806 loss: 1.5623 caption_loss_cls: 2.5360 grounding_loss_reg: 3.4103 detection_loss_cls: 0.0483 detection_loss_reg: 0.3773 semantic_segmentation_loss_cls: 0.0131 instance_segmentation_loss_cls: 0.0496 instance_segmentation_loss_reg: 0.3798 instance_segmentation_loss_poly: 1.0300 +2023/10/29 02:16:51 - mmengine - INFO - Saving checkpoint at 92000 iterations +2023/10/29 02:26:25 - mmengine - INFO - Iter(train) [ 92500/640000] base_lr: 1.8997e-04 lr: 1.9088e-05 eta: 7 days, 0:10:04 time: 1.1007 data_time: 0.0339 memory: 21522 grad_norm: 2.7056 loss: 1.5688 caption_loss_cls: 2.5314 grounding_loss_reg: 3.4065 detection_loss_cls: 0.0482 detection_loss_reg: 0.3765 semantic_segmentation_loss_cls: 0.0131 instance_segmentation_loss_cls: 0.0495 instance_segmentation_loss_reg: 0.3798 instance_segmentation_loss_poly: 1.0302 +2023/10/29 02:35:43 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231028_202629 +2023/10/29 02:35:43 - mmengine - INFO - Iter(train) [ 93000/640000] base_lr: 1.8986e-04 lr: 1.9078e-05 eta: 7 days, 0:03:13 time: 1.1048 data_time: 0.0340 memory: 21522 grad_norm: 2.7012 loss: 1.5598 caption_loss_cls: 2.5250 grounding_loss_reg: 3.4043 detection_loss_cls: 0.0479 detection_loss_reg: 0.3750 semantic_segmentation_loss_cls: 0.0131 instance_segmentation_loss_cls: 0.0493 instance_segmentation_loss_reg: 0.3786 instance_segmentation_loss_poly: 1.0268 +2023/10/29 02:35:43 - mmengine - INFO - Saving checkpoint at 93000 iterations +2023/10/29 02:44:49 - mmengine - INFO - Iter(train) [ 93500/640000] base_lr: 1.8975e-04 lr: 1.9069e-05 eta: 6 days, 23:50:44 time: 1.0998 data_time: 0.0335 memory: 21522 grad_norm: 2.6816 loss: 1.5400 caption_loss_cls: 2.5272 grounding_loss_reg: 3.3986 detection_loss_cls: 0.0478 detection_loss_reg: 0.3739 semantic_segmentation_loss_cls: 0.0131 instance_segmentation_loss_cls: 0.0492 instance_segmentation_loss_reg: 0.3771 instance_segmentation_loss_poly: 1.0243 +2023/10/29 02:53:56 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231028_202629 +2023/10/29 02:53:56 - mmengine - INFO - Iter(train) [ 94000/640000] base_lr: 1.8965e-04 lr: 1.9059e-05 eta: 6 days, 23:38:37 time: 1.0968 data_time: 0.0332 memory: 21522 grad_norm: 2.6811 loss: 1.5401 caption_loss_cls: 2.5248 grounding_loss_reg: 3.3988 detection_loss_cls: 0.0477 detection_loss_reg: 0.3730 semantic_segmentation_loss_cls: 0.0130 instance_segmentation_loss_cls: 0.0491 instance_segmentation_loss_reg: 0.3766 instance_segmentation_loss_poly: 1.0228 +2023/10/29 02:53:56 - mmengine - INFO - Saving checkpoint at 94000 iterations +2023/10/29 02:03:36 - mmengine - INFO - Iter(train) [ 94500/640000] base_lr: 1.8954e-04 lr: 1.9049e-05 eta: 6 days, 23:41:23 time: 1.1066 data_time: 0.0332 memory: 21522 grad_norm: 2.6726 loss: 1.5222 caption_loss_cls: 2.5249 grounding_loss_reg: 3.3927 detection_loss_cls: 0.0476 detection_loss_reg: 0.3727 semantic_segmentation_loss_cls: 0.0130 instance_segmentation_loss_cls: 0.0489 instance_segmentation_loss_reg: 0.3756 instance_segmentation_loss_poly: 1.0193 +2023/10/29 02:12:44 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231028_202629 +2023/10/29 02:12:44 - mmengine - INFO - Iter(train) [ 95000/640000] base_lr: 1.8943e-04 lr: 1.9039e-05 eta: 6 days, 23:30:02 time: 1.1134 data_time: 0.0335 memory: 21522 grad_norm: 2.6503 loss: 1.5271 caption_loss_cls: 2.5267 grounding_loss_reg: 3.3928 detection_loss_cls: 0.0476 detection_loss_reg: 0.3718 semantic_segmentation_loss_cls: 0.0131 instance_segmentation_loss_cls: 0.0489 instance_segmentation_loss_reg: 0.3759 instance_segmentation_loss_poly: 1.0187 +2023/10/29 02:12:44 - mmengine - INFO - Saving checkpoint at 95000 iterations +2023/10/29 02:21:36 - mmengine - INFO - Iter(train) [ 95500/640000] base_lr: 1.8932e-04 lr: 1.9029e-05 eta: 6 days, 23:11:50 time: 1.1063 data_time: 0.0335 memory: 21522 grad_norm: 2.7035 loss: 1.5508 caption_loss_cls: 2.5262 grounding_loss_reg: 3.3905 detection_loss_cls: 0.0477 detection_loss_reg: 0.3725 semantic_segmentation_loss_cls: 0.0131 instance_segmentation_loss_cls: 0.0489 instance_segmentation_loss_reg: 0.3760 instance_segmentation_loss_poly: 1.0187 +2023/10/29 02:30:56 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231028_202629 +2023/10/29 02:30:56 - mmengine - INFO - Iter(train) [ 96000/640000] base_lr: 1.8921e-04 lr: 1.9019e-05 eta: 6 days, 23:05:24 time: 1.1108 data_time: 0.0339 memory: 21522 grad_norm: 2.6762 loss: 1.5469 caption_loss_cls: 2.5225 grounding_loss_reg: 3.3877 detection_loss_cls: 0.0478 detection_loss_reg: 0.3734 semantic_segmentation_loss_cls: 0.0130 instance_segmentation_loss_cls: 0.0492 instance_segmentation_loss_reg: 0.3762 instance_segmentation_loss_poly: 1.0187 +2023/10/29 02:30:56 - mmengine - INFO - Saving checkpoint at 96000 iterations +2023/10/29 02:40:23 - mmengine - INFO - Iter(train) [ 96500/640000] base_lr: 1.8910e-04 lr: 1.9009e-05 eta: 6 days, 23:02:08 time: 1.1094 data_time: 0.0340 memory: 21522 grad_norm: 2.7001 loss: 1.5552 caption_loss_cls: 2.5201 grounding_loss_reg: 3.3857 detection_loss_cls: 0.0476 detection_loss_reg: 0.3725 semantic_segmentation_loss_cls: 0.0130 instance_segmentation_loss_cls: 0.0494 instance_segmentation_loss_reg: 0.3768 instance_segmentation_loss_poly: 1.0187 +2023/10/29 02:49:50 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231028_202629 +2023/10/29 02:49:50 - mmengine - INFO - Iter(train) [ 97000/640000] base_lr: 1.8899e-04 lr: 1.8999e-05 eta: 6 days, 22:57:56 time: 1.1114 data_time: 0.0340 memory: 21522 grad_norm: 2.6785 loss: 1.5487 caption_loss_cls: 2.5194 grounding_loss_reg: 3.3812 detection_loss_cls: 0.0477 detection_loss_reg: 0.3730 semantic_segmentation_loss_cls: 0.0130 instance_segmentation_loss_cls: 0.0495 instance_segmentation_loss_reg: 0.3766 instance_segmentation_loss_poly: 1.0179 +2023/10/29 02:49:50 - mmengine - INFO - Saving checkpoint at 97000 iterations +2023/10/29 02:59:28 - mmengine - INFO - Iter(train) [ 97500/640000] base_lr: 1.8888e-04 lr: 1.8989e-05 eta: 6 days, 22:58:12 time: 1.1194 data_time: 0.0346 memory: 21522 grad_norm: 2.6664 loss: 1.5621 caption_loss_cls: 2.5194 grounding_loss_reg: 3.3796 detection_loss_cls: 0.0474 detection_loss_reg: 0.3720 semantic_segmentation_loss_cls: 0.0130 instance_segmentation_loss_cls: 0.0495 instance_segmentation_loss_reg: 0.3762 instance_segmentation_loss_poly: 1.0155 +2023/10/29 03:08:21 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231028_202629 +2023/10/29 03:08:21 - mmengine - INFO - Iter(train) [ 98000/640000] base_lr: 1.8876e-04 lr: 1.8979e-05 eta: 6 days, 22:41:17 time: 1.1162 data_time: 0.0348 memory: 21522 grad_norm: 2.6820 loss: 1.5675 caption_loss_cls: 2.5217 grounding_loss_reg: 3.3759 detection_loss_cls: 0.0472 detection_loss_reg: 0.3712 semantic_segmentation_loss_cls: 0.0130 instance_segmentation_loss_cls: 0.0495 instance_segmentation_loss_reg: 0.3765 instance_segmentation_loss_poly: 1.0152 +2023/10/29 03:08:21 - mmengine - INFO - Saving checkpoint at 98000 iterations +2023/10/29 03:18:17 - mmengine - INFO - Iter(train) [ 98500/640000] base_lr: 1.8865e-04 lr: 1.8968e-05 eta: 6 days, 22:47:23 time: 1.1201 data_time: 0.0349 memory: 21522 grad_norm: 2.6168 loss: 1.5570 caption_loss_cls: 2.5195 grounding_loss_reg: 3.3732 detection_loss_cls: 0.0472 detection_loss_reg: 0.3725 semantic_segmentation_loss_cls: 0.0130 instance_segmentation_loss_cls: 0.0496 instance_segmentation_loss_reg: 0.3764 instance_segmentation_loss_poly: 1.0145 +2023/10/29 03:28:08 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231028_202629 +2023/10/29 03:28:08 - mmengine - INFO - Iter(train) [ 99000/640000] base_lr: 1.8854e-04 lr: 1.8958e-05 eta: 6 days, 22:51:27 time: 1.1308 data_time: 0.0353 memory: 21522 grad_norm: 2.5978 loss: 1.5492 caption_loss_cls: 2.5226 grounding_loss_reg: 3.3685 detection_loss_cls: 0.0472 detection_loss_reg: 0.3721 semantic_segmentation_loss_cls: 0.0130 instance_segmentation_loss_cls: 0.0495 instance_segmentation_loss_reg: 0.3769 instance_segmentation_loss_poly: 1.0154 +2023/10/29 03:28:08 - mmengine - INFO - Saving checkpoint at 99000 iterations +2023/10/29 03:37:38 - mmengine - INFO - Iter(train) [ 99500/640000] base_lr: 1.8842e-04 lr: 1.8948e-05 eta: 6 days, 22:47:26 time: 1.1403 data_time: 0.0356 memory: 21522 grad_norm: 2.5677 loss: 1.5363 caption_loss_cls: 2.5186 grounding_loss_reg: 3.3650 detection_loss_cls: 0.0472 detection_loss_reg: 0.3724 semantic_segmentation_loss_cls: 0.0129 instance_segmentation_loss_cls: 0.0496 instance_segmentation_loss_reg: 0.3772 instance_segmentation_loss_poly: 1.0156 +2023/10/29 03:47:22 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231028_202629 +2023/10/29 03:47:22 - mmengine - INFO - Iter(train) [100000/640000] base_lr: 1.8831e-04 lr: 1.8937e-05 eta: 6 days, 22:48:00 time: 1.1464 data_time: 0.0355 memory: 21522 grad_norm: 2.5371 loss: 1.5250 caption_loss_cls: 2.5184 grounding_loss_reg: 3.3618 detection_loss_cls: 0.0473 detection_loss_reg: 0.3736 semantic_segmentation_loss_cls: 0.0129 instance_segmentation_loss_cls: 0.0495 instance_segmentation_loss_reg: 0.3771 instance_segmentation_loss_poly: 1.0156 +2023/10/29 03:47:22 - mmengine - INFO - Saving checkpoint at 100000 iterations +2023/10/29 03:56:31 - mmengine - INFO - Evaluating bbox... +2023/10/29 03:57:28 - mmengine - INFO - bbox_mAP_copypaste: 0.333 0.505 0.359 0.196 0.384 0.443 +2023/10/29 03:57:28 - mmengine - INFO - Evaluating segm... +2023/10/29 03:58:38 - mmengine - INFO - segm_mAP_copypaste: 0.207 0.403 0.191 0.089 0.256 0.345 +2023/10/29 04:03:40 - mmengine - INFO - per class results: +2023/10/29 04:03:40 - mmengine - INFO - ++---------------------+-------+-------+ +| Class | IoU | Acc | ++---------------------+-------+-------+ +| wall | 72.03 | 84.1 | +| building | 79.61 | 91.37 | +| sky | 92.6 | 96.63 | +| floor | 78.44 | 88.21 | +| tree | 69.93 | 85.22 | +| ceiling | 81.57 | 89.51 | +| road | 81.75 | 88.51 | +| bed | 83.9 | 89.32 | +| windowpane | 54.73 | 82.86 | +| grass | 67.68 | 84.7 | +| cabinet | 54.74 | 63.17 | +| sidewalk | 59.4 | 77.92 | +| person | 75.58 | 88.35 | +| earth | 32.88 | 44.41 | +| door | 41.56 | 67.17 | +| table | 50.89 | 65.64 | +| mountain | 49.4 | 55.85 | +| plant | 44.72 | 62.97 | +| curtain | 56.61 | 87.19 | +| chair | 49.71 | 66.51 | +| car | 78.53 | 89.31 | +| water | 50.68 | 73.89 | +| painting | 62.97 | 84.88 | +| sofa | 58.06 | 67.88 | +| shelf | 35.03 | 58.3 | +| house | 37.06 | 44.25 | +| sea | 51.74 | 68.03 | +| mirror | 53.85 | 70.81 | +| rug | 59.52 | 64.49 | +| field | 26.52 | 44.64 | +| armchair | 37.71 | 59.23 | +| seat | 55.67 | 66.88 | +| fence | 29.95 | 40.52 | +| desk | 36.83 | 60.07 | +| rock | 44.52 | 67.64 | +| wardrobe | 37.44 | 42.08 | +| lamp | 48.87 | 71.66 | +| bathtub | 66.51 | 81.89 | +| railing | 32.42 | 49.45 | +| cushion | 45.71 | 72.71 | +| base | 21.58 | 32.72 | +| box | 14.89 | 18.11 | +| column | 44.56 | 67.62 | +| signboard | 32.87 | 49.0 | +| chest of drawers | 30.44 | 51.94 | +| counter | 17.29 | 20.02 | +| sand | 32.26 | 48.08 | +| sink | 62.76 | 72.99 | +| skyscraper | 60.68 | 73.2 | +| fireplace | 58.19 | 74.86 | +| refrigerator | 64.23 | 81.37 | +| grandstand | 30.54 | 65.23 | +| path | 21.13 | 25.11 | +| stairs | 21.55 | 24.44 | +| runway | 83.02 | 90.1 | +| case | 36.67 | 42.48 | +| pool table | 82.89 | 95.08 | +| pillow | 39.56 | 52.95 | +| screen door | 43.33 | 52.72 | +| stairway | 20.27 | 27.32 | +| river | 16.3 | 21.02 | +| bridge | 57.92 | 70.86 | +| bookcase | 19.01 | 21.75 | +| blind | 27.99 | 35.1 | +| coffee table | 54.07 | 78.07 | +| toilet | 80.66 | 85.75 | +| flower | 25.7 | 44.56 | +| book | 41.33 | 56.84 | +| hill | 8.54 | 10.44 | +| bench | 33.66 | 45.9 | +| countertop | 47.76 | 63.73 | +| stove | 53.51 | 57.15 | +| palm | 45.45 | 64.93 | +| kitchen island | 38.61 | 62.19 | +| computer | 46.82 | 57.7 | +| swivel chair | 38.99 | 55.57 | +| boat | 59.09 | 79.48 | +| bar | 35.61 | 67.38 | +| arcade machine | 40.56 | 45.19 | +| hovel | 17.75 | 21.45 | +| bus | 73.63 | 91.05 | +| towel | 51.57 | 61.77 | +| light | 41.11 | 65.51 | +| truck | 26.81 | 32.65 | +| tower | 21.7 | 55.54 | +| chandelier | 57.79 | 68.65 | +| awning | 0.84 | 0.88 | +| streetlight | 17.18 | 20.35 | +| booth | 36.26 | 36.62 | +| television receiver | 53.05 | 55.62 | +| airplane | 54.71 | 63.11 | +| dirt track | 0.0 | 0.0 | +| apparel | 23.05 | 34.31 | +| pole | 19.12 | 28.63 | +| land | 0.0 | 0.0 | +| bannister | 5.61 | 7.82 | +| escalator | 11.81 | 12.28 | +| ottoman | 39.74 | 59.63 | +| bottle | 18.67 | 24.37 | +| buffet | 30.56 | 34.4 | +| poster | 23.59 | 27.57 | +| stage | 9.35 | 16.0 | +| van | 22.99 | 28.83 | +| ship | 37.5 | 38.98 | +| fountain | 1.5 | 1.54 | +| conveyer belt | 50.28 | 78.66 | +| canopy | 12.29 | 17.29 | +| washer | 52.32 | 58.14 | +| plaything | 14.92 | 62.75 | +| swimming pool | 37.29 | 91.8 | +| stool | 34.95 | 53.5 | +| barrel | 4.2 | 16.21 | +| basket | 19.66 | 27.47 | +| waterfall | 47.8 | 63.69 | +| tent | 90.45 | 94.14 | +| bag | 8.54 | 9.01 | +| minibike | 59.24 | 74.56 | +| cradle | 60.1 | 77.59 | +| oven | 30.33 | 40.7 | +| ball | 41.55 | 49.07 | +| food | 52.93 | 59.93 | +| step | 9.66 | 10.5 | +| tank | 37.99 | 43.59 | +| trade name | 12.12 | 13.06 | +| microwave | 40.21 | 44.39 | +| pot | 34.35 | 40.69 | +| animal | 59.58 | 63.46 | +| bicycle | 49.5 | 71.8 | +| lake | 0.06 | 0.06 | +| dishwasher | 41.39 | 79.41 | +| screen | 75.75 | 84.72 | +| blanket | 7.33 | 7.92 | +| sculpture | 36.93 | 49.5 | +| hood | 43.72 | 47.3 | +| sconce | 21.82 | 24.47 | +| vase | 34.22 | 49.06 | +| traffic light | 25.13 | 38.12 | +| tray | 6.79 | 10.0 | +| ashcan | 23.56 | 46.71 | +| fan | 44.84 | 53.67 | +| pier | 58.6 | 64.32 | +| crt screen | 3.58 | 5.49 | +| plate | 48.67 | 64.3 | +| monitor | 16.23 | 49.74 | +| bulletin board | 31.27 | 44.81 | +| shower | 0.0 | 0.0 | +| radiator | 39.15 | 44.54 | +| glass | 13.17 | 15.14 | +| clock | 15.09 | 16.85 | +| flag | 30.02 | 34.46 | ++---------------------+-------+-------+ +2023/10/29 04:03:55 - mmengine - INFO - Iter(val) [209/209] coco/bbox_mAP: 0.3330 coco/bbox_mAP_50: 0.5050 coco/bbox_mAP_75: 0.3590 coco/bbox_mAP_s: 0.1960 coco/bbox_mAP_m: 0.3840 coco/bbox_mAP_l: 0.4430 coco/segm_mAP: 0.2070 coco/segm_mAP_50: 0.4030 coco/segm_mAP_75: 0.1910 coco/segm_mAP_s: 0.0890 coco/segm_mAP_m: 0.2560 coco/segm_mAP_l: 0.3450 Bleu_1: 0.6802 Bleu_2: 0.4992 Bleu_3: 0.3565 Bleu_4: 0.2548 METEOR: 0.2273 ROUGE_L: 0.5003 CIDEr: 0.8087 SPICE: 0.1585 aAcc: 79.2600 mIoU: 39.9400 mAcc: 52.0500 visual-grounding/miou: 0.6919 visual-grounding/acc: 0.7771 data_time: 0.0048 time: 0.5243 +2023/10/29 04:12:56 - mmengine - INFO - Iter(train) [100500/640000] base_lr: 1.8820e-04 lr: 1.8927e-05 eta: 6 days, 22:34:00 time: 1.1400 data_time: 0.0323 memory: 21522 grad_norm: 2.4872 loss: 1.5123 caption_loss_cls: 2.5184 grounding_loss_reg: 3.3574 detection_loss_cls: 0.0472 detection_loss_reg: 0.3731 semantic_segmentation_loss_cls: 0.0129 instance_segmentation_loss_cls: 0.0494 instance_segmentation_loss_reg: 0.3767 instance_segmentation_loss_poly: 1.0142 +2023/10/29 04:22:07 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231028_202629 +2023/10/29 04:22:07 - mmengine - INFO - Iter(train) [101000/640000] base_lr: 1.8808e-04 lr: 1.8916e-05 eta: 6 days, 22:23:12 time: 1.1363 data_time: 0.0322 memory: 21522 grad_norm: 2.5220 loss: 1.5239 caption_loss_cls: 2.5208 grounding_loss_reg: 3.3543 detection_loss_cls: 0.0472 detection_loss_reg: 0.3730 semantic_segmentation_loss_cls: 0.0129 instance_segmentation_loss_cls: 0.0494 instance_segmentation_loss_reg: 0.3765 instance_segmentation_loss_poly: 1.0143 +2023/10/29 04:22:07 - mmengine - INFO - Saving checkpoint at 101000 iterations +2023/10/29 04:31:33 - mmengine - INFO - Iter(train) [101500/640000] base_lr: 1.8796e-04 lr: 1.8906e-05 eta: 6 days, 22:17:01 time: 1.1330 data_time: 0.0317 memory: 21522 grad_norm: 2.5230 loss: 1.5135 caption_loss_cls: 2.5211 grounding_loss_reg: 3.3541 detection_loss_cls: 0.0472 detection_loss_reg: 0.3732 semantic_segmentation_loss_cls: 0.0129 instance_segmentation_loss_cls: 0.0494 instance_segmentation_loss_reg: 0.3765 instance_segmentation_loss_poly: 1.0130 +2023/10/29 04:40:53 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231028_202629 +2023/10/29 04:40:53 - mmengine - INFO - Iter(train) [102000/640000] base_lr: 1.8785e-04 lr: 1.8895e-05 eta: 6 days, 22:09:05 time: 1.1396 data_time: 0.0317 memory: 21522 grad_norm: 2.4918 loss: 1.5047 caption_loss_cls: 2.5206 grounding_loss_reg: 3.3503 detection_loss_cls: 0.0470 detection_loss_reg: 0.3729 semantic_segmentation_loss_cls: 0.0128 instance_segmentation_loss_cls: 0.0494 instance_segmentation_loss_reg: 0.3759 instance_segmentation_loss_poly: 1.0109 +2023/10/29 04:40:53 - mmengine - INFO - Saving checkpoint at 102000 iterations +2023/10/29 04:50:10 - mmengine - INFO - Iter(train) [102500/640000] base_lr: 1.8773e-04 lr: 1.8885e-05 eta: 6 days, 22:00:14 time: 1.1302 data_time: 0.0314 memory: 21522 grad_norm: 2.5501 loss: 1.5194 caption_loss_cls: 2.5162 grounding_loss_reg: 3.3518 detection_loss_cls: 0.0467 detection_loss_reg: 0.3715 semantic_segmentation_loss_cls: 0.0128 instance_segmentation_loss_cls: 0.0495 instance_segmentation_loss_reg: 0.3755 instance_segmentation_loss_poly: 1.0105 +2023/10/29 04:58:47 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231028_202629 +2023/10/29 04:58:47 - mmengine - INFO - Iter(train) [103000/640000] base_lr: 1.8761e-04 lr: 1.8874e-05 eta: 6 days, 21:38:57 time: 1.1116 data_time: 0.0308 memory: 21522 grad_norm: 2.6160 loss: 1.5406 caption_loss_cls: 2.5145 grounding_loss_reg: 3.3485 detection_loss_cls: 0.0468 detection_loss_reg: 0.3717 semantic_segmentation_loss_cls: 0.0128 instance_segmentation_loss_cls: 0.0495 instance_segmentation_loss_reg: 0.3755 instance_segmentation_loss_poly: 1.0115 +2023/10/29 04:58:47 - mmengine - INFO - Saving checkpoint at 103000 iterations +2023/10/29 05:08:11 - mmengine - INFO - Iter(train) [103500/640000] base_lr: 1.8750e-04 lr: 1.8863e-05 eta: 6 days, 21:32:21 time: 1.1101 data_time: 0.0310 memory: 21522 grad_norm: 2.6466 loss: 1.5480 caption_loss_cls: 2.5168 grounding_loss_reg: 3.3491 detection_loss_cls: 0.0467 detection_loss_reg: 0.3716 semantic_segmentation_loss_cls: 0.0128 instance_segmentation_loss_cls: 0.0497 instance_segmentation_loss_reg: 0.3759 instance_segmentation_loss_poly: 1.0116 +2023/10/29 05:17:15 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231028_202629 +2023/10/29 05:17:15 - mmengine - INFO - Iter(train) [104000/640000] base_lr: 1.8738e-04 lr: 1.8852e-05 eta: 6 days, 21:19:37 time: 1.1000 data_time: 0.0309 memory: 21522 grad_norm: 2.6971 loss: 1.5706 caption_loss_cls: 2.5186 grounding_loss_reg: 3.3482 detection_loss_cls: 0.0467 detection_loss_reg: 0.3722 semantic_segmentation_loss_cls: 0.0128 instance_segmentation_loss_cls: 0.0497 instance_segmentation_loss_reg: 0.3759 instance_segmentation_loss_poly: 1.0119 +2023/10/29 05:17:15 - mmengine - INFO - Saving checkpoint at 104000 iterations +2023/10/29 05:26:44 - mmengine - INFO - Iter(train) [104500/640000] base_lr: 1.8726e-04 lr: 1.8842e-05 eta: 6 days, 21:14:16 time: 1.1067 data_time: 0.0341 memory: 21522 grad_norm: 2.7116 loss: 1.5779 caption_loss_cls: 2.5197 grounding_loss_reg: 3.3440 detection_loss_cls: 0.0467 detection_loss_reg: 0.3726 semantic_segmentation_loss_cls: 0.0128 instance_segmentation_loss_cls: 0.0497 instance_segmentation_loss_reg: 0.3761 instance_segmentation_loss_poly: 1.0128 +2023/10/29 05:36:14 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231028_202629 +2023/10/29 05:36:14 - mmengine - INFO - Iter(train) [105000/640000] base_lr: 1.8714e-04 lr: 1.8831e-05 eta: 6 days, 21:09:22 time: 1.1115 data_time: 0.0345 memory: 21522 grad_norm: 2.6895 loss: 1.5819 caption_loss_cls: 2.5239 grounding_loss_reg: 3.3411 detection_loss_cls: 0.0467 detection_loss_reg: 0.3724 semantic_segmentation_loss_cls: 0.0128 instance_segmentation_loss_cls: 0.0497 instance_segmentation_loss_reg: 0.3764 instance_segmentation_loss_poly: 1.0122 +2023/10/29 05:36:14 - mmengine - INFO - Saving checkpoint at 105000 iterations +2023/10/29 05:45:34 - mmengine - INFO - Iter(train) [105500/640000] base_lr: 1.8702e-04 lr: 1.8820e-05 eta: 6 days, 21:01:06 time: 1.1100 data_time: 0.0344 memory: 21522 grad_norm: 2.6724 loss: 1.5651 caption_loss_cls: 2.5241 grounding_loss_reg: 3.3350 detection_loss_cls: 0.0467 detection_loss_reg: 0.3723 semantic_segmentation_loss_cls: 0.0128 instance_segmentation_loss_cls: 0.0496 instance_segmentation_loss_reg: 0.3764 instance_segmentation_loss_poly: 1.0119 +2023/10/29 05:54:48 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231028_202629 +2023/10/29 05:54:48 - mmengine - INFO - Iter(train) [106000/640000] base_lr: 1.8690e-04 lr: 1.8809e-05 eta: 6 days, 20:51:29 time: 1.1087 data_time: 0.0345 memory: 21522 grad_norm: 2.7025 loss: 1.5670 caption_loss_cls: 2.5201 grounding_loss_reg: 3.3334 detection_loss_cls: 0.0467 detection_loss_reg: 0.3721 semantic_segmentation_loss_cls: 0.0128 instance_segmentation_loss_cls: 0.0496 instance_segmentation_loss_reg: 0.3772 instance_segmentation_loss_poly: 1.0133 +2023/10/29 05:54:48 - mmengine - INFO - Saving checkpoint at 106000 iterations +2023/10/29 06:04:32 - mmengine - INFO - Iter(train) [106500/640000] base_lr: 1.8678e-04 lr: 1.8798e-05 eta: 6 days, 20:49:53 time: 1.1153 data_time: 0.0348 memory: 21522 grad_norm: 2.6720 loss: 1.5601 caption_loss_cls: 2.5243 grounding_loss_reg: 3.3333 detection_loss_cls: 0.0468 detection_loss_reg: 0.3736 semantic_segmentation_loss_cls: 0.0128 instance_segmentation_loss_cls: 0.0496 instance_segmentation_loss_reg: 0.3780 instance_segmentation_loss_poly: 1.0138 +2023/10/29 06:13:36 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231028_202629 +2023/10/29 06:13:36 - mmengine - INFO - Iter(train) [107000/640000] base_lr: 1.8666e-04 lr: 1.8787e-05 eta: 6 days, 20:37:12 time: 1.1219 data_time: 0.0350 memory: 21522 grad_norm: 2.6421 loss: 1.5408 caption_loss_cls: 2.5238 grounding_loss_reg: 3.3282 detection_loss_cls: 0.0468 detection_loss_reg: 0.3728 semantic_segmentation_loss_cls: 0.0127 instance_segmentation_loss_cls: 0.0494 instance_segmentation_loss_reg: 0.3767 instance_segmentation_loss_poly: 1.0117 +2023/10/29 06:13:36 - mmengine - INFO - Saving checkpoint at 107000 iterations +2023/10/29 06:22:41 - mmengine - INFO - Iter(train) [107500/640000] base_lr: 1.8653e-04 lr: 1.8776e-05 eta: 6 days, 20:25:06 time: 1.1172 data_time: 0.0346 memory: 21522 grad_norm: 2.6397 loss: 1.5441 caption_loss_cls: 2.5250 grounding_loss_reg: 3.3256 detection_loss_cls: 0.0467 detection_loss_reg: 0.3725 semantic_segmentation_loss_cls: 0.0128 instance_segmentation_loss_cls: 0.0493 instance_segmentation_loss_reg: 0.3763 instance_segmentation_loss_poly: 1.0109 +2023/10/29 06:31:59 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231028_202629 +2023/10/29 06:31:59 - mmengine - INFO - Iter(train) [108000/640000] base_lr: 1.8641e-04 lr: 1.8765e-05 eta: 6 days, 20:16:21 time: 1.1207 data_time: 0.0347 memory: 21522 grad_norm: 2.6222 loss: 1.5291 caption_loss_cls: 2.5238 grounding_loss_reg: 3.3245 detection_loss_cls: 0.0467 detection_loss_reg: 0.3720 semantic_segmentation_loss_cls: 0.0128 instance_segmentation_loss_cls: 0.0491 instance_segmentation_loss_reg: 0.3751 instance_segmentation_loss_poly: 1.0086 +2023/10/29 06:31:59 - mmengine - INFO - Saving checkpoint at 108000 iterations +2023/10/29 06:41:31 - mmengine - INFO - Iter(train) [108500/640000] base_lr: 1.8629e-04 lr: 1.8753e-05 eta: 6 days, 20:11:14 time: 1.1216 data_time: 0.0347 memory: 21522 grad_norm: 2.6419 loss: 1.5336 caption_loss_cls: 2.5289 grounding_loss_reg: 3.3223 detection_loss_cls: 0.0467 detection_loss_reg: 0.3720 semantic_segmentation_loss_cls: 0.0127 instance_segmentation_loss_cls: 0.0490 instance_segmentation_loss_reg: 0.3751 instance_segmentation_loss_poly: 1.0081 +2023/10/29 06:50:37 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231028_202629 +2023/10/29 06:50:37 - mmengine - INFO - Iter(train) [109000/640000] base_lr: 1.8616e-04 lr: 1.8742e-05 eta: 6 days, 19:59:17 time: 1.1153 data_time: 0.0343 memory: 21522 grad_norm: 2.6422 loss: 1.5271 caption_loss_cls: 2.5263 grounding_loss_reg: 3.3205 detection_loss_cls: 0.0467 detection_loss_reg: 0.3720 semantic_segmentation_loss_cls: 0.0127 instance_segmentation_loss_cls: 0.0490 instance_segmentation_loss_reg: 0.3751 instance_segmentation_loss_poly: 1.0079 +2023/10/29 06:50:37 - mmengine - INFO - Saving checkpoint at 109000 iterations +2023/10/29 06:59:49 - mmengine - INFO - Iter(train) [109500/640000] base_lr: 1.8604e-04 lr: 1.8731e-05 eta: 6 days, 19:49:14 time: 1.1137 data_time: 0.0343 memory: 21522 grad_norm: 2.6598 loss: 1.5381 caption_loss_cls: 2.5290 grounding_loss_reg: 3.3155 detection_loss_cls: 0.0466 detection_loss_reg: 0.3713 semantic_segmentation_loss_cls: 0.0127 instance_segmentation_loss_cls: 0.0489 instance_segmentation_loss_reg: 0.3745 instance_segmentation_loss_poly: 1.0057 +2023/10/29 07:08:54 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231028_202629 +2023/10/29 07:08:54 - mmengine - INFO - Iter(train) [110000/640000] base_lr: 1.8592e-04 lr: 1.8720e-05 eta: 6 days, 19:37:16 time: 1.1113 data_time: 0.0341 memory: 21522 grad_norm: 2.6410 loss: 1.5277 caption_loss_cls: 2.5284 grounding_loss_reg: 3.3129 detection_loss_cls: 0.0466 detection_loss_reg: 0.3708 semantic_segmentation_loss_cls: 0.0126 instance_segmentation_loss_cls: 0.0488 instance_segmentation_loss_reg: 0.3731 instance_segmentation_loss_poly: 1.0028 +2023/10/29 07:08:54 - mmengine - INFO - Saving checkpoint at 110000 iterations +2023/10/29 07:18:35 - mmengine - INFO - Iter(train) [110500/640000] base_lr: 1.8579e-04 lr: 1.8708e-05 eta: 6 days, 19:33:59 time: 1.1105 data_time: 0.0342 memory: 21522 grad_norm: 2.6554 loss: 1.5383 caption_loss_cls: 2.5286 grounding_loss_reg: 3.3098 detection_loss_cls: 0.0465 detection_loss_reg: 0.3698 semantic_segmentation_loss_cls: 0.0126 instance_segmentation_loss_cls: 0.0487 instance_segmentation_loss_reg: 0.3728 instance_segmentation_loss_poly: 1.0017 +2023/10/29 07:28:08 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231028_202629 +2023/10/29 07:28:08 - mmengine - INFO - Iter(train) [111000/640000] base_lr: 1.8566e-04 lr: 1.8697e-05 eta: 6 days, 19:28:52 time: 1.1179 data_time: 0.0345 memory: 21522 grad_norm: 2.6587 loss: 1.5452 caption_loss_cls: 2.5293 grounding_loss_reg: 3.3082 detection_loss_cls: 0.0465 detection_loss_reg: 0.3692 semantic_segmentation_loss_cls: 0.0126 instance_segmentation_loss_cls: 0.0486 instance_segmentation_loss_reg: 0.3727 instance_segmentation_loss_poly: 1.0013 +2023/10/29 07:28:09 - mmengine - INFO - Saving checkpoint at 111000 iterations +2023/10/29 07:36:49 - mmengine - INFO - Iter(train) [111500/640000] base_lr: 1.8554e-04 lr: 1.8685e-05 eta: 6 days, 19:11:05 time: 1.1117 data_time: 0.0343 memory: 21522 grad_norm: 2.6704 loss: 1.5472 caption_loss_cls: 2.5300 grounding_loss_reg: 3.3029 detection_loss_cls: 0.0465 detection_loss_reg: 0.3694 semantic_segmentation_loss_cls: 0.0127 instance_segmentation_loss_cls: 0.0485 instance_segmentation_loss_reg: 0.3734 instance_segmentation_loss_poly: 1.0039 +2023/10/29 07:46:21 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231028_202629 +2023/10/29 07:46:21 - mmengine - INFO - Iter(train) [112000/640000] base_lr: 1.8541e-04 lr: 1.8674e-05 eta: 6 days, 19:05:38 time: 1.1153 data_time: 0.0346 memory: 21522 grad_norm: 2.6585 loss: 1.5495 caption_loss_cls: 2.5277 grounding_loss_reg: 3.3047 detection_loss_cls: 0.0465 detection_loss_reg: 0.3699 semantic_segmentation_loss_cls: 0.0126 instance_segmentation_loss_cls: 0.0485 instance_segmentation_loss_reg: 0.3729 instance_segmentation_loss_poly: 1.0028 +2023/10/29 07:46:21 - mmengine - INFO - Saving checkpoint at 112000 iterations +2023/10/29 07:56:16 - mmengine - INFO - Iter(train) [112500/640000] base_lr: 1.8528e-04 lr: 1.8662e-05 eta: 6 days, 19:05:07 time: 1.1209 data_time: 0.0349 memory: 21522 grad_norm: 2.6290 loss: 1.5396 caption_loss_cls: 2.5326 grounding_loss_reg: 3.3009 detection_loss_cls: 0.0464 detection_loss_reg: 0.3696 semantic_segmentation_loss_cls: 0.0126 instance_segmentation_loss_cls: 0.0485 instance_segmentation_loss_reg: 0.3735 instance_segmentation_loss_poly: 1.0039 +2023/10/29 08:05:14 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231028_202629 +2023/10/29 08:05:14 - mmengine - INFO - Iter(train) [113000/640000] base_lr: 1.8516e-04 lr: 1.8651e-05 eta: 6 days, 18:51:50 time: 1.1192 data_time: 0.0349 memory: 21522 grad_norm: 2.6347 loss: 1.5348 caption_loss_cls: 2.5317 grounding_loss_reg: 3.2981 detection_loss_cls: 0.0464 detection_loss_reg: 0.3706 semantic_segmentation_loss_cls: 0.0126 instance_segmentation_loss_cls: 0.0487 instance_segmentation_loss_reg: 0.3747 instance_segmentation_loss_poly: 1.0059 +2023/10/29 08:05:14 - mmengine - INFO - Saving checkpoint at 113000 iterations +2023/10/29 08:15:04 - mmengine - INFO - Iter(train) [113500/640000] base_lr: 1.8503e-04 lr: 1.8639e-05 eta: 6 days, 18:49:57 time: 1.1284 data_time: 0.0353 memory: 21522 grad_norm: 2.6330 loss: 1.5390 caption_loss_cls: 2.5292 grounding_loss_reg: 3.2953 detection_loss_cls: 0.0465 detection_loss_reg: 0.3710 semantic_segmentation_loss_cls: 0.0126 instance_segmentation_loss_cls: 0.0488 instance_segmentation_loss_reg: 0.3752 instance_segmentation_loss_poly: 1.0069 +2023/10/29 08:24:09 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231028_202629 +2023/10/29 08:24:09 - mmengine - INFO - Iter(train) [114000/640000] base_lr: 1.8490e-04 lr: 1.8627e-05 eta: 6 days, 18:38:00 time: 1.1283 data_time: 0.0352 memory: 21522 grad_norm: 2.6508 loss: 1.5469 caption_loss_cls: 2.5289 grounding_loss_reg: 3.2876 detection_loss_cls: 0.0466 detection_loss_reg: 0.3718 semantic_segmentation_loss_cls: 0.0126 instance_segmentation_loss_cls: 0.0490 instance_segmentation_loss_reg: 0.3762 instance_segmentation_loss_poly: 1.0097 +2023/10/29 08:24:09 - mmengine - INFO - Saving checkpoint at 114000 iterations +2023/10/29 08:32:58 - mmengine - INFO - Iter(train) [114500/640000] base_lr: 1.8477e-04 lr: 1.8616e-05 eta: 6 days, 18:22:54 time: 1.1156 data_time: 0.0347 memory: 21522 grad_norm: 2.6645 loss: 1.5382 caption_loss_cls: 2.5269 grounding_loss_reg: 3.2867 detection_loss_cls: 0.0467 detection_loss_reg: 0.3727 semantic_segmentation_loss_cls: 0.0126 instance_segmentation_loss_cls: 0.0489 instance_segmentation_loss_reg: 0.3757 instance_segmentation_loss_poly: 1.0092 +2023/10/29 08:42:04 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231028_202629 +2023/10/29 08:42:04 - mmengine - INFO - Iter(train) [115000/640000] base_lr: 1.8464e-04 lr: 1.8604e-05 eta: 6 days, 18:11:27 time: 1.1087 data_time: 0.0345 memory: 21522 grad_norm: 2.6412 loss: 1.5415 caption_loss_cls: 2.5267 grounding_loss_reg: 3.2842 detection_loss_cls: 0.0469 detection_loss_reg: 0.3746 semantic_segmentation_loss_cls: 0.0125 instance_segmentation_loss_cls: 0.0487 instance_segmentation_loss_reg: 0.3748 instance_segmentation_loss_poly: 1.0080 +2023/10/29 08:42:05 - mmengine - INFO - Saving checkpoint at 115000 iterations +2023/10/29 08:51:06 - mmengine - INFO - Iter(train) [115500/640000] base_lr: 1.8451e-04 lr: 1.8592e-05 eta: 6 days, 17:59:07 time: 1.1141 data_time: 0.0345 memory: 21522 grad_norm: 2.6248 loss: 1.5251 caption_loss_cls: 2.5231 grounding_loss_reg: 3.2819 detection_loss_cls: 0.0468 detection_loss_reg: 0.3736 semantic_segmentation_loss_cls: 0.0125 instance_segmentation_loss_cls: 0.0486 instance_segmentation_loss_reg: 0.3741 instance_segmentation_loss_poly: 1.0072 +2023/10/29 09:00:02 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231028_202629 +2023/10/29 09:00:02 - mmengine - INFO - Iter(train) [116000/640000] base_lr: 1.8438e-04 lr: 1.8580e-05 eta: 6 days, 17:45:40 time: 1.1050 data_time: 0.0341 memory: 21522 grad_norm: 2.6581 loss: 1.5290 caption_loss_cls: 2.5229 grounding_loss_reg: 3.2832 detection_loss_cls: 0.0466 detection_loss_reg: 0.3725 semantic_segmentation_loss_cls: 0.0125 instance_segmentation_loss_cls: 0.0485 instance_segmentation_loss_reg: 0.3736 instance_segmentation_loss_poly: 1.0050 +2023/10/29 09:00:02 - mmengine - INFO - Saving checkpoint at 116000 iterations +2023/10/29 09:09:13 - mmengine - INFO - Iter(train) [116500/640000] base_lr: 1.8425e-04 lr: 1.8568e-05 eta: 6 days, 17:35:29 time: 1.0942 data_time: 0.0338 memory: 21522 grad_norm: 2.7051 loss: 1.5408 caption_loss_cls: 2.5217 grounding_loss_reg: 3.2802 detection_loss_cls: 0.0466 detection_loss_reg: 0.3733 semantic_segmentation_loss_cls: 0.0125 instance_segmentation_loss_cls: 0.0485 instance_segmentation_loss_reg: 0.3740 instance_segmentation_loss_poly: 1.0056 +2023/10/29 09:18:50 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231028_202629 +2023/10/29 09:18:50 - mmengine - INFO - Iter(train) [117000/640000] base_lr: 1.8412e-04 lr: 1.8556e-05 eta: 6 days, 17:30:25 time: 1.1036 data_time: 0.0340 memory: 21522 grad_norm: 2.6944 loss: 1.5358 caption_loss_cls: 2.5213 grounding_loss_reg: 3.2781 detection_loss_cls: 0.0465 detection_loss_reg: 0.3731 semantic_segmentation_loss_cls: 0.0125 instance_segmentation_loss_cls: 0.0486 instance_segmentation_loss_reg: 0.3749 instance_segmentation_loss_poly: 1.0072 +2023/10/29 09:18:50 - mmengine - INFO - Saving checkpoint at 117000 iterations +2023/10/29 09:28:15 - mmengine - INFO - Iter(train) [117500/640000] base_lr: 1.8398e-04 lr: 1.8544e-05 eta: 6 days, 17:22:59 time: 1.0975 data_time: 0.0340 memory: 21522 grad_norm: 2.7156 loss: 1.5480 caption_loss_cls: 2.5188 grounding_loss_reg: 3.2752 detection_loss_cls: 0.0466 detection_loss_reg: 0.3743 semantic_segmentation_loss_cls: 0.0125 instance_segmentation_loss_cls: 0.0487 instance_segmentation_loss_reg: 0.3754 instance_segmentation_loss_poly: 1.0084 +2023/10/29 09:37:29 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231028_202629 +2023/10/29 09:37:29 - mmengine - INFO - Iter(train) [118000/640000] base_lr: 1.8385e-04 lr: 1.8532e-05 eta: 6 days, 17:13:23 time: 1.0999 data_time: 0.0341 memory: 21522 grad_norm: 2.7106 loss: 1.5476 caption_loss_cls: 2.5175 grounding_loss_reg: 3.2736 detection_loss_cls: 0.0468 detection_loss_reg: 0.3756 semantic_segmentation_loss_cls: 0.0125 instance_segmentation_loss_cls: 0.0487 instance_segmentation_loss_reg: 0.3747 instance_segmentation_loss_poly: 1.0077 +2023/10/29 09:37:29 - mmengine - INFO - Saving checkpoint at 118000 iterations +2023/10/29 09:47:30 - mmengine - INFO - Iter(train) [118500/640000] base_lr: 1.8372e-04 lr: 1.8520e-05 eta: 6 days, 17:12:52 time: 1.1177 data_time: 0.0359 memory: 21522 grad_norm: 2.6997 loss: 1.5459 caption_loss_cls: 2.5157 grounding_loss_reg: 3.2734 detection_loss_cls: 0.0466 detection_loss_reg: 0.3740 semantic_segmentation_loss_cls: 0.0124 instance_segmentation_loss_cls: 0.0484 instance_segmentation_loss_reg: 0.3741 instance_segmentation_loss_poly: 1.0058 +2023/10/29 09:56:42 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231028_202629 +2023/10/29 09:56:42 - mmengine - INFO - Iter(train) [119000/640000] base_lr: 1.8358e-04 lr: 1.8508e-05 eta: 6 days, 17:02:37 time: 1.1190 data_time: 0.0361 memory: 21522 grad_norm: 2.7315 loss: 1.5519 caption_loss_cls: 2.5144 grounding_loss_reg: 3.2715 detection_loss_cls: 0.0466 detection_loss_reg: 0.3745 semantic_segmentation_loss_cls: 0.0124 instance_segmentation_loss_cls: 0.0486 instance_segmentation_loss_reg: 0.3749 instance_segmentation_loss_poly: 1.0076 +2023/10/29 09:56:42 - mmengine - INFO - Saving checkpoint at 119000 iterations +2023/10/29 10:06:15 - mmengine - INFO - Iter(train) [119500/640000] base_lr: 1.8345e-04 lr: 1.8496e-05 eta: 6 days, 16:56:33 time: 1.1270 data_time: 0.0365 memory: 21522 grad_norm: 2.6978 loss: 1.5495 caption_loss_cls: 2.5143 grounding_loss_reg: 3.2728 detection_loss_cls: 0.0464 detection_loss_reg: 0.3739 semantic_segmentation_loss_cls: 0.0124 instance_segmentation_loss_cls: 0.0485 instance_segmentation_loss_reg: 0.3744 instance_segmentation_loss_poly: 1.0068 +2023/10/29 10:15:55 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231028_202629 +2023/10/29 10:15:55 - mmengine - INFO - Iter(train) [120000/640000] base_lr: 1.8332e-04 lr: 1.8483e-05 eta: 6 days, 16:51:36 time: 1.1379 data_time: 0.0369 memory: 21522 grad_norm: 2.6617 loss: 1.5426 caption_loss_cls: 2.5142 grounding_loss_reg: 3.2735 detection_loss_cls: 0.0464 detection_loss_reg: 0.3736 semantic_segmentation_loss_cls: 0.0124 instance_segmentation_loss_cls: 0.0485 instance_segmentation_loss_reg: 0.3743 instance_segmentation_loss_poly: 1.0061 +2023/10/29 10:15:55 - mmengine - INFO - Saving checkpoint at 120000 iterations +2023/10/29 10:24:37 - mmengine - INFO - Evaluating bbox... +2023/10/29 10:25:33 - mmengine - INFO - bbox_mAP_copypaste: 0.358 0.526 0.388 0.216 0.415 0.473 +2023/10/29 10:25:33 - mmengine - INFO - Evaluating segm... +2023/10/29 10:26:41 - mmengine - INFO - segm_mAP_copypaste: 0.227 0.438 0.213 0.106 0.270 0.369 +2023/10/29 10:31:20 - mmengine - INFO - per class results: +2023/10/29 10:31:20 - mmengine - INFO - ++---------------------+-------+-------+ +| Class | IoU | Acc | ++---------------------+-------+-------+ +| wall | 74.55 | 85.21 | +| building | 80.59 | 89.33 | +| sky | 92.56 | 97.08 | +| floor | 79.19 | 88.74 | +| tree | 69.45 | 87.27 | +| ceiling | 80.2 | 89.1 | +| road | 81.58 | 87.33 | +| bed | 85.08 | 93.11 | +| windowpane | 57.33 | 77.37 | +| grass | 65.18 | 76.99 | +| cabinet | 55.13 | 72.87 | +| sidewalk | 60.7 | 78.74 | +| person | 77.71 | 89.49 | +| earth | 37.21 | 52.55 | +| door | 43.4 | 61.53 | +| table | 51.43 | 73.72 | +| mountain | 56.62 | 74.22 | +| plant | 46.49 | 59.42 | +| curtain | 70.5 | 80.0 | +| chair | 50.86 | 68.89 | +| car | 80.17 | 89.0 | +| water | 37.0 | 44.82 | +| painting | 66.81 | 83.14 | +| sofa | 57.58 | 65.06 | +| shelf | 37.21 | 69.29 | +| house | 48.43 | 76.48 | +| sea | 48.98 | 73.15 | +| mirror | 58.15 | 75.75 | +| rug | 58.54 | 62.8 | +| field | 29.6 | 47.36 | +| armchair | 37.53 | 55.7 | +| seat | 56.34 | 78.1 | +| fence | 32.88 | 47.53 | +| desk | 35.29 | 60.1 | +| rock | 31.75 | 47.7 | +| wardrobe | 51.7 | 60.51 | +| lamp | 53.51 | 67.6 | +| bathtub | 65.34 | 71.12 | +| railing | 27.01 | 47.36 | +| cushion | 47.52 | 60.97 | +| base | 17.21 | 24.67 | +| box | 18.34 | 24.48 | +| column | 45.76 | 66.44 | +| signboard | 31.23 | 39.5 | +| chest of drawers | 26.6 | 38.2 | +| counter | 37.0 | 56.5 | +| sand | 28.21 | 46.75 | +| sink | 60.81 | 78.1 | +| skyscraper | 62.01 | 75.39 | +| fireplace | 61.48 | 81.64 | +| refrigerator | 61.55 | 83.0 | +| grandstand | 34.99 | 71.98 | +| path | 23.72 | 27.73 | +| stairs | 29.16 | 36.57 | +| runway | 77.7 | 88.81 | +| case | 7.09 | 7.16 | +| pool table | 90.12 | 92.96 | +| pillow | 48.31 | 64.81 | +| screen door | 44.83 | 46.16 | +| stairway | 34.35 | 39.87 | +| river | 13.56 | 54.33 | +| bridge | 44.22 | 67.3 | +| bookcase | 32.94 | 52.58 | +| blind | 22.52 | 25.22 | +| coffee table | 56.93 | 68.2 | +| toilet | 79.17 | 86.41 | +| flower | 31.05 | 43.76 | +| book | 40.84 | 59.57 | +| hill | 14.24 | 23.02 | +| bench | 41.87 | 50.89 | +| countertop | 47.93 | 60.77 | +| stove | 61.64 | 73.72 | +| palm | 43.03 | 57.85 | +| kitchen island | 31.44 | 56.9 | +| computer | 64.74 | 77.69 | +| swivel chair | 44.3 | 68.51 | +| boat | 68.24 | 78.67 | +| bar | 20.02 | 22.99 | +| arcade machine | 35.47 | 39.16 | +| hovel | 13.16 | 14.24 | +| bus | 75.48 | 94.17 | +| towel | 54.87 | 69.25 | +| light | 41.67 | 47.76 | +| truck | 30.03 | 56.36 | +| tower | 28.0 | 61.62 | +| chandelier | 61.66 | 82.92 | +| awning | 23.2 | 39.04 | +| streetlight | 24.37 | 33.47 | +| booth | 32.82 | 42.98 | +| television receiver | 62.36 | 76.25 | +| airplane | 55.61 | 64.46 | +| dirt track | 4.4 | 29.07 | +| apparel | 15.95 | 26.19 | +| pole | 24.25 | 38.13 | +| land | 0.01 | 0.02 | +| bannister | 5.4 | 7.0 | +| escalator | 3.7 | 3.72 | +| ottoman | 27.11 | 74.6 | +| bottle | 18.95 | 23.1 | +| buffet | 34.38 | 36.36 | +| poster | 24.0 | 29.7 | +| stage | 10.37 | 21.5 | +| van | 31.42 | 40.24 | +| ship | 9.39 | 11.09 | +| fountain | 3.19 | 3.28 | +| conveyer belt | 61.65 | 64.32 | +| canopy | 36.01 | 51.6 | +| washer | 65.18 | 70.96 | +| plaything | 16.75 | 53.14 | +| swimming pool | 35.82 | 44.64 | +| stool | 37.08 | 47.86 | +| barrel | 31.3 | 48.16 | +| basket | 23.39 | 32.14 | +| waterfall | 44.67 | 56.9 | +| tent | 90.91 | 97.14 | +| bag | 13.89 | 21.16 | +| minibike | 65.27 | 74.8 | +| cradle | 63.98 | 82.46 | +| oven | 12.93 | 66.66 | +| ball | 36.72 | 48.04 | +| food | 38.76 | 44.25 | +| step | 11.28 | 13.75 | +| tank | 35.82 | 66.58 | +| trade name | 16.95 | 18.09 | +| microwave | 50.1 | 55.89 | +| pot | 35.21 | 41.28 | +| animal | 58.8 | 62.81 | +| bicycle | 54.36 | 72.68 | +| lake | 36.08 | 40.02 | +| dishwasher | 35.3 | 43.28 | +| screen | 66.83 | 84.05 | +| blanket | 3.08 | 3.36 | +| sculpture | 42.28 | 58.19 | +| hood | 42.71 | 45.18 | +| sconce | 27.61 | 31.89 | +| vase | 30.18 | 37.14 | +| traffic light | 28.0 | 47.62 | +| tray | 4.8 | 18.71 | +| ashcan | 30.2 | 41.41 | +| fan | 42.39 | 71.02 | +| pier | 55.68 | 69.31 | +| crt screen | 3.81 | 8.78 | +| plate | 47.21 | 54.23 | +| monitor | 5.35 | 6.14 | +| bulletin board | 28.25 | 33.78 | +| shower | 1.62 | 13.52 | +| radiator | 42.53 | 49.99 | +| glass | 8.34 | 8.52 | +| clock | 16.8 | 19.68 | +| flag | 38.39 | 49.36 | ++---------------------+-------+-------+ +2023/10/29 10:31:35 - mmengine - INFO - Iter(val) [209/209] coco/bbox_mAP: 0.3580 coco/bbox_mAP_50: 0.5260 coco/bbox_mAP_75: 0.3880 coco/bbox_mAP_s: 0.2160 coco/bbox_mAP_m: 0.4150 coco/bbox_mAP_l: 0.4730 coco/segm_mAP: 0.2270 coco/segm_mAP_50: 0.4380 coco/segm_mAP_75: 0.2130 coco/segm_mAP_s: 0.1060 coco/segm_mAP_m: 0.2700 coco/segm_mAP_l: 0.3690 Bleu_1: 0.6963 Bleu_2: 0.5182 Bleu_3: 0.3736 Bleu_4: 0.2687 METEOR: 0.2372 ROUGE_L: 0.5107 CIDEr: 0.8440 SPICE: 0.1667 aAcc: 79.8700 mIoU: 41.3500 mAcc: 54.1500 visual-grounding/miou: 0.7132 visual-grounding/acc: 0.8009 data_time: 0.0047 time: 0.5243 +2023/10/29 10:40:45 - mmengine - INFO - Iter(train) [120500/640000] base_lr: 1.8318e-04 lr: 1.8471e-05 eta: 6 days, 16:41:23 time: 1.1380 data_time: 0.0340 memory: 21522 grad_norm: 2.6411 loss: 1.5400 caption_loss_cls: 2.5152 grounding_loss_reg: 3.2769 detection_loss_cls: 0.0464 detection_loss_reg: 0.3733 semantic_segmentation_loss_cls: 0.0124 instance_segmentation_loss_cls: 0.0488 instance_segmentation_loss_reg: 0.3751 instance_segmentation_loss_poly: 1.0080 +2023/10/29 10:50:21 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231028_202629 +2023/10/29 10:50:21 - mmengine - INFO - Iter(train) [121000/640000] base_lr: 1.8304e-04 lr: 1.8459e-05 eta: 6 days, 16:35:39 time: 1.1380 data_time: 0.0341 memory: 21522 grad_norm: 2.5898 loss: 1.5290 caption_loss_cls: 2.5128 grounding_loss_reg: 3.2750 detection_loss_cls: 0.0464 detection_loss_reg: 0.3736 semantic_segmentation_loss_cls: 0.0124 instance_segmentation_loss_cls: 0.0489 instance_segmentation_loss_reg: 0.3756 instance_segmentation_loss_poly: 1.0090 +2023/10/29 10:50:21 - mmengine - INFO - Saving checkpoint at 121000 iterations +2023/10/29 10:59:52 - mmengine - INFO - Iter(train) [121500/640000] base_lr: 1.8291e-04 lr: 1.8446e-05 eta: 6 days, 16:28:55 time: 1.1395 data_time: 0.0343 memory: 21522 grad_norm: 2.5807 loss: 1.5255 caption_loss_cls: 2.5128 grounding_loss_reg: 3.2712 detection_loss_cls: 0.0463 detection_loss_reg: 0.3732 semantic_segmentation_loss_cls: 0.0124 instance_segmentation_loss_cls: 0.0489 instance_segmentation_loss_reg: 0.3749 instance_segmentation_loss_poly: 1.0069 +2023/10/29 11:09:32 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231028_202629 +2023/10/29 11:09:32 - mmengine - INFO - Iter(train) [122000/640000] base_lr: 1.8277e-04 lr: 1.8434e-05 eta: 6 days, 16:23:40 time: 1.1458 data_time: 0.0347 memory: 21522 grad_norm: 2.5618 loss: 1.5208 caption_loss_cls: 2.5100 grounding_loss_reg: 3.2699 detection_loss_cls: 0.0464 detection_loss_reg: 0.3739 semantic_segmentation_loss_cls: 0.0124 instance_segmentation_loss_cls: 0.0489 instance_segmentation_loss_reg: 0.3748 instance_segmentation_loss_poly: 1.0059 +2023/10/29 11:09:32 - mmengine - INFO - Saving checkpoint at 122000 iterations +2023/10/29 11:19:29 - mmengine - INFO - Iter(train) [122500/640000] base_lr: 1.8263e-04 lr: 1.8421e-05 eta: 6 days, 16:21:25 time: 1.1449 data_time: 0.0339 memory: 21522 grad_norm: 2.5695 loss: 1.5275 caption_loss_cls: 2.5074 grounding_loss_reg: 3.2660 detection_loss_cls: 0.0465 detection_loss_reg: 0.3738 semantic_segmentation_loss_cls: 0.0124 instance_segmentation_loss_cls: 0.0490 instance_segmentation_loss_reg: 0.3761 instance_segmentation_loss_poly: 1.0080 +2023/10/29 11:28:53 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231028_202629 +2023/10/29 11:28:53 - mmengine - INFO - Iter(train) [123000/640000] base_lr: 1.8250e-04 lr: 1.8409e-05 eta: 6 days, 16:13:10 time: 1.1479 data_time: 0.0338 memory: 21522 grad_norm: 2.5280 loss: 1.5029 caption_loss_cls: 2.5089 grounding_loss_reg: 3.2656 detection_loss_cls: 0.0464 detection_loss_reg: 0.3732 semantic_segmentation_loss_cls: 0.0124 instance_segmentation_loss_cls: 0.0489 instance_segmentation_loss_reg: 0.3759 instance_segmentation_loss_poly: 1.0075 +2023/10/29 11:28:53 - mmengine - INFO - Saving checkpoint at 123000 iterations +2023/10/29 11:38:14 - mmengine - INFO - Iter(train) [123500/640000] base_lr: 1.8236e-04 lr: 1.8396e-05 eta: 6 days, 16:04:21 time: 1.1448 data_time: 0.0338 memory: 21522 grad_norm: 2.5358 loss: 1.5097 caption_loss_cls: 2.5089 grounding_loss_reg: 3.2645 detection_loss_cls: 0.0464 detection_loss_reg: 0.3741 semantic_segmentation_loss_cls: 0.0124 instance_segmentation_loss_cls: 0.0489 instance_segmentation_loss_reg: 0.3764 instance_segmentation_loss_poly: 1.0084 +2023/10/29 11:47:40 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231028_202629 +2023/10/29 11:47:40 - mmengine - INFO - Iter(train) [124000/640000] base_lr: 1.8222e-04 lr: 1.8384e-05 eta: 6 days, 15:56:25 time: 1.1413 data_time: 0.0336 memory: 21522 grad_norm: 2.5628 loss: 1.5160 caption_loss_cls: 2.5100 grounding_loss_reg: 3.2622 detection_loss_cls: 0.0464 detection_loss_reg: 0.3737 semantic_segmentation_loss_cls: 0.0123 instance_segmentation_loss_cls: 0.0487 instance_segmentation_loss_reg: 0.3747 instance_segmentation_loss_poly: 1.0044 +2023/10/29 11:47:40 - mmengine - INFO - Saving checkpoint at 124000 iterations +2023/10/29 11:56:58 - mmengine - INFO - Iter(train) [124500/640000] base_lr: 1.8208e-04 lr: 1.8371e-05 eta: 6 days, 15:47:11 time: 1.1430 data_time: 0.0363 memory: 21522 grad_norm: 2.5504 loss: 1.5044 caption_loss_cls: 2.5085 grounding_loss_reg: 3.2609 detection_loss_cls: 0.0465 detection_loss_reg: 0.3743 semantic_segmentation_loss_cls: 0.0124 instance_segmentation_loss_cls: 0.0485 instance_segmentation_loss_reg: 0.3735 instance_segmentation_loss_poly: 1.0017 +2023/10/29 12:05:56 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231028_202629 +2023/10/29 12:05:56 - mmengine - INFO - Iter(train) [125000/640000] base_lr: 1.8194e-04 lr: 1.8358e-05 eta: 6 days, 15:34:34 time: 1.1335 data_time: 0.0361 memory: 21522 grad_norm: 2.6114 loss: 1.5166 caption_loss_cls: 2.5046 grounding_loss_reg: 3.2574 detection_loss_cls: 0.0464 detection_loss_reg: 0.3738 semantic_segmentation_loss_cls: 0.0124 instance_segmentation_loss_cls: 0.0484 instance_segmentation_loss_reg: 0.3732 instance_segmentation_loss_poly: 1.0010 +2023/10/29 12:05:56 - mmengine - INFO - Saving checkpoint at 125000 iterations +2023/10/29 12:15:20 - mmengine - INFO - Iter(train) [125500/640000] base_lr: 1.8180e-04 lr: 1.8346e-05 eta: 6 days, 15:26:17 time: 1.1317 data_time: 0.0356 memory: 21522 grad_norm: 2.6031 loss: 1.4955 caption_loss_cls: 2.5056 grounding_loss_reg: 3.2574 detection_loss_cls: 0.0461 detection_loss_reg: 0.3720 semantic_segmentation_loss_cls: 0.0123 instance_segmentation_loss_cls: 0.0483 instance_segmentation_loss_reg: 0.3725 instance_segmentation_loss_poly: 0.9996 +2023/10/29 12:24:41 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231028_202629 +2023/10/29 12:24:41 - mmengine - INFO - Iter(train) [126000/640000] base_lr: 1.8166e-04 lr: 1.8333e-05 eta: 6 days, 15:17:27 time: 1.1270 data_time: 0.0356 memory: 21522 grad_norm: 2.6242 loss: 1.5056 caption_loss_cls: 2.5064 grounding_loss_reg: 3.2576 detection_loss_cls: 0.0460 detection_loss_reg: 0.3719 semantic_segmentation_loss_cls: 0.0123 instance_segmentation_loss_cls: 0.0483 instance_segmentation_loss_reg: 0.3722 instance_segmentation_loss_poly: 0.9985 +2023/10/29 12:24:41 - mmengine - INFO - Saving checkpoint at 126000 iterations +2023/10/29 12:33:30 - mmengine - INFO - Iter(train) [126500/640000] base_lr: 1.8152e-04 lr: 1.8320e-05 eta: 6 days, 15:03:22 time: 1.1099 data_time: 0.0346 memory: 21522 grad_norm: 2.6407 loss: 1.5060 caption_loss_cls: 2.5049 grounding_loss_reg: 3.2529 detection_loss_cls: 0.0459 detection_loss_reg: 0.3710 semantic_segmentation_loss_cls: 0.0123 instance_segmentation_loss_cls: 0.0483 instance_segmentation_loss_reg: 0.3723 instance_segmentation_loss_poly: 0.9986 +2023/10/29 12:43:24 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231028_202629 +2023/10/29 12:43:24 - mmengine - INFO - Iter(train) [127000/640000] base_lr: 1.8138e-04 lr: 1.8307e-05 eta: 6 days, 14:59:57 time: 1.1175 data_time: 0.0353 memory: 21522 grad_norm: 2.6421 loss: 1.5085 caption_loss_cls: 2.5024 grounding_loss_reg: 3.2533 detection_loss_cls: 0.0458 detection_loss_reg: 0.3711 semantic_segmentation_loss_cls: 0.0123 instance_segmentation_loss_cls: 0.0482 instance_segmentation_loss_reg: 0.3718 instance_segmentation_loss_poly: 0.9977 +2023/10/29 12:43:24 - mmengine - INFO - Saving checkpoint at 127000 iterations +2023/10/29 12:52:45 - mmengine - INFO - Iter(train) [127500/640000] base_lr: 1.8124e-04 lr: 1.8294e-05 eta: 6 days, 14:51:08 time: 1.1175 data_time: 0.0353 memory: 21522 grad_norm: 2.6570 loss: 1.5115 caption_loss_cls: 2.5003 grounding_loss_reg: 3.2515 detection_loss_cls: 0.0458 detection_loss_reg: 0.3708 semantic_segmentation_loss_cls: 0.0123 instance_segmentation_loss_cls: 0.0482 instance_segmentation_loss_reg: 0.3731 instance_segmentation_loss_poly: 1.0001 +2023/10/29 13:01:58 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231028_202629 +2023/10/29 13:01:58 - mmengine - INFO - Iter(train) [128000/640000] base_lr: 1.8109e-04 lr: 1.8281e-05 eta: 6 days, 14:41:02 time: 1.1143 data_time: 0.0354 memory: 21522 grad_norm: 2.6563 loss: 1.5066 caption_loss_cls: 2.5000 grounding_loss_reg: 3.2472 detection_loss_cls: 0.0458 detection_loss_reg: 0.3711 semantic_segmentation_loss_cls: 0.0122 instance_segmentation_loss_cls: 0.0483 instance_segmentation_loss_reg: 0.3739 instance_segmentation_loss_poly: 1.0010 +2023/10/29 13:01:58 - mmengine - INFO - Saving checkpoint at 128000 iterations +2023/10/29 13:10:59 - mmengine - INFO - Iter(train) [128500/640000] base_lr: 1.8095e-04 lr: 1.8268e-05 eta: 6 days, 14:29:04 time: 1.1099 data_time: 0.0353 memory: 21522 grad_norm: 2.6690 loss: 1.5030 caption_loss_cls: 2.4971 grounding_loss_reg: 3.2465 detection_loss_cls: 0.0457 detection_loss_reg: 0.3710 semantic_segmentation_loss_cls: 0.0122 instance_segmentation_loss_cls: 0.0483 instance_segmentation_loss_reg: 0.3742 instance_segmentation_loss_poly: 1.0020 +2023/10/29 13:20:16 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231028_202629 +2023/10/29 13:20:16 - mmengine - INFO - Iter(train) [129000/640000] base_lr: 1.8081e-04 lr: 1.8255e-05 eta: 6 days, 14:19:39 time: 1.1146 data_time: 0.0355 memory: 21522 grad_norm: 2.6620 loss: 1.5153 caption_loss_cls: 2.4971 grounding_loss_reg: 3.2445 detection_loss_cls: 0.0458 detection_loss_reg: 0.3721 semantic_segmentation_loss_cls: 0.0122 instance_segmentation_loss_cls: 0.0482 instance_segmentation_loss_reg: 0.3739 instance_segmentation_loss_poly: 1.0015 +2023/10/29 13:20:16 - mmengine - INFO - Saving checkpoint at 129000 iterations +2023/10/29 13:29:27 - mmengine - INFO - Iter(train) [129500/640000] base_lr: 1.8066e-04 lr: 1.8242e-05 eta: 6 days, 14:09:16 time: 1.1113 data_time: 0.0357 memory: 21522 grad_norm: 2.6719 loss: 1.5322 caption_loss_cls: 2.4962 grounding_loss_reg: 3.2469 detection_loss_cls: 0.0458 detection_loss_reg: 0.3722 semantic_segmentation_loss_cls: 0.0122 instance_segmentation_loss_cls: 0.0481 instance_segmentation_loss_reg: 0.3743 instance_segmentation_loss_poly: 1.0016 +2023/10/29 13:37:40 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231028_202629 +2023/10/29 13:37:40 - mmengine - INFO - Iter(train) [130000/640000] base_lr: 1.8052e-04 lr: 1.8229e-05 eta: 6 days, 13:50:14 time: 1.0945 data_time: 0.0349 memory: 21522 grad_norm: 2.7055 loss: 1.5338 caption_loss_cls: 2.4961 grounding_loss_reg: 3.2434 detection_loss_cls: 0.0458 detection_loss_reg: 0.3721 semantic_segmentation_loss_cls: 0.0122 instance_segmentation_loss_cls: 0.0480 instance_segmentation_loss_reg: 0.3736 instance_segmentation_loss_poly: 1.0005 +2023/10/29 13:37:40 - mmengine - INFO - Saving checkpoint at 130000 iterations +2023/10/29 13:47:12 - mmengine - INFO - Iter(train) [130500/640000] base_lr: 1.8037e-04 lr: 1.8216e-05 eta: 6 days, 13:43:11 time: 1.1054 data_time: 0.0353 memory: 21522 grad_norm: 2.6704 loss: 1.5214 caption_loss_cls: 2.4937 grounding_loss_reg: 3.2420 detection_loss_cls: 0.0457 detection_loss_reg: 0.3716 semantic_segmentation_loss_cls: 0.0122 instance_segmentation_loss_cls: 0.0479 instance_segmentation_loss_reg: 0.3737 instance_segmentation_loss_poly: 1.0005 +2023/10/29 13:56:20 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231028_202629 +2023/10/29 13:56:20 - mmengine - INFO - Iter(train) [131000/640000] base_lr: 1.8023e-04 lr: 1.8202e-05 eta: 6 days, 13:32:30 time: 1.0938 data_time: 0.0347 memory: 21522 grad_norm: 2.7177 loss: 1.5368 caption_loss_cls: 2.4919 grounding_loss_reg: 3.2413 detection_loss_cls: 0.0457 detection_loss_reg: 0.3722 semantic_segmentation_loss_cls: 0.0122 instance_segmentation_loss_cls: 0.0480 instance_segmentation_loss_reg: 0.3745 instance_segmentation_loss_poly: 1.0011 +2023/10/29 13:56:20 - mmengine - INFO - Saving checkpoint at 131000 iterations +2023/10/29 14:06:14 - mmengine - INFO - Iter(train) [131500/640000] base_lr: 1.8008e-04 lr: 1.8189e-05 eta: 6 days, 13:28:32 time: 1.1019 data_time: 0.0350 memory: 21522 grad_norm: 2.7084 loss: 1.5296 caption_loss_cls: 2.4929 grounding_loss_reg: 3.2428 detection_loss_cls: 0.0456 detection_loss_reg: 0.3730 semantic_segmentation_loss_cls: 0.0122 instance_segmentation_loss_cls: 0.0480 instance_segmentation_loss_reg: 0.3742 instance_segmentation_loss_poly: 0.9998 +2023/10/29 14:15:18 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231028_202629 +2023/10/29 14:15:18 - mmengine - INFO - Iter(train) [132000/640000] base_lr: 1.7994e-04 lr: 1.8176e-05 eta: 6 days, 13:17:18 time: 1.0998 data_time: 0.0355 memory: 21522 grad_norm: 2.7241 loss: 1.5302 caption_loss_cls: 2.4888 grounding_loss_reg: 3.2405 detection_loss_cls: 0.0456 detection_loss_reg: 0.3730 semantic_segmentation_loss_cls: 0.0122 instance_segmentation_loss_cls: 0.0480 instance_segmentation_loss_reg: 0.3736 instance_segmentation_loss_poly: 0.9986 +2023/10/29 14:15:18 - mmengine - INFO - Saving checkpoint at 132000 iterations +2023/10/29 14:25:19 - mmengine - INFO - Iter(train) [132500/640000] base_lr: 1.7979e-04 lr: 1.8163e-05 eta: 6 days, 13:14:22 time: 1.1149 data_time: 0.0363 memory: 21522 grad_norm: 2.6854 loss: 1.5346 caption_loss_cls: 2.4918 grounding_loss_reg: 3.2405 detection_loss_cls: 0.0457 detection_loss_reg: 0.3730 semantic_segmentation_loss_cls: 0.0122 instance_segmentation_loss_cls: 0.0478 instance_segmentation_loss_reg: 0.3739 instance_segmentation_loss_poly: 0.9990 +2023/10/29 14:34:35 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231028_202629 +2023/10/29 14:34:35 - mmengine - INFO - Iter(train) [133000/640000] base_lr: 1.7964e-04 lr: 1.8149e-05 eta: 6 days, 13:04:49 time: 1.1146 data_time: 0.0362 memory: 21522 grad_norm: 2.6819 loss: 1.5214 caption_loss_cls: 2.4903 grounding_loss_reg: 3.2393 detection_loss_cls: 0.0456 detection_loss_reg: 0.3720 semantic_segmentation_loss_cls: 0.0122 instance_segmentation_loss_cls: 0.0477 instance_segmentation_loss_reg: 0.3734 instance_segmentation_loss_poly: 0.9984 +2023/10/29 14:34:35 - mmengine - INFO - Saving checkpoint at 133000 iterations +2023/10/29 14:44:10 - mmengine - INFO - Iter(train) [133500/640000] base_lr: 1.7949e-04 lr: 1.8136e-05 eta: 6 days, 12:57:57 time: 1.1206 data_time: 0.0363 memory: 21522 grad_norm: 2.6730 loss: 1.5139 caption_loss_cls: 2.4884 grounding_loss_reg: 3.2398 detection_loss_cls: 0.0455 detection_loss_reg: 0.3729 semantic_segmentation_loss_cls: 0.0122 instance_segmentation_loss_cls: 0.0476 instance_segmentation_loss_reg: 0.3730 instance_segmentation_loss_poly: 0.9960 +2023/10/29 14:53:22 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231028_202629 +2023/10/29 14:53:22 - mmengine - INFO - Iter(train) [134000/640000] base_lr: 1.7934e-04 lr: 1.8122e-05 eta: 6 days, 12:47:43 time: 1.1351 data_time: 0.0368 memory: 21522 grad_norm: 2.6369 loss: 1.5091 caption_loss_cls: 2.4936 grounding_loss_reg: 3.2400 detection_loss_cls: 0.0453 detection_loss_reg: 0.3716 semantic_segmentation_loss_cls: 0.0122 instance_segmentation_loss_cls: 0.0475 instance_segmentation_loss_reg: 0.3730 instance_segmentation_loss_poly: 0.9954 +2023/10/29 14:53:22 - mmengine - INFO - Saving checkpoint at 134000 iterations +2023/10/29 15:02:58 - mmengine - INFO - Iter(train) [134500/640000] base_lr: 1.7920e-04 lr: 1.8109e-05 eta: 6 days, 12:40:56 time: 1.1360 data_time: 0.0370 memory: 21522 grad_norm: 2.6591 loss: 1.5202 caption_loss_cls: 2.4895 grounding_loss_reg: 3.2381 detection_loss_cls: 0.0452 detection_loss_reg: 0.3709 semantic_segmentation_loss_cls: 0.0121 instance_segmentation_loss_cls: 0.0476 instance_segmentation_loss_reg: 0.3745 instance_segmentation_loss_poly: 0.9985 +2023/10/29 15:12:30 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231028_202629 +2023/10/29 15:12:30 - mmengine - INFO - Iter(train) [135000/640000] base_lr: 1.7905e-04 lr: 1.8095e-05 eta: 6 days, 12:33:34 time: 1.1421 data_time: 0.0373 memory: 21522 grad_norm: 2.6214 loss: 1.5156 caption_loss_cls: 2.4919 grounding_loss_reg: 3.2368 detection_loss_cls: 0.0452 detection_loss_reg: 0.3709 semantic_segmentation_loss_cls: 0.0121 instance_segmentation_loss_cls: 0.0476 instance_segmentation_loss_reg: 0.3755 instance_segmentation_loss_poly: 0.9994 +2023/10/29 15:12:30 - mmengine - INFO - Saving checkpoint at 135000 iterations +2023/10/29 15:22:13 - mmengine - INFO - Iter(train) [135500/640000] base_lr: 1.7890e-04 lr: 1.8082e-05 eta: 6 days, 12:27:41 time: 1.1395 data_time: 0.0373 memory: 21522 grad_norm: 2.6080 loss: 1.5089 caption_loss_cls: 2.4915 grounding_loss_reg: 3.2335 detection_loss_cls: 0.0452 detection_loss_reg: 0.3707 semantic_segmentation_loss_cls: 0.0121 instance_segmentation_loss_cls: 0.0476 instance_segmentation_loss_reg: 0.3756 instance_segmentation_loss_poly: 0.9996 +2023/10/29 15:30:54 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231028_202629 +2023/10/29 15:30:54 - mmengine - INFO - Iter(train) [136000/640000] base_lr: 1.7875e-04 lr: 1.8068e-05 eta: 6 days, 12:13:18 time: 1.1337 data_time: 0.0361 memory: 21522 grad_norm: 2.5779 loss: 1.5049 caption_loss_cls: 2.4943 grounding_loss_reg: 3.2306 detection_loss_cls: 0.0452 detection_loss_reg: 0.3711 semantic_segmentation_loss_cls: 0.0121 instance_segmentation_loss_cls: 0.0476 instance_segmentation_loss_reg: 0.3759 instance_segmentation_loss_poly: 1.0002 +2023/10/29 15:30:54 - mmengine - INFO - Saving checkpoint at 136000 iterations +2023/10/29 15:40:31 - mmengine - INFO - Iter(train) [136500/640000] base_lr: 1.7860e-04 lr: 1.8054e-05 eta: 6 days, 12:06:36 time: 1.1277 data_time: 0.0354 memory: 21522 grad_norm: 2.6078 loss: 1.5057 caption_loss_cls: 2.4938 grounding_loss_reg: 3.2305 detection_loss_cls: 0.0452 detection_loss_reg: 0.3714 semantic_segmentation_loss_cls: 0.0121 instance_segmentation_loss_cls: 0.0475 instance_segmentation_loss_reg: 0.3747 instance_segmentation_loss_poly: 0.9972 +2023/10/29 15:49:32 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231028_202629 +2023/10/29 15:49:32 - mmengine - INFO - Iter(train) [137000/640000] base_lr: 1.7844e-04 lr: 1.8040e-05 eta: 6 days, 11:54:58 time: 1.1238 data_time: 0.0352 memory: 21522 grad_norm: 2.6111 loss: 1.5123 caption_loss_cls: 2.4933 grounding_loss_reg: 3.2307 detection_loss_cls: 0.0451 detection_loss_reg: 0.3710 semantic_segmentation_loss_cls: 0.0121 instance_segmentation_loss_cls: 0.0473 instance_segmentation_loss_reg: 0.3732 instance_segmentation_loss_poly: 0.9948 +2023/10/29 15:49:32 - mmengine - INFO - Saving checkpoint at 137000 iterations +2023/10/29 15:58:53 - mmengine - INFO - Iter(train) [137500/640000] base_lr: 1.7829e-04 lr: 1.8027e-05 eta: 6 days, 11:46:06 time: 1.1205 data_time: 0.0352 memory: 21522 grad_norm: 2.6231 loss: 1.5164 caption_loss_cls: 2.4918 grounding_loss_reg: 3.2295 detection_loss_cls: 0.0451 detection_loss_reg: 0.3706 semantic_segmentation_loss_cls: 0.0121 instance_segmentation_loss_cls: 0.0472 instance_segmentation_loss_reg: 0.3723 instance_segmentation_loss_poly: 0.9923 +2023/10/29 16:08:30 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231028_202629 +2023/10/29 16:08:30 - mmengine - INFO - Iter(train) [138000/640000] base_lr: 1.7814e-04 lr: 1.8013e-05 eta: 6 days, 11:39:15 time: 1.1268 data_time: 0.0354 memory: 21522 grad_norm: 2.6170 loss: 1.5139 caption_loss_cls: 2.4966 grounding_loss_reg: 3.2277 detection_loss_cls: 0.0449 detection_loss_reg: 0.3686 semantic_segmentation_loss_cls: 0.0121 instance_segmentation_loss_cls: 0.0472 instance_segmentation_loss_reg: 0.3726 instance_segmentation_loss_poly: 0.9926 +2023/10/29 16:08:30 - mmengine - INFO - Saving checkpoint at 138000 iterations +2023/10/29 16:18:17 - mmengine - INFO - Iter(train) [138500/640000] base_lr: 1.7799e-04 lr: 1.7999e-05 eta: 6 days, 11:33:40 time: 1.1296 data_time: 0.0374 memory: 21522 grad_norm: 2.5856 loss: 1.4960 caption_loss_cls: 2.4943 grounding_loss_reg: 3.2293 detection_loss_cls: 0.0447 detection_loss_reg: 0.3678 semantic_segmentation_loss_cls: 0.0121 instance_segmentation_loss_cls: 0.0471 instance_segmentation_loss_reg: 0.3716 instance_segmentation_loss_poly: 0.9909 +2023/10/29 16:27:36 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231028_202629 +2023/10/29 16:27:36 - mmengine - INFO - Iter(train) [139000/640000] base_lr: 1.7784e-04 lr: 1.7985e-05 eta: 6 days, 11:24:26 time: 1.1263 data_time: 0.0373 memory: 21522 grad_norm: 2.6083 loss: 1.4954 caption_loss_cls: 2.4954 grounding_loss_reg: 3.2254 detection_loss_cls: 0.0447 detection_loss_reg: 0.3671 semantic_segmentation_loss_cls: 0.0121 instance_segmentation_loss_cls: 0.0472 instance_segmentation_loss_reg: 0.3717 instance_segmentation_loss_poly: 0.9908 +2023/10/29 16:27:36 - mmengine - INFO - Saving checkpoint at 139000 iterations +2023/10/29 16:37:32 - mmengine - INFO - Iter(train) [139500/640000] base_lr: 1.7768e-04 lr: 1.7971e-05 eta: 6 days, 11:19:48 time: 1.1293 data_time: 0.0372 memory: 21522 grad_norm: 2.6027 loss: 1.4881 caption_loss_cls: 2.4916 grounding_loss_reg: 3.2213 detection_loss_cls: 0.0448 detection_loss_reg: 0.3679 semantic_segmentation_loss_cls: 0.0121 instance_segmentation_loss_cls: 0.0470 instance_segmentation_loss_reg: 0.3709 instance_segmentation_loss_poly: 0.9882 +2023/10/29 16:46:44 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231028_202629 +2023/10/29 16:46:44 - mmengine - INFO - Iter(train) [140000/640000] base_lr: 1.7753e-04 lr: 1.7957e-05 eta: 6 days, 11:09:40 time: 1.1372 data_time: 0.0373 memory: 21522 grad_norm: 2.5981 loss: 1.4773 caption_loss_cls: 2.4873 grounding_loss_reg: 3.2165 detection_loss_cls: 0.0447 detection_loss_reg: 0.3676 semantic_segmentation_loss_cls: 0.0121 instance_segmentation_loss_cls: 0.0467 instance_segmentation_loss_reg: 0.3694 instance_segmentation_loss_poly: 0.9849 +2023/10/29 16:46:44 - mmengine - INFO - Saving checkpoint at 140000 iterations +2023/10/29 16:55:32 - mmengine - INFO - Evaluating bbox... +2023/10/29 16:56:28 - mmengine - INFO - bbox_mAP_copypaste: 0.375 0.548 0.408 0.226 0.426 0.491 +2023/10/29 16:56:28 - mmengine - INFO - Evaluating segm... +2023/10/29 16:57:39 - mmengine - INFO - segm_mAP_copypaste: 0.234 0.447 0.219 0.105 0.274 0.384 +2023/10/29 17:02:32 - mmengine - INFO - per class results: +2023/10/29 17:02:32 - mmengine - INFO - ++---------------------+-------+-------+ +| Class | IoU | Acc | ++---------------------+-------+-------+ +| wall | 74.99 | 85.98 | +| building | 80.58 | 91.12 | +| sky | 92.34 | 97.2 | +| floor | 78.66 | 88.07 | +| tree | 71.84 | 85.51 | +| ceiling | 81.86 | 90.55 | +| road | 80.13 | 87.8 | +| bed | 83.78 | 94.46 | +| windowpane | 57.29 | 78.14 | +| grass | 66.45 | 81.93 | +| cabinet | 51.75 | 67.15 | +| sidewalk | 60.18 | 82.74 | +| person | 77.7 | 91.25 | +| earth | 36.11 | 51.3 | +| door | 40.56 | 54.07 | +| table | 53.56 | 75.72 | +| mountain | 50.11 | 62.15 | +| plant | 46.84 | 56.47 | +| curtain | 67.24 | 83.53 | +| chair | 48.96 | 61.47 | +| car | 80.87 | 93.2 | +| water | 53.83 | 72.71 | +| painting | 66.47 | 82.85 | +| sofa | 60.48 | 71.97 | +| shelf | 39.29 | 63.91 | +| house | 37.03 | 48.65 | +| sea | 48.32 | 74.14 | +| mirror | 57.09 | 73.28 | +| rug | 63.26 | 71.33 | +| field | 28.52 | 43.13 | +| armchair | 39.28 | 64.86 | +| seat | 58.69 | 75.98 | +| fence | 35.36 | 42.86 | +| desk | 36.08 | 58.73 | +| rock | 30.55 | 43.33 | +| wardrobe | 37.61 | 79.23 | +| lamp | 53.27 | 67.39 | +| bathtub | 73.65 | 86.37 | +| railing | 26.57 | 36.51 | +| cushion | 47.72 | 57.12 | +| base | 14.53 | 22.51 | +| box | 20.39 | 24.67 | +| column | 45.88 | 57.9 | +| signboard | 34.75 | 47.35 | +| chest of drawers | 35.0 | 68.86 | +| counter | 10.32 | 10.87 | +| sand | 31.91 | 50.19 | +| sink | 62.82 | 76.23 | +| skyscraper | 51.0 | 62.94 | +| fireplace | 52.92 | 76.33 | +| refrigerator | 72.41 | 82.89 | +| grandstand | 39.47 | 65.36 | +| path | 17.14 | 22.59 | +| stairs | 26.63 | 34.02 | +| runway | 68.78 | 80.52 | +| case | 8.16 | 8.39 | +| pool table | 88.07 | 95.39 | +| pillow | 46.27 | 56.56 | +| screen door | 9.68 | 10.68 | +| stairway | 33.34 | 40.85 | +| river | 14.75 | 19.74 | +| bridge | 49.83 | 79.14 | +| bookcase | 36.03 | 45.5 | +| blind | 16.37 | 17.76 | +| coffee table | 55.26 | 74.22 | +| toilet | 80.46 | 85.89 | +| flower | 26.22 | 44.45 | +| book | 45.07 | 63.32 | +| hill | 9.13 | 20.81 | +| bench | 35.35 | 39.61 | +| countertop | 48.65 | 63.72 | +| stove | 58.77 | 87.38 | +| palm | 42.08 | 61.41 | +| kitchen island | 30.84 | 93.35 | +| computer | 64.42 | 80.07 | +| swivel chair | 40.86 | 54.5 | +| boat | 62.39 | 87.82 | +| bar | 10.58 | 12.46 | +| arcade machine | 58.7 | 74.04 | +| hovel | 2.18 | 2.33 | +| bus | 71.94 | 95.34 | +| towel | 57.34 | 66.13 | +| light | 46.33 | 56.21 | +| truck | 34.06 | 43.11 | +| tower | 27.13 | 34.49 | +| chandelier | 57.01 | 83.37 | +| awning | 13.85 | 40.4 | +| streetlight | 21.99 | 30.44 | +| booth | 38.78 | 44.02 | +| television receiver | 55.61 | 76.01 | +| airplane | 55.55 | 63.19 | +| dirt track | 0.0 | 0.0 | +| apparel | 18.89 | 36.13 | +| pole | 17.95 | 25.16 | +| land | 2.56 | 3.11 | +| bannister | 9.38 | 14.53 | +| escalator | 22.85 | 24.9 | +| ottoman | 45.14 | 61.08 | +| bottle | 18.16 | 19.72 | +| buffet | 49.71 | 64.47 | +| poster | 21.87 | 32.24 | +| stage | 4.8 | 5.05 | +| van | 31.14 | 35.91 | +| ship | 77.93 | 81.1 | +| fountain | 7.04 | 7.15 | +| conveyer belt | 61.33 | 83.12 | +| canopy | 22.31 | 26.65 | +| washer | 55.37 | 61.44 | +| plaything | 18.15 | 24.28 | +| swimming pool | 40.65 | 44.25 | +| stool | 25.75 | 28.55 | +| barrel | 4.18 | 70.33 | +| basket | 21.14 | 27.57 | +| waterfall | 57.82 | 63.58 | +| tent | 32.45 | 97.52 | +| bag | 9.55 | 10.58 | +| minibike | 56.62 | 70.77 | +| cradle | 65.04 | 94.94 | +| oven | 31.21 | 44.4 | +| ball | 17.94 | 23.74 | +| food | 45.93 | 53.43 | +| step | 13.48 | 15.19 | +| tank | 28.91 | 30.32 | +| trade name | 25.89 | 36.29 | +| microwave | 71.06 | 86.61 | +| pot | 45.11 | 52.37 | +| animal | 55.95 | 58.65 | +| bicycle | 47.19 | 74.8 | +| lake | 58.69 | 61.35 | +| dishwasher | 47.27 | 67.75 | +| screen | 68.63 | 88.32 | +| blanket | 8.3 | 14.66 | +| sculpture | 51.62 | 67.4 | +| hood | 42.2 | 48.47 | +| sconce | 25.65 | 29.54 | +| vase | 36.18 | 52.16 | +| traffic light | 27.48 | 55.72 | +| tray | 2.67 | 3.01 | +| ashcan | 29.97 | 45.95 | +| fan | 48.93 | 66.31 | +| pier | 43.32 | 69.9 | +| crt screen | 4.52 | 9.5 | +| plate | 47.32 | 58.08 | +| monitor | 12.8 | 14.78 | +| bulletin board | 36.19 | 56.06 | +| shower | 0.33 | 0.33 | +| radiator | 32.53 | 40.96 | +| glass | 13.26 | 14.27 | +| clock | 18.31 | 23.8 | +| flag | 32.54 | 36.38 | ++---------------------+-------+-------+ +2023/10/29 17:03:04 - mmengine - INFO - Iter(val) [209/209] coco/bbox_mAP: 0.3750 coco/bbox_mAP_50: 0.5480 coco/bbox_mAP_75: 0.4080 coco/bbox_mAP_s: 0.2260 coco/bbox_mAP_m: 0.4260 coco/bbox_mAP_l: 0.4910 coco/segm_mAP: 0.2340 coco/segm_mAP_50: 0.4470 coco/segm_mAP_75: 0.2190 coco/segm_mAP_s: 0.1050 coco/segm_mAP_m: 0.2740 coco/segm_mAP_l: 0.3840 Bleu_1: 0.6978 Bleu_2: 0.5218 Bleu_3: 0.3812 Bleu_4: 0.2778 METEOR: 0.2364 ROUGE_L: 0.5125 CIDEr: 0.8606 SPICE: 0.1724 aAcc: 80.0900 mIoU: 41.2100 mAcc: 54.1600 visual-grounding/miou: 0.7077 visual-grounding/acc: 0.7902 data_time: 0.0879 time: 0.6088 +2023/10/29 17:12:10 - mmengine - INFO - Iter(train) [140500/640000] base_lr: 1.7737e-04 lr: 1.7943e-05 eta: 6 days, 10:58:54 time: 1.1296 data_time: 0.0346 memory: 21522 grad_norm: 2.5908 loss: 1.4730 caption_loss_cls: 2.4888 grounding_loss_reg: 3.2143 detection_loss_cls: 0.0447 detection_loss_reg: 0.3666 semantic_segmentation_loss_cls: 0.0120 instance_segmentation_loss_cls: 0.0465 instance_segmentation_loss_reg: 0.3690 instance_segmentation_loss_poly: 0.9840 +2023/10/29 17:21:24 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231028_202629 +2023/10/29 17:21:24 - mmengine - INFO - Iter(train) [141000/640000] base_lr: 1.7722e-04 lr: 1.7929e-05 eta: 6 days, 10:49:02 time: 1.1329 data_time: 0.0348 memory: 21522 grad_norm: 2.5719 loss: 1.4613 caption_loss_cls: 2.4832 grounding_loss_reg: 3.2110 detection_loss_cls: 0.0444 detection_loss_reg: 0.3646 semantic_segmentation_loss_cls: 0.0120 instance_segmentation_loss_cls: 0.0465 instance_segmentation_loss_reg: 0.3684 instance_segmentation_loss_poly: 0.9834 +2023/10/29 17:21:24 - mmengine - INFO - Saving checkpoint at 141000 iterations +2023/10/29 17:30:33 - mmengine - INFO - Iter(train) [141500/640000] base_lr: 1.7706e-04 lr: 1.7915e-05 eta: 6 days, 10:38:35 time: 1.1299 data_time: 0.0347 memory: 21522 grad_norm: 2.5696 loss: 1.4588 caption_loss_cls: 2.4839 grounding_loss_reg: 3.2062 detection_loss_cls: 0.0443 detection_loss_reg: 0.3647 semantic_segmentation_loss_cls: 0.0120 instance_segmentation_loss_cls: 0.0465 instance_segmentation_loss_reg: 0.3689 instance_segmentation_loss_poly: 0.9839 +2023/10/29 17:39:58 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231028_202629 +2023/10/29 17:39:58 - mmengine - INFO - Iter(train) [142000/640000] base_lr: 1.7691e-04 lr: 1.7901e-05 eta: 6 days, 10:29:59 time: 1.1268 data_time: 0.0347 memory: 21522 grad_norm: 2.5600 loss: 1.4490 caption_loss_cls: 2.4835 grounding_loss_reg: 3.2057 detection_loss_cls: 0.0441 detection_loss_reg: 0.3638 semantic_segmentation_loss_cls: 0.0120 instance_segmentation_loss_cls: 0.0465 instance_segmentation_loss_reg: 0.3694 instance_segmentation_loss_poly: 0.9847 +2023/10/29 17:39:58 - mmengine - INFO - Saving checkpoint at 142000 iterations +2023/10/29 17:49:24 - mmengine - INFO - Iter(train) [142500/640000] base_lr: 1.7675e-04 lr: 1.7887e-05 eta: 6 days, 10:21:39 time: 1.1217 data_time: 0.0323 memory: 21522 grad_norm: 2.5973 loss: 1.4654 caption_loss_cls: 2.4821 grounding_loss_reg: 3.2022 detection_loss_cls: 0.0442 detection_loss_reg: 0.3647 semantic_segmentation_loss_cls: 0.0120 instance_segmentation_loss_cls: 0.0463 instance_segmentation_loss_reg: 0.3681 instance_segmentation_loss_poly: 0.9813 +2023/10/29 17:58:53 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231028_202629 +2023/10/29 17:58:53 - mmengine - INFO - Iter(train) [143000/640000] base_lr: 1.7660e-04 lr: 1.7872e-05 eta: 6 days, 10:13:36 time: 1.1242 data_time: 0.0324 memory: 21522 grad_norm: 2.5712 loss: 1.4616 caption_loss_cls: 2.4843 grounding_loss_reg: 3.1990 detection_loss_cls: 0.0441 detection_loss_reg: 0.3644 semantic_segmentation_loss_cls: 0.0120 instance_segmentation_loss_cls: 0.0464 instance_segmentation_loss_reg: 0.3690 instance_segmentation_loss_poly: 0.9824 +2023/10/29 17:58:53 - mmengine - INFO - Saving checkpoint at 143000 iterations +2023/10/29 18:08:18 - mmengine - INFO - Iter(train) [143500/640000] base_lr: 1.7644e-04 lr: 1.7858e-05 eta: 6 days, 10:05:02 time: 1.1167 data_time: 0.0323 memory: 21522 grad_norm: 2.5924 loss: 1.4702 caption_loss_cls: 2.4783 grounding_loss_reg: 3.1962 detection_loss_cls: 0.0440 detection_loss_reg: 0.3633 semantic_segmentation_loss_cls: 0.0120 instance_segmentation_loss_cls: 0.0464 instance_segmentation_loss_reg: 0.3682 instance_segmentation_loss_poly: 0.9806 +2023/10/29 18:17:52 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231028_202629 +2023/10/29 18:17:52 - mmengine - INFO - Iter(train) [144000/640000] base_lr: 1.7628e-04 lr: 1.7844e-05 eta: 6 days, 9:57:26 time: 1.1219 data_time: 0.0328 memory: 21522 grad_norm: 2.5939 loss: 1.4857 caption_loss_cls: 2.4836 grounding_loss_reg: 3.1955 detection_loss_cls: 0.0440 detection_loss_reg: 0.3636 semantic_segmentation_loss_cls: 0.0119 instance_segmentation_loss_cls: 0.0465 instance_segmentation_loss_reg: 0.3690 instance_segmentation_loss_poly: 0.9824 +2023/10/29 18:17:52 - mmengine - INFO - Saving checkpoint at 144000 iterations +2023/10/29 18:26:52 - mmengine - INFO - Iter(train) [144500/640000] base_lr: 1.7612e-04 lr: 1.7829e-05 eta: 6 days, 9:45:56 time: 1.1202 data_time: 0.0355 memory: 21522 grad_norm: 2.6154 loss: 1.4928 caption_loss_cls: 2.4850 grounding_loss_reg: 3.1949 detection_loss_cls: 0.0440 detection_loss_reg: 0.3633 semantic_segmentation_loss_cls: 0.0119 instance_segmentation_loss_cls: 0.0466 instance_segmentation_loss_reg: 0.3703 instance_segmentation_loss_poly: 0.9849 +2023/10/29 18:37:20 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231028_202629 +2023/10/29 18:37:20 - mmengine - INFO - Iter(train) [145000/640000] base_lr: 1.7596e-04 lr: 1.7815e-05 eta: 6 days, 9:44:41 time: 1.1387 data_time: 0.0380 memory: 21522 grad_norm: 2.6451 loss: 1.5032 caption_loss_cls: 2.4836 grounding_loss_reg: 3.1960 detection_loss_cls: 0.0439 detection_loss_reg: 0.3634 semantic_segmentation_loss_cls: 0.0119 instance_segmentation_loss_cls: 0.0466 instance_segmentation_loss_reg: 0.3702 instance_segmentation_loss_poly: 0.9851 +2023/10/29 18:37:20 - mmengine - INFO - Saving checkpoint at 145000 iterations +2023/10/29 18:46:33 - mmengine - INFO - Iter(train) [145500/640000] base_lr: 1.7581e-04 lr: 1.7800e-05 eta: 6 days, 9:34:37 time: 1.1395 data_time: 0.0381 memory: 21522 grad_norm: 2.6301 loss: 1.5003 caption_loss_cls: 2.4850 grounding_loss_reg: 3.1949 detection_loss_cls: 0.0441 detection_loss_reg: 0.3647 semantic_segmentation_loss_cls: 0.0119 instance_segmentation_loss_cls: 0.0466 instance_segmentation_loss_reg: 0.3708 instance_segmentation_loss_poly: 0.9863 +2023/10/29 18:55:29 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231028_202629 +2023/10/29 18:55:29 - mmengine - INFO - Iter(train) [146000/640000] base_lr: 1.7565e-04 lr: 1.7786e-05 eta: 6 days, 9:22:43 time: 1.1326 data_time: 0.0379 memory: 21522 grad_norm: 2.6456 loss: 1.5013 caption_loss_cls: 2.4828 grounding_loss_reg: 3.1926 detection_loss_cls: 0.0441 detection_loss_reg: 0.3650 semantic_segmentation_loss_cls: 0.0119 instance_segmentation_loss_cls: 0.0467 instance_segmentation_loss_reg: 0.3708 instance_segmentation_loss_poly: 0.9855 +2023/10/29 18:55:29 - mmengine - INFO - Saving checkpoint at 146000 iterations +2023/10/29 19:05:28 - mmengine - INFO - Iter(train) [146500/640000] base_lr: 1.7549e-04 lr: 1.7771e-05 eta: 6 days, 9:17:54 time: 1.1406 data_time: 0.0398 memory: 21522 grad_norm: 2.6300 loss: 1.5019 caption_loss_cls: 2.4810 grounding_loss_reg: 3.1922 detection_loss_cls: 0.0441 detection_loss_reg: 0.3647 semantic_segmentation_loss_cls: 0.0119 instance_segmentation_loss_cls: 0.0468 instance_segmentation_loss_reg: 0.3724 instance_segmentation_loss_poly: 0.9886 +2023/10/29 19:14:52 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231028_202629 +2023/10/29 19:14:52 - mmengine - INFO - Iter(train) [147000/640000] base_lr: 1.7533e-04 lr: 1.7757e-05 eta: 6 days, 9:09:09 time: 1.1394 data_time: 0.0396 memory: 21522 grad_norm: 2.6395 loss: 1.5007 caption_loss_cls: 2.4797 grounding_loss_reg: 3.1922 detection_loss_cls: 0.0443 detection_loss_reg: 0.3656 semantic_segmentation_loss_cls: 0.0119 instance_segmentation_loss_cls: 0.0468 instance_segmentation_loss_reg: 0.3724 instance_segmentation_loss_poly: 0.9888 +2023/10/29 19:14:52 - mmengine - INFO - Saving checkpoint at 147000 iterations +2023/10/29 19:39:31 - mmengine - INFO - Iter(train) [147500/640000] base_lr: 1.7516e-04 lr: 1.7742e-05 eta: 6 days, 13:58:58 time: 1.1425 data_time: 0.0360 memory: 21513 grad_norm: 2.6290 loss: 1.4944 caption_loss_cls: 2.4767 grounding_loss_reg: 3.1898 detection_loss_cls: 0.0441 detection_loss_reg: 0.3648 semantic_segmentation_loss_cls: 0.0119 instance_segmentation_loss_cls: 0.0467 instance_segmentation_loss_reg: 0.3715 instance_segmentation_loss_poly: 0.9871 +2023/10/29 19:48:45 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231029_192652 +2023/10/29 19:48:45 - mmengine - INFO - Iter(train) [148000/640000] base_lr: 1.7500e-04 lr: 1.7728e-05 eta: 6 days, 10:41:23 time: 1.1379 data_time: 0.0354 memory: 21513 grad_norm: 2.6566 loss: 1.4829 caption_loss_cls: 2.4754 grounding_loss_reg: 3.1887 detection_loss_cls: 0.0439 detection_loss_reg: 0.3643 semantic_segmentation_loss_cls: 0.0118 instance_segmentation_loss_cls: 0.0467 instance_segmentation_loss_reg: 0.3714 instance_segmentation_loss_poly: 0.9866 +2023/10/29 19:48:45 - mmengine - INFO - Saving checkpoint at 148000 iterations +2023/10/29 19:58:12 - mmengine - INFO - Iter(train) [148500/640000] base_lr: 1.7484e-04 lr: 1.7713e-05 eta: 6 days, 10:36:45 time: 1.1446 data_time: 0.0352 memory: 21513 grad_norm: 2.6418 loss: 1.4703 caption_loss_cls: 2.4747 grounding_loss_reg: 3.1877 detection_loss_cls: 0.0439 detection_loss_reg: 0.3638 semantic_segmentation_loss_cls: 0.0118 instance_segmentation_loss_cls: 0.0466 instance_segmentation_loss_reg: 0.3710 instance_segmentation_loss_poly: 0.9862 +2023/10/29 20:07:47 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231029_192652 +2023/10/29 20:07:47 - mmengine - INFO - Iter(train) [149000/640000] base_lr: 1.7468e-04 lr: 1.7698e-05 eta: 6 days, 11:03:23 time: 1.1314 data_time: 0.0331 memory: 21513 grad_norm: 2.6408 loss: 1.4593 caption_loss_cls: 2.4696 grounding_loss_reg: 3.1857 detection_loss_cls: 0.0438 detection_loss_reg: 0.3638 semantic_segmentation_loss_cls: 0.0118 instance_segmentation_loss_cls: 0.0465 instance_segmentation_loss_reg: 0.3705 instance_segmentation_loss_poly: 0.9854 +2023/10/29 20:07:47 - mmengine - INFO - Saving checkpoint at 149000 iterations +2023/10/29 20:17:19 - mmengine - INFO - Iter(train) [149500/640000] base_lr: 1.7452e-04 lr: 1.7683e-05 eta: 6 days, 11:04:59 time: 1.1362 data_time: 0.0329 memory: 21513 grad_norm: 2.6236 loss: 1.4533 caption_loss_cls: 2.4663 grounding_loss_reg: 3.1802 detection_loss_cls: 0.0440 detection_loss_reg: 0.3641 semantic_segmentation_loss_cls: 0.0118 instance_segmentation_loss_cls: 0.0463 instance_segmentation_loss_reg: 0.3700 instance_segmentation_loss_poly: 0.9850 +2023/10/29 20:26:45 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231029_192652 +2023/10/29 20:26:45 - mmengine - INFO - Iter(train) [150000/640000] base_lr: 1.7435e-04 lr: 1.7669e-05 eta: 6 days, 10:46:04 time: 1.1435 data_time: 0.0326 memory: 21513 grad_norm: 2.6232 loss: 1.4483 caption_loss_cls: 2.4641 grounding_loss_reg: 3.1749 detection_loss_cls: 0.0439 detection_loss_reg: 0.3636 semantic_segmentation_loss_cls: 0.0118 instance_segmentation_loss_cls: 0.0461 instance_segmentation_loss_reg: 0.3694 instance_segmentation_loss_poly: 0.9850 +2023/10/29 20:26:45 - mmengine - INFO - Saving checkpoint at 150000 iterations +2023/10/29 20:36:33 - mmengine - INFO - Iter(train) [150500/640000] base_lr: 1.7419e-04 lr: 1.7654e-05 eta: 6 days, 11:22:38 time: 1.1409 data_time: 0.0305 memory: 21513 grad_norm: 2.5994 loss: 1.4276 caption_loss_cls: 2.4639 grounding_loss_reg: 3.1739 detection_loss_cls: 0.0440 detection_loss_reg: 0.3642 semantic_segmentation_loss_cls: 0.0118 instance_segmentation_loss_cls: 0.0460 instance_segmentation_loss_reg: 0.3693 instance_segmentation_loss_poly: 0.9852 +2023/10/29 20:45:57 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231029_192652 +2023/10/29 20:45:57 - mmengine - INFO - Iter(train) [151000/640000] base_lr: 1.7403e-04 lr: 1.7639e-05 eta: 6 days, 10:56:04 time: 1.1406 data_time: 0.0304 memory: 21513 grad_norm: 2.6310 loss: 1.4280 caption_loss_cls: 2.4586 grounding_loss_reg: 3.1685 detection_loss_cls: 0.0440 detection_loss_reg: 0.3641 semantic_segmentation_loss_cls: 0.0118 instance_segmentation_loss_cls: 0.0459 instance_segmentation_loss_reg: 0.3683 instance_segmentation_loss_poly: 0.9835 +2023/10/29 20:45:57 - mmengine - INFO - Saving checkpoint at 151000 iterations +2023/10/29 20:55:36 - mmengine - INFO - Iter(train) [151500/640000] base_lr: 1.7386e-04 lr: 1.7624e-05 eta: 6 days, 11:03:25 time: 1.1412 data_time: 0.0338 memory: 21513 grad_norm: 2.6434 loss: 1.4376 caption_loss_cls: 2.4593 grounding_loss_reg: 3.1664 detection_loss_cls: 0.0440 detection_loss_reg: 0.3640 semantic_segmentation_loss_cls: 0.0118 instance_segmentation_loss_cls: 0.0458 instance_segmentation_loss_reg: 0.3686 instance_segmentation_loss_poly: 0.9830 +2023/10/29 21:03:51 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231029_192652 +2023/10/29 21:03:51 - mmengine - INFO - Iter(train) [152000/640000] base_lr: 1.7370e-04 lr: 1.7609e-05 eta: 6 days, 8:48:26 time: 1.1261 data_time: 0.0336 memory: 21513 grad_norm: 2.6835 loss: 1.4617 caption_loss_cls: 2.4567 grounding_loss_reg: 3.1636 detection_loss_cls: 0.0439 detection_loss_reg: 0.3637 semantic_segmentation_loss_cls: 0.0118 instance_segmentation_loss_cls: 0.0457 instance_segmentation_loss_reg: 0.3682 instance_segmentation_loss_poly: 0.9830 +2023/10/29 21:03:51 - mmengine - INFO - Saving checkpoint at 152000 iterations +2023/10/29 21:13:32 - mmengine - INFO - Iter(train) [152500/640000] base_lr: 1.7353e-04 lr: 1.7594e-05 eta: 6 days, 9:04:56 time: 1.1297 data_time: 0.0336 memory: 21513 grad_norm: 2.6924 loss: 1.4657 caption_loss_cls: 2.4563 grounding_loss_reg: 3.1607 detection_loss_cls: 0.0439 detection_loss_reg: 0.3638 semantic_segmentation_loss_cls: 0.0118 instance_segmentation_loss_cls: 0.0457 instance_segmentation_loss_reg: 0.3681 instance_segmentation_loss_poly: 0.9833 +2023/10/29 21:23:08 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231029_192652 +2023/10/29 21:23:08 - mmengine - INFO - Iter(train) [153000/640000] base_lr: 1.7337e-04 lr: 1.7579e-05 eta: 6 days, 9:10:19 time: 1.1300 data_time: 0.0330 memory: 21513 grad_norm: 2.6527 loss: 1.4533 caption_loss_cls: 2.4529 grounding_loss_reg: 3.1592 detection_loss_cls: 0.0439 detection_loss_reg: 0.3643 semantic_segmentation_loss_cls: 0.0118 instance_segmentation_loss_cls: 0.0458 instance_segmentation_loss_reg: 0.3689 instance_segmentation_loss_poly: 0.9842 +2023/10/29 21:23:08 - mmengine - INFO - Saving checkpoint at 153000 iterations +2023/10/29 21:32:54 - mmengine - INFO - Iter(train) [153500/640000] base_lr: 1.7320e-04 lr: 1.7564e-05 eta: 6 days, 9:25:15 time: 1.1334 data_time: 0.0331 memory: 21513 grad_norm: 2.6901 loss: 1.4621 caption_loss_cls: 2.4498 grounding_loss_reg: 3.1564 detection_loss_cls: 0.0438 detection_loss_reg: 0.3644 semantic_segmentation_loss_cls: 0.0117 instance_segmentation_loss_cls: 0.0457 instance_segmentation_loss_reg: 0.3687 instance_segmentation_loss_poly: 0.9837 +2023/10/29 21:42:23 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231029_192652 +2023/10/29 21:42:23 - mmengine - INFO - Iter(train) [154000/640000] base_lr: 1.7304e-04 lr: 1.7549e-05 eta: 6 days, 9:17:29 time: 1.1343 data_time: 0.0342 memory: 21513 grad_norm: 2.6899 loss: 1.4677 caption_loss_cls: 2.4467 grounding_loss_reg: 3.1527 detection_loss_cls: 0.0438 detection_loss_reg: 0.3647 semantic_segmentation_loss_cls: 0.0117 instance_segmentation_loss_cls: 0.0456 instance_segmentation_loss_reg: 0.3681 instance_segmentation_loss_poly: 0.9823 +2023/10/29 21:42:23 - mmengine - INFO - Saving checkpoint at 154000 iterations +2023/10/29 21:51:00 - mmengine - INFO - Iter(train) [154500/640000] base_lr: 1.7287e-04 lr: 1.7533e-05 eta: 6 days, 8:12:22 time: 1.1163 data_time: 0.0337 memory: 21513 grad_norm: 2.7595 loss: 1.4883 caption_loss_cls: 2.4447 grounding_loss_reg: 3.1505 detection_loss_cls: 0.0439 detection_loss_reg: 0.3649 semantic_segmentation_loss_cls: 0.0117 instance_segmentation_loss_cls: 0.0454 instance_segmentation_loss_reg: 0.3671 instance_segmentation_loss_poly: 0.9804 +2023/10/29 21:59:45 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231029_192652 +2023/10/29 21:59:45 - mmengine - INFO - Iter(train) [155000/640000] base_lr: 1.7270e-04 lr: 1.7518e-05 eta: 6 days, 7:23:20 time: 1.1068 data_time: 0.0335 memory: 21513 grad_norm: 2.7822 loss: 1.5058 caption_loss_cls: 2.4447 grounding_loss_reg: 3.1515 detection_loss_cls: 0.0438 detection_loss_reg: 0.3648 semantic_segmentation_loss_cls: 0.0117 instance_segmentation_loss_cls: 0.0453 instance_segmentation_loss_reg: 0.3665 instance_segmentation_loss_poly: 0.9799 +2023/10/29 21:59:45 - mmengine - INFO - Saving checkpoint at 155000 iterations +2023/10/29 22:08:40 - mmengine - INFO - Iter(train) [155500/640000] base_lr: 1.7253e-04 lr: 1.7503e-05 eta: 6 days, 6:48:49 time: 1.0957 data_time: 0.0332 memory: 21513 grad_norm: 2.8143 loss: 1.5117 caption_loss_cls: 2.4413 grounding_loss_reg: 3.1472 detection_loss_cls: 0.0439 detection_loss_reg: 0.3648 semantic_segmentation_loss_cls: 0.0117 instance_segmentation_loss_cls: 0.0450 instance_segmentation_loss_reg: 0.3653 instance_segmentation_loss_poly: 0.9781 +2023/10/29 22:17:58 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231029_192652 +2023/10/29 22:17:58 - mmengine - INFO - Iter(train) [156000/640000] base_lr: 1.7236e-04 lr: 1.7488e-05 eta: 6 days, 6:37:03 time: 1.1116 data_time: 0.0337 memory: 21513 grad_norm: 2.7660 loss: 1.4945 caption_loss_cls: 2.4418 grounding_loss_reg: 3.1437 detection_loss_cls: 0.0438 detection_loss_reg: 0.3642 semantic_segmentation_loss_cls: 0.0117 instance_segmentation_loss_cls: 0.0449 instance_segmentation_loss_reg: 0.3653 instance_segmentation_loss_poly: 0.9783 +2023/10/29 22:17:58 - mmengine - INFO - Saving checkpoint at 156000 iterations +2023/10/29 22:27:13 - mmengine - INFO - Iter(train) [156500/640000] base_lr: 1.7220e-04 lr: 1.7472e-05 eta: 6 days, 6:22:44 time: 1.1049 data_time: 0.0337 memory: 21513 grad_norm: 2.7738 loss: 1.4970 caption_loss_cls: 2.4408 grounding_loss_reg: 3.1450 detection_loss_cls: 0.0437 detection_loss_reg: 0.3631 semantic_segmentation_loss_cls: 0.0117 instance_segmentation_loss_cls: 0.0448 instance_segmentation_loss_reg: 0.3654 instance_segmentation_loss_poly: 0.9795 +2023/10/29 22:36:12 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231029_192652 +2023/10/29 22:36:12 - mmengine - INFO - Iter(train) [157000/640000] base_lr: 1.7203e-04 lr: 1.7457e-05 eta: 6 days, 5:56:49 time: 1.0956 data_time: 0.0337 memory: 21513 grad_norm: 2.8417 loss: 1.5224 caption_loss_cls: 2.4356 grounding_loss_reg: 3.1397 detection_loss_cls: 0.0437 detection_loss_reg: 0.3633 semantic_segmentation_loss_cls: 0.0116 instance_segmentation_loss_cls: 0.0448 instance_segmentation_loss_reg: 0.3661 instance_segmentation_loss_poly: 0.9801 +2023/10/29 22:36:12 - mmengine - INFO - Saving checkpoint at 157000 iterations +2023/10/29 22:45:42 - mmengine - INFO - Iter(train) [157500/640000] base_lr: 1.7186e-04 lr: 1.7442e-05 eta: 6 days, 5:55:45 time: 1.0916 data_time: 0.0336 memory: 21513 grad_norm: 2.8524 loss: 1.5301 caption_loss_cls: 2.4344 grounding_loss_reg: 3.1363 detection_loss_cls: 0.0437 detection_loss_reg: 0.3644 semantic_segmentation_loss_cls: 0.0116 instance_segmentation_loss_cls: 0.0449 instance_segmentation_loss_reg: 0.3681 instance_segmentation_loss_poly: 0.9835 +2023/10/29 22:54:29 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231029_192652 +2023/10/29 22:54:29 - mmengine - INFO - Iter(train) [158000/640000] base_lr: 1.7169e-04 lr: 1.7426e-05 eta: 6 days, 5:23:12 time: 1.0812 data_time: 0.0324 memory: 21513 grad_norm: 2.8773 loss: 1.5402 caption_loss_cls: 2.4320 grounding_loss_reg: 3.1359 detection_loss_cls: 0.0438 detection_loss_reg: 0.3654 semantic_segmentation_loss_cls: 0.0116 instance_segmentation_loss_cls: 0.0448 instance_segmentation_loss_reg: 0.3683 instance_segmentation_loss_poly: 0.9840 +2023/10/29 22:54:29 - mmengine - INFO - Saving checkpoint at 158000 iterations +2023/10/29 23:03:42 - mmengine - INFO - Iter(train) [158500/640000] base_lr: 1.7152e-04 lr: 1.7411e-05 eta: 6 days, 5:09:51 time: 1.0902 data_time: 0.0327 memory: 21513 grad_norm: 2.8660 loss: 1.5384 caption_loss_cls: 2.4272 grounding_loss_reg: 3.1304 detection_loss_cls: 0.0439 detection_loss_reg: 0.3666 semantic_segmentation_loss_cls: 0.0116 instance_segmentation_loss_cls: 0.0448 instance_segmentation_loss_reg: 0.3683 instance_segmentation_loss_poly: 0.9848 +2023/10/29 23:12:52 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231029_192652 +2023/10/29 23:12:52 - mmengine - INFO - Iter(train) [159000/640000] base_lr: 1.7135e-04 lr: 1.7395e-05 eta: 6 days, 4:55:19 time: 1.0964 data_time: 0.0327 memory: 21513 grad_norm: 2.8196 loss: 1.5162 caption_loss_cls: 2.4260 grounding_loss_reg: 3.1299 detection_loss_cls: 0.0440 detection_loss_reg: 0.3677 semantic_segmentation_loss_cls: 0.0116 instance_segmentation_loss_cls: 0.0447 instance_segmentation_loss_reg: 0.3687 instance_segmentation_loss_poly: 0.9859 +2023/10/29 23:12:52 - mmengine - INFO - Saving checkpoint at 159000 iterations +2023/10/29 23:22:34 - mmengine - INFO - Iter(train) [159500/640000] base_lr: 1.7118e-04 lr: 1.7380e-05 eta: 6 days, 5:02:23 time: 1.1082 data_time: 0.0329 memory: 21513 grad_norm: 2.7894 loss: 1.5038 caption_loss_cls: 2.4243 grounding_loss_reg: 3.1325 detection_loss_cls: 0.0439 detection_loss_reg: 0.3678 semantic_segmentation_loss_cls: 0.0116 instance_segmentation_loss_cls: 0.0446 instance_segmentation_loss_reg: 0.3686 instance_segmentation_loss_poly: 0.9865 +2023/10/29 23:31:49 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231029_192652 +2023/10/29 23:31:49 - mmengine - INFO - Iter(train) [160000/640000] base_lr: 1.7100e-04 lr: 1.7364e-05 eta: 6 days, 4:50:44 time: 1.1074 data_time: 0.0328 memory: 21513 grad_norm: 2.7873 loss: 1.4976 caption_loss_cls: 2.4208 grounding_loss_reg: 3.1298 detection_loss_cls: 0.0437 detection_loss_reg: 0.3664 semantic_segmentation_loss_cls: 0.0116 instance_segmentation_loss_cls: 0.0448 instance_segmentation_loss_reg: 0.3696 instance_segmentation_loss_poly: 0.9893 +2023/10/29 23:31:49 - mmengine - INFO - Saving checkpoint at 160000 iterations +2023/10/29 23:40:21 - mmengine - INFO - Evaluating bbox... +2023/10/29 23:41:16 - mmengine - INFO - bbox_mAP_copypaste: 0.377 0.546 0.410 0.220 0.432 0.489 +2023/10/29 23:41:16 - mmengine - INFO - Evaluating segm... +2023/10/29 23:42:27 - mmengine - INFO - segm_mAP_copypaste: 0.236 0.446 0.228 0.107 0.280 0.374 +2023/10/29 23:47:54 - mmengine - INFO - per class results: +2023/10/29 23:47:54 - mmengine - INFO - ++---------------------+-------+-------+ +| Class | IoU | Acc | ++---------------------+-------+-------+ +| wall | 73.67 | 86.33 | +| building | 79.44 | 90.77 | +| sky | 92.4 | 95.94 | +| floor | 77.67 | 88.68 | +| tree | 71.32 | 87.48 | +| ceiling | 79.99 | 93.21 | +| road | 81.7 | 88.8 | +| bed | 85.7 | 94.79 | +| windowpane | 56.42 | 79.03 | +| grass | 66.62 | 81.36 | +| cabinet | 52.8 | 67.01 | +| sidewalk | 61.67 | 75.28 | +| person | 75.78 | 87.45 | +| earth | 33.92 | 42.99 | +| door | 41.05 | 51.55 | +| table | 55.02 | 73.72 | +| mountain | 60.48 | 79.23 | +| plant | 49.45 | 64.16 | +| curtain | 68.35 | 79.64 | +| chair | 49.1 | 62.59 | +| car | 78.27 | 84.33 | +| water | 43.2 | 54.1 | +| painting | 66.15 | 85.07 | +| sofa | 57.43 | 71.24 | +| shelf | 37.38 | 66.25 | +| house | 35.2 | 46.95 | +| sea | 50.33 | 89.08 | +| mirror | 61.22 | 74.24 | +| rug | 49.48 | 53.54 | +| field | 32.91 | 44.28 | +| armchair | 39.29 | 63.62 | +| seat | 50.92 | 61.36 | +| fence | 32.68 | 43.44 | +| desk | 40.71 | 55.74 | +| rock | 43.82 | 63.08 | +| wardrobe | 45.22 | 52.89 | +| lamp | 50.44 | 64.04 | +| bathtub | 65.09 | 79.54 | +| railing | 23.45 | 33.8 | +| cushion | 47.02 | 60.19 | +| base | 17.43 | 23.78 | +| box | 17.43 | 19.85 | +| column | 44.44 | 61.4 | +| signboard | 26.04 | 32.42 | +| chest of drawers | 27.79 | 74.16 | +| counter | 22.29 | 27.58 | +| sand | 41.06 | 53.0 | +| sink | 61.84 | 66.97 | +| skyscraper | 61.48 | 78.69 | +| fireplace | 61.53 | 85.25 | +| refrigerator | 62.01 | 67.81 | +| grandstand | 35.6 | 74.5 | +| path | 21.18 | 24.88 | +| stairs | 25.34 | 33.29 | +| runway | 74.94 | 93.42 | +| case | 42.84 | 52.05 | +| pool table | 88.59 | 95.88 | +| pillow | 43.32 | 52.17 | +| screen door | 31.08 | 31.97 | +| stairway | 25.72 | 35.89 | +| river | 17.39 | 26.11 | +| bridge | 65.3 | 73.88 | +| bookcase | 28.96 | 69.93 | +| blind | 37.59 | 51.71 | +| coffee table | 50.68 | 79.7 | +| toilet | 80.65 | 86.21 | +| flower | 28.19 | 36.93 | +| book | 40.64 | 53.49 | +| hill | 8.2 | 21.07 | +| bench | 41.1 | 48.43 | +| countertop | 47.51 | 72.89 | +| stove | 54.52 | 61.07 | +| palm | 40.42 | 56.26 | +| kitchen island | 35.8 | 53.22 | +| computer | 58.75 | 66.55 | +| swivel chair | 41.26 | 60.34 | +| boat | 58.75 | 67.8 | +| bar | 39.87 | 67.46 | +| arcade machine | 45.49 | 48.8 | +| hovel | 17.14 | 36.67 | +| bus | 67.61 | 95.27 | +| towel | 49.03 | 52.67 | +| light | 39.57 | 44.88 | +| truck | 28.88 | 41.8 | +| tower | 33.73 | 58.43 | +| chandelier | 57.39 | 74.59 | +| awning | 25.56 | 28.69 | +| streetlight | 20.02 | 25.15 | +| booth | 34.14 | 34.46 | +| television receiver | 48.02 | 81.86 | +| airplane | 54.57 | 58.67 | +| dirt track | 4.07 | 7.78 | +| apparel | 28.37 | 49.19 | +| pole | 9.02 | 9.92 | +| land | 1.67 | 2.5 | +| bannister | 10.0 | 12.85 | +| escalator | 24.31 | 34.47 | +| ottoman | 43.61 | 60.11 | +| bottle | 20.16 | 26.27 | +| buffet | 36.64 | 47.42 | +| poster | 12.21 | 19.02 | +| stage | 8.73 | 18.83 | +| van | 34.59 | 57.2 | +| ship | 82.78 | 92.5 | +| fountain | 11.46 | 11.85 | +| conveyer belt | 55.32 | 66.9 | +| canopy | 21.96 | 27.93 | +| washer | 60.19 | 62.13 | +| plaything | 23.05 | 27.96 | +| swimming pool | 61.08 | 73.72 | +| stool | 30.42 | 37.25 | +| barrel | 26.97 | 60.56 | +| basket | 15.76 | 20.61 | +| waterfall | 57.61 | 81.98 | +| tent | 84.6 | 96.9 | +| bag | 11.03 | 12.12 | +| minibike | 68.83 | 78.19 | +| cradle | 61.77 | 97.08 | +| oven | 25.38 | 64.11 | +| ball | 14.34 | 15.5 | +| food | 34.86 | 37.86 | +| step | 4.82 | 6.78 | +| tank | 36.25 | 38.85 | +| trade name | 18.5 | 20.43 | +| microwave | 52.19 | 60.57 | +| pot | 38.43 | 43.77 | +| animal | 62.21 | 66.74 | +| bicycle | 54.21 | 68.38 | +| lake | 41.67 | 58.35 | +| dishwasher | 38.53 | 47.6 | +| screen | 50.77 | 90.2 | +| blanket | 1.78 | 1.86 | +| sculpture | 44.65 | 55.53 | +| hood | 46.01 | 56.02 | +| sconce | 35.55 | 57.19 | +| vase | 28.65 | 34.77 | +| traffic light | 26.21 | 47.67 | +| tray | 2.34 | 2.9 | +| ashcan | 30.53 | 37.28 | +| fan | 38.31 | 45.64 | +| pier | 41.86 | 75.07 | +| crt screen | 10.39 | 15.22 | +| plate | 49.95 | 62.91 | +| monitor | 33.59 | 53.86 | +| bulletin board | 17.24 | 19.24 | +| shower | 0.08 | 0.33 | +| radiator | 38.57 | 43.44 | +| glass | 12.85 | 13.81 | +| clock | 16.11 | 17.63 | +| flag | 22.88 | 24.92 | ++---------------------+-------+-------+ +2023/10/29 23:48:11 - mmengine - INFO - Iter(val) [209/209] coco/bbox_mAP: 0.3770 coco/bbox_mAP_50: 0.5460 coco/bbox_mAP_75: 0.4100 coco/bbox_mAP_s: 0.2200 coco/bbox_mAP_m: 0.4320 coco/bbox_mAP_l: 0.4890 coco/segm_mAP: 0.2360 coco/segm_mAP_50: 0.4460 coco/segm_mAP_75: 0.2280 coco/segm_mAP_s: 0.1070 coco/segm_mAP_m: 0.2800 coco/segm_mAP_l: 0.3740 Bleu_1: 0.6790 Bleu_2: 0.5000 Bleu_3: 0.3617 Bleu_4: 0.2608 METEOR: 0.2302 ROUGE_L: 0.4980 CIDEr: 0.8235 SPICE: 0.1658 aAcc: 80.0200 mIoU: 41.7800 mAcc: 54.1000 visual-grounding/miou: 0.7136 visual-grounding/acc: 0.7920 data_time: 0.0094 time: 0.5323 +2023/10/29 23:57:36 - mmengine - INFO - Iter(train) [160500/640000] base_lr: 1.7083e-04 lr: 1.7348e-05 eta: 6 days, 4:46:34 time: 1.1106 data_time: 0.0300 memory: 21513 grad_norm: 2.7675 loss: 1.4963 caption_loss_cls: 2.4204 grounding_loss_reg: 3.1287 detection_loss_cls: 0.0436 detection_loss_reg: 0.3661 semantic_segmentation_loss_cls: 0.0116 instance_segmentation_loss_cls: 0.0447 instance_segmentation_loss_reg: 0.3688 instance_segmentation_loss_poly: 0.9869 +2023/10/30 00:06:56 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231029_192652 +2023/10/30 00:06:56 - mmengine - INFO - Iter(train) [161000/640000] base_lr: 1.7066e-04 lr: 1.7333e-05 eta: 6 days, 4:38:13 time: 1.1158 data_time: 0.0301 memory: 21513 grad_norm: 2.7385 loss: 1.4853 caption_loss_cls: 2.4216 grounding_loss_reg: 3.1302 detection_loss_cls: 0.0437 detection_loss_reg: 0.3669 semantic_segmentation_loss_cls: 0.0116 instance_segmentation_loss_cls: 0.0447 instance_segmentation_loss_reg: 0.3689 instance_segmentation_loss_poly: 0.9875 +2023/10/30 00:06:56 - mmengine - INFO - Saving checkpoint at 161000 iterations +2023/10/30 00:16:32 - mmengine - INFO - Iter(train) [161500/640000] base_lr: 1.7049e-04 lr: 1.7317e-05 eta: 6 days, 4:38:10 time: 1.1173 data_time: 0.0302 memory: 21513 grad_norm: 2.6982 loss: 1.4582 caption_loss_cls: 2.4179 grounding_loss_reg: 3.1287 detection_loss_cls: 0.0437 detection_loss_reg: 0.3675 semantic_segmentation_loss_cls: 0.0116 instance_segmentation_loss_cls: 0.0447 instance_segmentation_loss_reg: 0.3684 instance_segmentation_loss_poly: 0.9872 +2023/10/30 00:25:37 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231029_192652 +2023/10/30 00:25:37 - mmengine - INFO - Iter(train) [162000/640000] base_lr: 1.7031e-04 lr: 1.7301e-05 eta: 6 days, 4:21:04 time: 1.1215 data_time: 0.0308 memory: 21513 grad_norm: 2.6877 loss: 1.4592 caption_loss_cls: 2.4170 grounding_loss_reg: 3.1287 detection_loss_cls: 0.0436 detection_loss_reg: 0.3667 semantic_segmentation_loss_cls: 0.0116 instance_segmentation_loss_cls: 0.0447 instance_segmentation_loss_reg: 0.3688 instance_segmentation_loss_poly: 0.9875 +2023/10/30 00:25:37 - mmengine - INFO - Saving checkpoint at 162000 iterations +2023/10/30 00:34:59 - mmengine - INFO - Iter(train) [162500/640000] base_lr: 1.7014e-04 lr: 1.7285e-05 eta: 6 days, 4:13:43 time: 1.1241 data_time: 0.0312 memory: 21513 grad_norm: 2.6833 loss: 1.4613 caption_loss_cls: 2.4118 grounding_loss_reg: 3.1280 detection_loss_cls: 0.0436 detection_loss_reg: 0.3671 semantic_segmentation_loss_cls: 0.0116 instance_segmentation_loss_cls: 0.0447 instance_segmentation_loss_reg: 0.3684 instance_segmentation_loss_poly: 0.9865 +2023/10/30 00:44:19 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231029_192652 +2023/10/30 00:44:19 - mmengine - INFO - Iter(train) [163000/640000] base_lr: 1.6997e-04 lr: 1.7270e-05 eta: 6 days, 4:05:02 time: 1.1267 data_time: 0.0314 memory: 21513 grad_norm: 2.6999 loss: 1.4635 caption_loss_cls: 2.4096 grounding_loss_reg: 3.1285 detection_loss_cls: 0.0436 detection_loss_reg: 0.3672 semantic_segmentation_loss_cls: 0.0117 instance_segmentation_loss_cls: 0.0444 instance_segmentation_loss_reg: 0.3671 instance_segmentation_loss_poly: 0.9834 +2023/10/30 00:44:19 - mmengine - INFO - Saving checkpoint at 163000 iterations +2023/10/30 00:53:19 - mmengine - INFO - Iter(train) [163500/640000] base_lr: 1.6979e-04 lr: 1.7254e-05 eta: 6 days, 3:46:16 time: 1.1158 data_time: 0.0315 memory: 21513 grad_norm: 2.7359 loss: 1.4796 caption_loss_cls: 2.4121 grounding_loss_reg: 3.1272 detection_loss_cls: 0.0435 detection_loss_reg: 0.3672 semantic_segmentation_loss_cls: 0.0117 instance_segmentation_loss_cls: 0.0444 instance_segmentation_loss_reg: 0.3675 instance_segmentation_loss_poly: 0.9832 +2023/10/30 01:02:06 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231029_192652 +2023/10/30 01:02:06 - mmengine - INFO - Iter(train) [164000/640000] base_lr: 1.6962e-04 lr: 1.7238e-05 eta: 6 days, 3:22:25 time: 1.1089 data_time: 0.0314 memory: 21513 grad_norm: 2.7394 loss: 1.4818 caption_loss_cls: 2.4105 grounding_loss_reg: 3.1219 detection_loss_cls: 0.0434 detection_loss_reg: 0.3665 semantic_segmentation_loss_cls: 0.0117 instance_segmentation_loss_cls: 0.0445 instance_segmentation_loss_reg: 0.3683 instance_segmentation_loss_poly: 0.9854 +2023/10/30 01:02:06 - mmengine - INFO - Saving checkpoint at 164000 iterations +2023/10/30 01:11:24 - mmengine - INFO - Iter(train) [164500/640000] base_lr: 1.6944e-04 lr: 1.7222e-05 eta: 6 days, 3:13:19 time: 1.1066 data_time: 0.0344 memory: 21513 grad_norm: 2.7227 loss: 1.4740 caption_loss_cls: 2.4042 grounding_loss_reg: 3.1201 detection_loss_cls: 0.0433 detection_loss_reg: 0.3668 semantic_segmentation_loss_cls: 0.0117 instance_segmentation_loss_cls: 0.0445 instance_segmentation_loss_reg: 0.3683 instance_segmentation_loss_poly: 0.9856 +2023/10/30 01:20:25 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231029_192652 +2023/10/30 01:20:25 - mmengine - INFO - Iter(train) [165000/640000] base_lr: 1.6926e-04 lr: 1.7206e-05 eta: 6 days, 2:56:54 time: 1.1018 data_time: 0.0344 memory: 21513 grad_norm: 2.7422 loss: 1.4797 caption_loss_cls: 2.4031 grounding_loss_reg: 3.1155 detection_loss_cls: 0.0433 detection_loss_reg: 0.3668 semantic_segmentation_loss_cls: 0.0117 instance_segmentation_loss_cls: 0.0444 instance_segmentation_loss_reg: 0.3685 instance_segmentation_loss_poly: 0.9861 +2023/10/30 01:20:25 - mmengine - INFO - Saving checkpoint at 165000 iterations +2023/10/30 01:29:56 - mmengine - INFO - Iter(train) [165500/640000] base_lr: 1.6909e-04 lr: 1.7190e-05 eta: 6 days, 2:53:23 time: 1.1006 data_time: 0.0344 memory: 21513 grad_norm: 2.7683 loss: 1.4939 caption_loss_cls: 2.4012 grounding_loss_reg: 3.1156 detection_loss_cls: 0.0433 detection_loss_reg: 0.3668 semantic_segmentation_loss_cls: 0.0117 instance_segmentation_loss_cls: 0.0444 instance_segmentation_loss_reg: 0.3688 instance_segmentation_loss_poly: 0.9867 +2023/10/30 01:39:14 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231029_192652 +2023/10/30 01:39:14 - mmengine - INFO - Iter(train) [166000/640000] base_lr: 1.6891e-04 lr: 1.7174e-05 eta: 6 days, 2:44:22 time: 1.1039 data_time: 0.0342 memory: 21513 grad_norm: 2.7694 loss: 1.4835 caption_loss_cls: 2.4044 grounding_loss_reg: 3.1108 detection_loss_cls: 0.0432 detection_loss_reg: 0.3663 semantic_segmentation_loss_cls: 0.0117 instance_segmentation_loss_cls: 0.0443 instance_segmentation_loss_reg: 0.3678 instance_segmentation_loss_poly: 0.9853 +2023/10/30 01:39:14 - mmengine - INFO - Saving checkpoint at 166000 iterations +2023/10/30 01:48:20 - mmengine - INFO - Iter(train) [166500/640000] base_lr: 1.6874e-04 lr: 1.7158e-05 eta: 6 days, 2:30:31 time: 1.0998 data_time: 0.0337 memory: 21513 grad_norm: 2.7583 loss: 1.4759 caption_loss_cls: 2.4065 grounding_loss_reg: 3.1101 detection_loss_cls: 0.0431 detection_loss_reg: 0.3669 semantic_segmentation_loss_cls: 0.0117 instance_segmentation_loss_cls: 0.0441 instance_segmentation_loss_reg: 0.3669 instance_segmentation_loss_poly: 0.9842 +2023/10/30 01:57:28 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231029_192652 +2023/10/30 01:57:28 - mmengine - INFO - Iter(train) [167000/640000] base_lr: 1.6856e-04 lr: 1.7142e-05 eta: 6 days, 2:17:34 time: 1.0967 data_time: 0.0336 memory: 21513 grad_norm: 2.7573 loss: 1.4809 caption_loss_cls: 2.4069 grounding_loss_reg: 3.1082 detection_loss_cls: 0.0431 detection_loss_reg: 0.3668 semantic_segmentation_loss_cls: 0.0117 instance_segmentation_loss_cls: 0.0443 instance_segmentation_loss_reg: 0.3678 instance_segmentation_loss_poly: 0.9857 +2023/10/30 01:57:28 - mmengine - INFO - Saving checkpoint at 167000 iterations +2023/10/30 02:07:07 - mmengine - INFO - Iter(train) [167500/640000] base_lr: 1.6838e-04 lr: 1.7125e-05 eta: 6 days, 2:16:49 time: 1.1066 data_time: 0.0338 memory: 21513 grad_norm: 2.7452 loss: 1.4696 caption_loss_cls: 2.4093 grounding_loss_reg: 3.1081 detection_loss_cls: 0.0430 detection_loss_reg: 0.3657 semantic_segmentation_loss_cls: 0.0117 instance_segmentation_loss_cls: 0.0441 instance_segmentation_loss_reg: 0.3663 instance_segmentation_loss_poly: 0.9832 +2023/10/30 02:16:19 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231029_192652 +2023/10/30 02:16:19 - mmengine - INFO - Iter(train) [168000/640000] base_lr: 1.6820e-04 lr: 1.7109e-05 eta: 6 days, 2:05:39 time: 1.1130 data_time: 0.0340 memory: 21513 grad_norm: 2.7241 loss: 1.4613 caption_loss_cls: 2.4092 grounding_loss_reg: 3.1071 detection_loss_cls: 0.0432 detection_loss_reg: 0.3658 semantic_segmentation_loss_cls: 0.0117 instance_segmentation_loss_cls: 0.0441 instance_segmentation_loss_reg: 0.3666 instance_segmentation_loss_poly: 0.9833 +2023/10/30 02:16:19 - mmengine - INFO - Saving checkpoint at 168000 iterations +2023/10/30 02:25:20 - mmengine - INFO - Iter(train) [168500/640000] base_lr: 1.6802e-04 lr: 1.7093e-05 eta: 6 days, 1:50:13 time: 1.1086 data_time: 0.0338 memory: 21513 grad_norm: 2.7849 loss: 1.4751 caption_loss_cls: 2.4092 grounding_loss_reg: 3.1049 detection_loss_cls: 0.0433 detection_loss_reg: 0.3658 semantic_segmentation_loss_cls: 0.0117 instance_segmentation_loss_cls: 0.0442 instance_segmentation_loss_reg: 0.3669 instance_segmentation_loss_poly: 0.9838 +2023/10/30 02:34:40 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231029_192652 +2023/10/30 02:34:40 - mmengine - INFO - Iter(train) [169000/640000] base_lr: 1.6784e-04 lr: 1.7077e-05 eta: 6 days, 1:42:07 time: 1.1133 data_time: 0.0342 memory: 21513 grad_norm: 2.7577 loss: 1.4742 caption_loss_cls: 2.4124 grounding_loss_reg: 3.1059 detection_loss_cls: 0.0432 detection_loss_reg: 0.3655 semantic_segmentation_loss_cls: 0.0117 instance_segmentation_loss_cls: 0.0443 instance_segmentation_loss_reg: 0.3671 instance_segmentation_loss_poly: 0.9836 +2023/10/30 02:34:40 - mmengine - INFO - Saving checkpoint at 169000 iterations +2023/10/30 02:44:16 - mmengine - INFO - Iter(train) [169500/640000] base_lr: 1.6766e-04 lr: 1.7060e-05 eta: 6 days, 1:39:34 time: 1.1148 data_time: 0.0342 memory: 21513 grad_norm: 2.7785 loss: 1.4748 caption_loss_cls: 2.4092 grounding_loss_reg: 3.1060 detection_loss_cls: 0.0432 detection_loss_reg: 0.3659 semantic_segmentation_loss_cls: 0.0116 instance_segmentation_loss_cls: 0.0443 instance_segmentation_loss_reg: 0.3666 instance_segmentation_loss_poly: 0.9820 +2023/10/30 02:53:57 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231029_192652 +2023/10/30 02:53:57 - mmengine - INFO - Iter(train) [170000/640000] base_lr: 1.6748e-04 lr: 1.7044e-05 eta: 6 days, 1:38:18 time: 1.1205 data_time: 0.0342 memory: 21513 grad_norm: 2.7575 loss: 1.4723 caption_loss_cls: 2.4140 grounding_loss_reg: 3.1094 detection_loss_cls: 0.0432 detection_loss_reg: 0.3655 semantic_segmentation_loss_cls: 0.0116 instance_segmentation_loss_cls: 0.0446 instance_segmentation_loss_reg: 0.3681 instance_segmentation_loss_poly: 0.9834 +2023/10/30 02:53:57 - mmengine - INFO - Saving checkpoint at 170000 iterations +2023/10/30 03:03:34 - mmengine - INFO - Iter(train) [170500/640000] base_lr: 1.6730e-04 lr: 1.7028e-05 eta: 6 days, 1:35:24 time: 1.1283 data_time: 0.0348 memory: 21513 grad_norm: 2.7424 loss: 1.4753 caption_loss_cls: 2.4135 grounding_loss_reg: 3.1094 detection_loss_cls: 0.0432 detection_loss_reg: 0.3660 semantic_segmentation_loss_cls: 0.0116 instance_segmentation_loss_cls: 0.0448 instance_segmentation_loss_reg: 0.3684 instance_segmentation_loss_poly: 0.9835 +2023/10/30 03:12:33 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231029_192652 +2023/10/30 03:12:33 - mmengine - INFO - Iter(train) [171000/640000] base_lr: 1.6712e-04 lr: 1.7011e-05 eta: 6 days, 1:19:44 time: 1.1260 data_time: 0.0348 memory: 21513 grad_norm: 2.7606 loss: 1.4834 caption_loss_cls: 2.4158 grounding_loss_reg: 3.1081 detection_loss_cls: 0.0430 detection_loss_reg: 0.3648 semantic_segmentation_loss_cls: 0.0116 instance_segmentation_loss_cls: 0.0448 instance_segmentation_loss_reg: 0.3682 instance_segmentation_loss_poly: 0.9835 +2023/10/30 03:12:33 - mmengine - INFO - Saving checkpoint at 171000 iterations +2023/10/30 03:22:25 - mmengine - INFO - Iter(train) [171500/640000] base_lr: 1.6694e-04 lr: 1.6995e-05 eta: 6 days, 1:21:25 time: 1.1293 data_time: 0.0348 memory: 21513 grad_norm: 2.6972 loss: 1.4699 caption_loss_cls: 2.4135 grounding_loss_reg: 3.1089 detection_loss_cls: 0.0430 detection_loss_reg: 0.3653 semantic_segmentation_loss_cls: 0.0116 instance_segmentation_loss_cls: 0.0448 instance_segmentation_loss_reg: 0.3678 instance_segmentation_loss_poly: 0.9838 +2023/10/30 03:32:17 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231029_192652 +2023/10/30 03:32:17 - mmengine - INFO - Iter(train) [172000/640000] base_lr: 1.6676e-04 lr: 1.6978e-05 eta: 6 days, 1:22:17 time: 1.1391 data_time: 0.0353 memory: 21513 grad_norm: 2.6807 loss: 1.4709 caption_loss_cls: 2.4140 grounding_loss_reg: 3.1100 detection_loss_cls: 0.0430 detection_loss_reg: 0.3649 semantic_segmentation_loss_cls: 0.0116 instance_segmentation_loss_cls: 0.0449 instance_segmentation_loss_reg: 0.3690 instance_segmentation_loss_poly: 0.9854 +2023/10/30 03:32:17 - mmengine - INFO - Saving checkpoint at 172000 iterations +2023/10/30 03:41:51 - mmengine - INFO - Iter(train) [172500/640000] base_lr: 1.6658e-04 lr: 1.6962e-05 eta: 6 days, 1:17:24 time: 1.1474 data_time: 0.0356 memory: 21513 grad_norm: 2.6537 loss: 1.4724 caption_loss_cls: 2.4167 grounding_loss_reg: 3.1095 detection_loss_cls: 0.0431 detection_loss_reg: 0.3653 semantic_segmentation_loss_cls: 0.0116 instance_segmentation_loss_cls: 0.0450 instance_segmentation_loss_reg: 0.3702 instance_segmentation_loss_poly: 0.9885 +2023/10/30 03:52:13 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231029_192652 +2023/10/30 03:52:13 - mmengine - INFO - Iter(train) [173000/640000] base_lr: 1.6640e-04 lr: 1.6945e-05 eta: 6 days, 1:27:02 time: 1.1631 data_time: 0.0425 memory: 21513 grad_norm: 2.6294 loss: 1.4568 caption_loss_cls: 2.4162 grounding_loss_reg: 3.1089 detection_loss_cls: 0.0431 detection_loss_reg: 0.3657 semantic_segmentation_loss_cls: 0.0116 instance_segmentation_loss_cls: 0.0449 instance_segmentation_loss_reg: 0.3694 instance_segmentation_loss_poly: 0.9867 +2023/10/30 03:52:13 - mmengine - INFO - Saving checkpoint at 173000 iterations +2023/10/30 04:01:36 - mmengine - INFO - Iter(train) [173500/640000] base_lr: 1.6621e-04 lr: 1.6929e-05 eta: 6 days, 1:18:15 time: 1.1596 data_time: 0.0425 memory: 21513 grad_norm: 2.5786 loss: 1.4491 caption_loss_cls: 2.4170 grounding_loss_reg: 3.1075 detection_loss_cls: 0.0431 detection_loss_reg: 0.3663 semantic_segmentation_loss_cls: 0.0115 instance_segmentation_loss_cls: 0.0449 instance_segmentation_loss_reg: 0.3700 instance_segmentation_loss_poly: 0.9877 +2023/10/30 04:10:52 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231029_192652 +2023/10/30 04:10:52 - mmengine - INFO - Iter(train) [174000/640000] base_lr: 1.6603e-04 lr: 1.6912e-05 eta: 6 days, 1:07:25 time: 1.1533 data_time: 0.0422 memory: 21513 grad_norm: 2.6074 loss: 1.4498 caption_loss_cls: 2.4148 grounding_loss_reg: 3.1079 detection_loss_cls: 0.0432 detection_loss_reg: 0.3663 semantic_segmentation_loss_cls: 0.0115 instance_segmentation_loss_cls: 0.0449 instance_segmentation_loss_reg: 0.3699 instance_segmentation_loss_poly: 0.9876 +2023/10/30 04:10:52 - mmengine - INFO - Saving checkpoint at 174000 iterations +2023/10/30 04:20:21 - mmengine - INFO - Iter(train) [174500/640000] base_lr: 1.6585e-04 lr: 1.6895e-05 eta: 6 days, 1:00:32 time: 1.1514 data_time: 0.0420 memory: 21513 grad_norm: 2.6103 loss: 1.4442 caption_loss_cls: 2.4115 grounding_loss_reg: 3.1066 detection_loss_cls: 0.0432 detection_loss_reg: 0.3666 semantic_segmentation_loss_cls: 0.0115 instance_segmentation_loss_cls: 0.0449 instance_segmentation_loss_reg: 0.3701 instance_segmentation_loss_poly: 0.9874 +2023/10/30 04:29:45 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231029_192652 +2023/10/30 04:29:45 - mmengine - INFO - Iter(train) [175000/640000] base_lr: 1.6566e-04 lr: 1.6879e-05 eta: 6 days, 0:51:56 time: 1.1576 data_time: 0.0420 memory: 21513 grad_norm: 2.5905 loss: 1.4322 caption_loss_cls: 2.4098 grounding_loss_reg: 3.1053 detection_loss_cls: 0.0430 detection_loss_reg: 0.3666 semantic_segmentation_loss_cls: 0.0114 instance_segmentation_loss_cls: 0.0449 instance_segmentation_loss_reg: 0.3701 instance_segmentation_loss_poly: 0.9870 +2023/10/30 04:29:45 - mmengine - INFO - Saving checkpoint at 175000 iterations +2023/10/30 04:39:03 - mmengine - INFO - Iter(train) [175500/640000] base_lr: 1.6548e-04 lr: 1.6862e-05 eta: 6 days, 0:41:50 time: 1.1490 data_time: 0.0417 memory: 21513 grad_norm: 2.6500 loss: 1.4462 caption_loss_cls: 2.4123 grounding_loss_reg: 3.1051 detection_loss_cls: 0.0430 detection_loss_reg: 0.3663 semantic_segmentation_loss_cls: 0.0115 instance_segmentation_loss_cls: 0.0449 instance_segmentation_loss_reg: 0.3700 instance_segmentation_loss_poly: 0.9867 +2023/10/30 04:47:43 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231029_192652 +2023/10/30 04:47:44 - mmengine - INFO - Iter(train) [176000/640000] base_lr: 1.6530e-04 lr: 1.6845e-05 eta: 6 days, 0:21:43 time: 1.1313 data_time: 0.0411 memory: 21513 grad_norm: 2.7094 loss: 1.4594 caption_loss_cls: 2.4127 grounding_loss_reg: 3.1011 detection_loss_cls: 0.0428 detection_loss_reg: 0.3661 semantic_segmentation_loss_cls: 0.0114 instance_segmentation_loss_cls: 0.0448 instance_segmentation_loss_reg: 0.3699 instance_segmentation_loss_poly: 0.9869 +2023/10/30 04:47:44 - mmengine - INFO - Saving checkpoint at 176000 iterations +2023/10/30 04:57:10 - mmengine - INFO - Iter(train) [176500/640000] base_lr: 1.6511e-04 lr: 1.6828e-05 eta: 6 days, 0:13:55 time: 1.1294 data_time: 0.0411 memory: 21513 grad_norm: 2.7311 loss: 1.4548 caption_loss_cls: 2.4126 grounding_loss_reg: 3.1010 detection_loss_cls: 0.0427 detection_loss_reg: 0.3649 semantic_segmentation_loss_cls: 0.0114 instance_segmentation_loss_cls: 0.0449 instance_segmentation_loss_reg: 0.3697 instance_segmentation_loss_poly: 0.9850 +2023/10/30 05:06:14 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231029_192652 +2023/10/30 05:06:14 - mmengine - INFO - Iter(train) [177000/640000] base_lr: 1.6493e-04 lr: 1.6811e-05 eta: 6 days, 0:00:26 time: 1.1097 data_time: 0.0339 memory: 21513 grad_norm: 2.7834 loss: 1.4732 caption_loss_cls: 2.4129 grounding_loss_reg: 3.1022 detection_loss_cls: 0.0427 detection_loss_reg: 0.3649 semantic_segmentation_loss_cls: 0.0114 instance_segmentation_loss_cls: 0.0450 instance_segmentation_loss_reg: 0.3696 instance_segmentation_loss_poly: 0.9835 +2023/10/30 05:06:14 - mmengine - INFO - Saving checkpoint at 177000 iterations +2023/10/30 05:16:23 - mmengine - INFO - Iter(train) [177500/640000] base_lr: 1.6474e-04 lr: 1.6795e-05 eta: 6 days, 0:03:29 time: 1.1213 data_time: 0.0344 memory: 21513 grad_norm: 2.7987 loss: 1.4798 caption_loss_cls: 2.4142 grounding_loss_reg: 3.0991 detection_loss_cls: 0.0426 detection_loss_reg: 0.3637 semantic_segmentation_loss_cls: 0.0114 instance_segmentation_loss_cls: 0.0451 instance_segmentation_loss_reg: 0.3697 instance_segmentation_loss_poly: 0.9839 +2023/10/30 05:25:51 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231029_192652 +2023/10/30 05:25:51 - mmengine - INFO - Iter(train) [178000/640000] base_lr: 1.6455e-04 lr: 1.6778e-05 eta: 5 days, 23:55:58 time: 1.1244 data_time: 0.0348 memory: 21513 grad_norm: 2.7796 loss: 1.4836 caption_loss_cls: 2.4096 grounding_loss_reg: 3.0995 detection_loss_cls: 0.0426 detection_loss_reg: 0.3642 semantic_segmentation_loss_cls: 0.0114 instance_segmentation_loss_cls: 0.0449 instance_segmentation_loss_reg: 0.3686 instance_segmentation_loss_poly: 0.9829 +2023/10/30 05:25:51 - mmengine - INFO - Saving checkpoint at 178000 iterations +2023/10/30 05:35:12 - mmengine - INFO - Iter(train) [178500/640000] base_lr: 1.6437e-04 lr: 1.6761e-05 eta: 5 days, 23:46:37 time: 1.1223 data_time: 0.0344 memory: 21513 grad_norm: 2.7611 loss: 1.4633 caption_loss_cls: 2.4110 grounding_loss_reg: 3.0972 detection_loss_cls: 0.0424 detection_loss_reg: 0.3628 semantic_segmentation_loss_cls: 0.0114 instance_segmentation_loss_cls: 0.0448 instance_segmentation_loss_reg: 0.3673 instance_segmentation_loss_poly: 0.9805 +2023/10/30 05:44:29 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231029_192652 +2023/10/30 05:44:29 - mmengine - INFO - Iter(train) [179000/640000] base_lr: 1.6418e-04 lr: 1.6744e-05 eta: 5 days, 23:36:16 time: 1.1206 data_time: 0.0346 memory: 21513 grad_norm: 2.7738 loss: 1.4659 caption_loss_cls: 2.4095 grounding_loss_reg: 3.0975 detection_loss_cls: 0.0423 detection_loss_reg: 0.3613 semantic_segmentation_loss_cls: 0.0114 instance_segmentation_loss_cls: 0.0447 instance_segmentation_loss_reg: 0.3672 instance_segmentation_loss_poly: 0.9796 +2023/10/30 05:44:29 - mmengine - INFO - Saving checkpoint at 179000 iterations +2023/10/30 05:54:28 - mmengine - INFO - Iter(train) [179500/640000] base_lr: 1.6399e-04 lr: 1.6727e-05 eta: 5 days, 23:35:56 time: 1.1308 data_time: 0.0359 memory: 21513 grad_norm: 2.7425 loss: 1.4612 caption_loss_cls: 2.4118 grounding_loss_reg: 3.0996 detection_loss_cls: 0.0423 detection_loss_reg: 0.3610 semantic_segmentation_loss_cls: 0.0114 instance_segmentation_loss_cls: 0.0448 instance_segmentation_loss_reg: 0.3679 instance_segmentation_loss_poly: 0.9802 +2023/10/30 06:03:34 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231029_192652 +2023/10/30 06:03:34 - mmengine - INFO - Iter(train) [180000/640000] base_lr: 1.6381e-04 lr: 1.6710e-05 eta: 5 days, 23:22:59 time: 1.1372 data_time: 0.0360 memory: 21513 grad_norm: 2.7171 loss: 1.4520 caption_loss_cls: 2.4129 grounding_loss_reg: 3.1024 detection_loss_cls: 0.0424 detection_loss_reg: 0.3618 semantic_segmentation_loss_cls: 0.0113 instance_segmentation_loss_cls: 0.0448 instance_segmentation_loss_reg: 0.3684 instance_segmentation_loss_poly: 0.9814 +2023/10/30 06:03:34 - mmengine - INFO - Saving checkpoint at 180000 iterations +2023/10/30 06:12:18 - mmengine - INFO - Evaluating bbox... +2023/10/30 06:13:13 - mmengine - INFO - bbox_mAP_copypaste: 0.383 0.557 0.417 0.240 0.433 0.503 +2023/10/30 06:13:13 - mmengine - INFO - Evaluating segm... +2023/10/30 06:14:23 - mmengine - INFO - segm_mAP_copypaste: 0.246 0.467 0.234 0.125 0.292 0.393 +2023/10/30 06:18:55 - mmengine - INFO - per class results: +2023/10/30 06:18:55 - mmengine - INFO - ++---------------------+-------+-------+ +| Class | IoU | Acc | ++---------------------+-------+-------+ +| wall | 74.21 | 86.42 | +| building | 78.97 | 91.97 | +| sky | 92.69 | 97.72 | +| floor | 79.21 | 85.94 | +| tree | 70.95 | 83.24 | +| ceiling | 82.21 | 90.93 | +| road | 81.68 | 89.71 | +| bed | 85.0 | 94.47 | +| windowpane | 59.45 | 73.88 | +| grass | 69.16 | 84.51 | +| cabinet | 52.03 | 61.71 | +| sidewalk | 61.52 | 77.35 | +| person | 78.04 | 92.07 | +| earth | 36.67 | 50.01 | +| door | 41.39 | 55.27 | +| table | 52.18 | 72.17 | +| mountain | 53.64 | 72.43 | +| plant | 43.6 | 48.75 | +| curtain | 69.39 | 78.44 | +| chair | 48.81 | 65.01 | +| car | 81.05 | 91.89 | +| water | 42.5 | 49.53 | +| painting | 65.33 | 87.51 | +| sofa | 61.94 | 75.89 | +| shelf | 31.7 | 39.07 | +| house | 28.48 | 37.28 | +| sea | 52.11 | 84.78 | +| mirror | 58.75 | 67.14 | +| rug | 58.85 | 70.32 | +| field | 31.64 | 41.32 | +| armchair | 39.4 | 64.5 | +| seat | 46.14 | 57.75 | +| fence | 31.69 | 44.85 | +| desk | 27.89 | 79.54 | +| rock | 32.73 | 61.72 | +| wardrobe | 41.55 | 87.12 | +| lamp | 54.94 | 72.33 | +| bathtub | 66.07 | 74.97 | +| railing | 29.99 | 53.07 | +| cushion | 48.55 | 56.79 | +| base | 12.83 | 17.5 | +| box | 23.51 | 35.69 | +| column | 46.95 | 63.25 | +| signboard | 34.2 | 46.5 | +| chest of drawers | 41.2 | 66.89 | +| counter | 34.45 | 51.5 | +| sand | 44.46 | 55.51 | +| sink | 62.29 | 77.51 | +| skyscraper | 52.37 | 67.7 | +| fireplace | 59.94 | 71.87 | +| refrigerator | 61.34 | 87.95 | +| grandstand | 41.08 | 70.11 | +| path | 21.75 | 37.43 | +| stairs | 21.09 | 23.75 | +| runway | 70.62 | 87.05 | +| case | 32.94 | 37.75 | +| pool table | 88.69 | 95.39 | +| pillow | 50.33 | 68.85 | +| screen door | 21.76 | 22.46 | +| stairway | 29.08 | 46.12 | +| river | 24.5 | 65.92 | +| bridge | 35.71 | 53.42 | +| bookcase | 31.32 | 41.66 | +| blind | 24.05 | 26.91 | +| coffee table | 60.12 | 74.12 | +| toilet | 75.86 | 87.04 | +| flower | 31.63 | 67.45 | +| book | 43.92 | 68.32 | +| hill | 2.34 | 3.92 | +| bench | 44.84 | 64.14 | +| countertop | 47.82 | 53.69 | +| stove | 65.94 | 72.55 | +| palm | 47.91 | 66.52 | +| kitchen island | 35.44 | 52.19 | +| computer | 67.27 | 87.06 | +| swivel chair | 43.89 | 61.95 | +| boat | 61.27 | 79.19 | +| bar | 28.17 | 29.8 | +| arcade machine | 32.85 | 35.69 | +| hovel | 10.63 | 15.87 | +| bus | 83.06 | 95.54 | +| towel | 56.64 | 71.14 | +| light | 44.22 | 52.8 | +| truck | 30.2 | 49.73 | +| tower | 27.28 | 39.54 | +| chandelier | 62.47 | 77.02 | +| awning | 26.95 | 32.1 | +| streetlight | 21.78 | 29.59 | +| booth | 35.92 | 43.44 | +| television receiver | 54.07 | 78.94 | +| airplane | 58.74 | 65.15 | +| dirt track | 0.0 | 0.0 | +| apparel | 17.43 | 30.22 | +| pole | 19.07 | 26.21 | +| land | 1.96 | 4.1 | +| bannister | 10.15 | 11.83 | +| escalator | 16.52 | 18.98 | +| ottoman | 34.51 | 66.92 | +| bottle | 31.46 | 46.9 | +| buffet | 42.87 | 50.28 | +| poster | 35.57 | 48.95 | +| stage | 9.57 | 27.22 | +| van | 21.5 | 27.64 | +| ship | 65.04 | 85.03 | +| fountain | 13.56 | 13.8 | +| conveyer belt | 69.34 | 73.65 | +| canopy | 13.16 | 13.71 | +| washer | 45.63 | 56.02 | +| plaything | 18.04 | 29.38 | +| swimming pool | 43.09 | 87.48 | +| stool | 36.48 | 52.4 | +| barrel | 11.66 | 85.16 | +| basket | 27.83 | 38.27 | +| waterfall | 65.62 | 91.16 | +| tent | 76.82 | 96.84 | +| bag | 18.7 | 26.08 | +| minibike | 73.69 | 81.92 | +| cradle | 65.48 | 83.82 | +| oven | 30.84 | 38.35 | +| ball | 24.32 | 27.47 | +| food | 56.48 | 66.21 | +| step | 14.11 | 15.0 | +| tank | 29.3 | 36.69 | +| trade name | 26.15 | 39.57 | +| microwave | 58.2 | 68.03 | +| pot | 44.33 | 60.48 | +| animal | 63.53 | 68.14 | +| bicycle | 54.59 | 75.26 | +| lake | 58.36 | 59.69 | +| dishwasher | 45.64 | 58.53 | +| screen | 59.08 | 69.69 | +| blanket | 9.66 | 12.12 | +| sculpture | 46.13 | 54.51 | +| hood | 51.24 | 55.0 | +| sconce | 19.05 | 20.74 | +| vase | 32.8 | 41.77 | +| traffic light | 31.69 | 50.96 | +| tray | 5.93 | 17.14 | +| ashcan | 30.55 | 42.14 | +| fan | 46.87 | 69.18 | +| pier | 25.86 | 34.18 | +| crt screen | 7.22 | 22.85 | +| plate | 52.81 | 63.93 | +| monitor | 0.2 | 0.26 | +| bulletin board | 17.12 | 22.18 | +| shower | 0.65 | 2.84 | +| radiator | 41.88 | 48.52 | +| glass | 15.4 | 17.76 | +| clock | 21.4 | 22.88 | +| flag | 28.13 | 31.19 | ++---------------------+-------+-------+ +2023/10/30 06:19:11 - mmengine - INFO - Iter(val) [209/209] coco/bbox_mAP: 0.3830 coco/bbox_mAP_50: 0.5570 coco/bbox_mAP_75: 0.4170 coco/bbox_mAP_s: 0.2400 coco/bbox_mAP_m: 0.4330 coco/bbox_mAP_l: 0.5030 coco/segm_mAP: 0.2460 coco/segm_mAP_50: 0.4670 coco/segm_mAP_75: 0.2340 coco/segm_mAP_s: 0.1250 coco/segm_mAP_m: 0.2920 coco/segm_mAP_l: 0.3930 Bleu_1: 0.6961 Bleu_2: 0.5220 Bleu_3: 0.3850 Bleu_4: 0.2842 METEOR: 0.2411 ROUGE_L: 0.5164 CIDEr: 0.8820 SPICE: 0.1752 aAcc: 80.0100 mIoU: 42.2900 mAcc: 55.4000 visual-grounding/miou: 0.7249 visual-grounding/acc: 0.8065 data_time: 0.0055 time: 0.5262 +2023/10/30 06:28:01 - mmengine - INFO - Iter(train) [180500/640000] base_lr: 1.6362e-04 lr: 1.6692e-05 eta: 5 days, 23:07:05 time: 1.1288 data_time: 0.0331 memory: 21513 grad_norm: 2.7193 loss: 1.4580 caption_loss_cls: 2.4157 grounding_loss_reg: 3.1010 detection_loss_cls: 0.0425 detection_loss_reg: 0.3623 semantic_segmentation_loss_cls: 0.0113 instance_segmentation_loss_cls: 0.0447 instance_segmentation_loss_reg: 0.3683 instance_segmentation_loss_poly: 0.9810 +2023/10/30 06:37:24 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231029_192652 +2023/10/30 06:37:24 - mmengine - INFO - Iter(train) [181000/640000] base_lr: 1.6343e-04 lr: 1.6675e-05 eta: 5 days, 22:58:16 time: 1.1336 data_time: 0.0333 memory: 21513 grad_norm: 2.7000 loss: 1.4539 caption_loss_cls: 2.4145 grounding_loss_reg: 3.0978 detection_loss_cls: 0.0425 detection_loss_reg: 0.3618 semantic_segmentation_loss_cls: 0.0113 instance_segmentation_loss_cls: 0.0446 instance_segmentation_loss_reg: 0.3682 instance_segmentation_loss_poly: 0.9804 +2023/10/30 06:37:24 - mmengine - INFO - Saving checkpoint at 181000 iterations +2023/10/30 06:46:58 - mmengine - INFO - Iter(train) [181500/640000] base_lr: 1.6324e-04 lr: 1.6658e-05 eta: 5 days, 22:51:44 time: 1.1247 data_time: 0.0332 memory: 21513 grad_norm: 2.6992 loss: 1.4580 caption_loss_cls: 2.4146 grounding_loss_reg: 3.0966 detection_loss_cls: 0.0424 detection_loss_reg: 0.3613 semantic_segmentation_loss_cls: 0.0113 instance_segmentation_loss_cls: 0.0444 instance_segmentation_loss_reg: 0.3683 instance_segmentation_loss_poly: 0.9805 +2023/10/30 06:56:04 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231029_192652 +2023/10/30 06:56:04 - mmengine - INFO - Iter(train) [182000/640000] base_lr: 1.6305e-04 lr: 1.6641e-05 eta: 5 days, 22:39:08 time: 1.1192 data_time: 0.0329 memory: 21513 grad_norm: 2.7008 loss: 1.4553 caption_loss_cls: 2.4169 grounding_loss_reg: 3.0930 detection_loss_cls: 0.0426 detection_loss_reg: 0.3631 semantic_segmentation_loss_cls: 0.0113 instance_segmentation_loss_cls: 0.0444 instance_segmentation_loss_reg: 0.3670 instance_segmentation_loss_poly: 0.9784 +2023/10/30 06:56:04 - mmengine - INFO - Saving checkpoint at 182000 iterations +2023/10/30 07:05:17 - mmengine - INFO - Iter(train) [182500/640000] base_lr: 1.6286e-04 lr: 1.6624e-05 eta: 5 days, 22:28:16 time: 1.1174 data_time: 0.0330 memory: 21513 grad_norm: 2.7263 loss: 1.4694 caption_loss_cls: 2.4210 grounding_loss_reg: 3.0910 detection_loss_cls: 0.0425 detection_loss_reg: 0.3616 semantic_segmentation_loss_cls: 0.0112 instance_segmentation_loss_cls: 0.0444 instance_segmentation_loss_reg: 0.3667 instance_segmentation_loss_poly: 0.9773 +2023/10/30 07:14:24 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231029_192652 +2023/10/30 07:14:24 - mmengine - INFO - Iter(train) [183000/640000] base_lr: 1.6267e-04 lr: 1.6607e-05 eta: 5 days, 22:15:56 time: 1.1149 data_time: 0.0330 memory: 21513 grad_norm: 2.7152 loss: 1.4682 caption_loss_cls: 2.4230 grounding_loss_reg: 3.0925 detection_loss_cls: 0.0424 detection_loss_reg: 0.3611 semantic_segmentation_loss_cls: 0.0112 instance_segmentation_loss_cls: 0.0444 instance_segmentation_loss_reg: 0.3668 instance_segmentation_loss_poly: 0.9788 +2023/10/30 07:14:24 - mmengine - INFO - Saving checkpoint at 183000 iterations +2023/10/30 07:24:07 - mmengine - INFO - Iter(train) [183500/640000] base_lr: 1.6248e-04 lr: 1.6589e-05 eta: 5 days, 22:11:15 time: 1.1108 data_time: 0.0321 memory: 21513 grad_norm: 2.7347 loss: 1.4748 caption_loss_cls: 2.4193 grounding_loss_reg: 3.0906 detection_loss_cls: 0.0424 detection_loss_reg: 0.3614 semantic_segmentation_loss_cls: 0.0112 instance_segmentation_loss_cls: 0.0443 instance_segmentation_loss_reg: 0.3667 instance_segmentation_loss_poly: 0.9781 +2023/10/30 07:33:40 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231029_192652 +2023/10/30 07:33:40 - mmengine - INFO - Iter(train) [184000/640000] base_lr: 1.6229e-04 lr: 1.6572e-05 eta: 5 days, 22:04:29 time: 1.1176 data_time: 0.0325 memory: 21513 grad_norm: 2.7560 loss: 1.4772 caption_loss_cls: 2.4169 grounding_loss_reg: 3.0917 detection_loss_cls: 0.0424 detection_loss_reg: 0.3611 semantic_segmentation_loss_cls: 0.0111 instance_segmentation_loss_cls: 0.0441 instance_segmentation_loss_reg: 0.3653 instance_segmentation_loss_poly: 0.9750 +2023/10/30 07:33:40 - mmengine - INFO - Saving checkpoint at 184000 iterations +2023/10/30 07:42:31 - mmengine - INFO - Iter(train) [184500/640000] base_lr: 1.6210e-04 lr: 1.6555e-05 eta: 5 days, 21:48:56 time: 1.1171 data_time: 0.0352 memory: 21513 grad_norm: 2.7763 loss: 1.4776 caption_loss_cls: 2.4163 grounding_loss_reg: 3.0907 detection_loss_cls: 0.0423 detection_loss_reg: 0.3602 semantic_segmentation_loss_cls: 0.0111 instance_segmentation_loss_cls: 0.0439 instance_segmentation_loss_reg: 0.3642 instance_segmentation_loss_poly: 0.9722 +2023/10/30 07:52:40 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231029_192652 +2023/10/30 07:52:40 - mmengine - INFO - Iter(train) [185000/640000] base_lr: 1.6191e-04 lr: 1.6537e-05 eta: 5 days, 21:49:17 time: 1.1286 data_time: 0.0354 memory: 21513 grad_norm: 2.7654 loss: 1.4769 caption_loss_cls: 2.4187 grounding_loss_reg: 3.0907 detection_loss_cls: 0.0423 detection_loss_reg: 0.3603 semantic_segmentation_loss_cls: 0.0111 instance_segmentation_loss_cls: 0.0438 instance_segmentation_loss_reg: 0.3646 instance_segmentation_loss_poly: 0.9723 +2023/10/30 07:52:40 - mmengine - INFO - Saving checkpoint at 185000 iterations +2023/10/30 08:02:58 - mmengine - INFO - Iter(train) [185500/640000] base_lr: 1.6172e-04 lr: 1.6520e-05 eta: 5 days, 21:51:10 time: 1.1398 data_time: 0.0363 memory: 21513 grad_norm: 2.7548 loss: 1.4648 caption_loss_cls: 2.4157 grounding_loss_reg: 3.0904 detection_loss_cls: 0.0423 detection_loss_reg: 0.3596 semantic_segmentation_loss_cls: 0.0111 instance_segmentation_loss_cls: 0.0438 instance_segmentation_loss_reg: 0.3645 instance_segmentation_loss_poly: 0.9707 +2023/10/30 08:12:03 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231029_192652 +2023/10/30 08:12:03 - mmengine - INFO - Iter(train) [186000/640000] base_lr: 1.6152e-04 lr: 1.6502e-05 eta: 5 days, 21:38:26 time: 1.1394 data_time: 0.0362 memory: 21513 grad_norm: 2.7669 loss: 1.4638 caption_loss_cls: 2.4148 grounding_loss_reg: 3.0921 detection_loss_cls: 0.0422 detection_loss_reg: 0.3595 semantic_segmentation_loss_cls: 0.0111 instance_segmentation_loss_cls: 0.0438 instance_segmentation_loss_reg: 0.3635 instance_segmentation_loss_poly: 0.9676 +2023/10/30 08:12:03 - mmengine - INFO - Saving checkpoint at 186000 iterations +2023/10/30 08:21:21 - mmengine - INFO - Iter(train) [186500/640000] base_lr: 1.6133e-04 lr: 1.6485e-05 eta: 5 days, 21:28:25 time: 1.1406 data_time: 0.0365 memory: 21513 grad_norm: 2.7704 loss: 1.4715 caption_loss_cls: 2.4148 grounding_loss_reg: 3.0892 detection_loss_cls: 0.0423 detection_loss_reg: 0.3601 semantic_segmentation_loss_cls: 0.0111 instance_segmentation_loss_cls: 0.0438 instance_segmentation_loss_reg: 0.3628 instance_segmentation_loss_poly: 0.9662 +2023/10/30 08:30:27 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231029_192652 +2023/10/30 08:30:27 - mmengine - INFO - Iter(train) [187000/640000] base_lr: 1.6114e-04 lr: 1.6467e-05 eta: 5 days, 21:16:06 time: 1.1404 data_time: 0.0362 memory: 21513 grad_norm: 2.7902 loss: 1.4703 caption_loss_cls: 2.4130 grounding_loss_reg: 3.0908 detection_loss_cls: 0.0422 detection_loss_reg: 0.3594 semantic_segmentation_loss_cls: 0.0111 instance_segmentation_loss_cls: 0.0436 instance_segmentation_loss_reg: 0.3627 instance_segmentation_loss_poly: 0.9654 +2023/10/30 08:30:27 - mmengine - INFO - Saving checkpoint at 187000 iterations +2023/10/30 08:39:19 - mmengine - INFO - Iter(train) [187500/640000] base_lr: 1.6095e-04 lr: 1.6450e-05 eta: 5 days, 21:01:11 time: 1.1276 data_time: 0.0357 memory: 21513 grad_norm: 2.7997 loss: 1.4703 caption_loss_cls: 2.4143 grounding_loss_reg: 3.0918 detection_loss_cls: 0.0421 detection_loss_reg: 0.3585 semantic_segmentation_loss_cls: 0.0111 instance_segmentation_loss_cls: 0.0437 instance_segmentation_loss_reg: 0.3638 instance_segmentation_loss_poly: 0.9676 +2023/10/30 08:48:27 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231029_192652 +2023/10/30 08:48:27 - mmengine - INFO - Iter(train) [188000/640000] base_lr: 1.6075e-04 lr: 1.6432e-05 eta: 5 days, 20:49:32 time: 1.1214 data_time: 0.0355 memory: 21513 grad_norm: 2.7643 loss: 1.4690 caption_loss_cls: 2.4135 grounding_loss_reg: 3.0947 detection_loss_cls: 0.0420 detection_loss_reg: 0.3586 semantic_segmentation_loss_cls: 0.0110 instance_segmentation_loss_cls: 0.0436 instance_segmentation_loss_reg: 0.3630 instance_segmentation_loss_poly: 0.9656 +2023/10/30 08:48:27 - mmengine - INFO - Saving checkpoint at 188000 iterations +2023/10/30 08:57:33 - mmengine - INFO - Iter(train) [188500/640000] base_lr: 1.6056e-04 lr: 1.6414e-05 eta: 5 days, 20:37:25 time: 1.1252 data_time: 0.0353 memory: 21513 grad_norm: 2.7439 loss: 1.4554 caption_loss_cls: 2.4118 grounding_loss_reg: 3.0920 detection_loss_cls: 0.0419 detection_loss_reg: 0.3586 semantic_segmentation_loss_cls: 0.0110 instance_segmentation_loss_cls: 0.0435 instance_segmentation_loss_reg: 0.3623 instance_segmentation_loss_poly: 0.9652 +2023/10/30 09:06:31 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231029_192652 +2023/10/30 09:06:31 - mmengine - INFO - Iter(train) [189000/640000] base_lr: 1.6036e-04 lr: 1.6397e-05 eta: 5 days, 20:23:57 time: 1.1074 data_time: 0.0350 memory: 21513 grad_norm: 2.7780 loss: 1.4667 caption_loss_cls: 2.4157 grounding_loss_reg: 3.0934 detection_loss_cls: 0.0419 detection_loss_reg: 0.3585 semantic_segmentation_loss_cls: 0.0110 instance_segmentation_loss_cls: 0.0436 instance_segmentation_loss_reg: 0.3635 instance_segmentation_loss_poly: 0.9676 +2023/10/30 09:06:31 - mmengine - INFO - Saving checkpoint at 189000 iterations +2023/10/30 09:15:45 - mmengine - INFO - Iter(train) [189500/640000] base_lr: 1.6017e-04 lr: 1.6379e-05 eta: 5 days, 20:13:33 time: 1.0915 data_time: 0.0338 memory: 21513 grad_norm: 2.8250 loss: 1.4832 caption_loss_cls: 2.4177 grounding_loss_reg: 3.0916 detection_loss_cls: 0.0419 detection_loss_reg: 0.3589 semantic_segmentation_loss_cls: 0.0110 instance_segmentation_loss_cls: 0.0435 instance_segmentation_loss_reg: 0.3627 instance_segmentation_loss_poly: 0.9666 +2023/10/30 09:25:21 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231029_192652 +2023/10/30 09:25:21 - mmengine - INFO - Iter(train) [190000/640000] base_lr: 1.5997e-04 lr: 1.6361e-05 eta: 5 days, 20:06:48 time: 1.0991 data_time: 0.0341 memory: 21513 grad_norm: 2.8087 loss: 1.4800 caption_loss_cls: 2.4155 grounding_loss_reg: 3.0922 detection_loss_cls: 0.0419 detection_loss_reg: 0.3595 semantic_segmentation_loss_cls: 0.0110 instance_segmentation_loss_cls: 0.0435 instance_segmentation_loss_reg: 0.3632 instance_segmentation_loss_poly: 0.9673 +2023/10/30 09:25:21 - mmengine - INFO - Saving checkpoint at 190000 iterations +2023/10/30 09:35:00 - mmengine - INFO - Iter(train) [190500/640000] base_lr: 1.5978e-04 lr: 1.6344e-05 eta: 5 days, 20:00:41 time: 1.1044 data_time: 0.0342 memory: 21513 grad_norm: 2.8236 loss: 1.4863 caption_loss_cls: 2.4141 grounding_loss_reg: 3.0894 detection_loss_cls: 0.0419 detection_loss_reg: 0.3595 semantic_segmentation_loss_cls: 0.0110 instance_segmentation_loss_cls: 0.0437 instance_segmentation_loss_reg: 0.3641 instance_segmentation_loss_poly: 0.9688 +2023/10/30 09:44:27 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231029_192652 +2023/10/30 09:44:27 - mmengine - INFO - Iter(train) [191000/640000] base_lr: 1.5958e-04 lr: 1.6326e-05 eta: 5 days, 19:52:18 time: 1.1095 data_time: 0.0343 memory: 21513 grad_norm: 2.8185 loss: 1.4854 caption_loss_cls: 2.4130 grounding_loss_reg: 3.0864 detection_loss_cls: 0.0420 detection_loss_reg: 0.3606 semantic_segmentation_loss_cls: 0.0110 instance_segmentation_loss_cls: 0.0436 instance_segmentation_loss_reg: 0.3635 instance_segmentation_loss_poly: 0.9662 +2023/10/30 09:44:27 - mmengine - INFO - Saving checkpoint at 191000 iterations +2023/10/30 09:54:00 - mmengine - INFO - Iter(train) [191500/640000] base_lr: 1.5939e-04 lr: 1.6308e-05 eta: 5 days, 19:45:05 time: 1.1200 data_time: 0.0345 memory: 21513 grad_norm: 2.8055 loss: 1.4782 caption_loss_cls: 2.4130 grounding_loss_reg: 3.0832 detection_loss_cls: 0.0420 detection_loss_reg: 0.3598 semantic_segmentation_loss_cls: 0.0110 instance_segmentation_loss_cls: 0.0437 instance_segmentation_loss_reg: 0.3636 instance_segmentation_loss_poly: 0.9660 +2023/10/30 10:03:13 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231029_192652 +2023/10/30 10:03:13 - mmengine - INFO - Iter(train) [192000/640000] base_lr: 1.5919e-04 lr: 1.6290e-05 eta: 5 days, 19:34:26 time: 1.1211 data_time: 0.0347 memory: 21513 grad_norm: 2.8365 loss: 1.4874 caption_loss_cls: 2.4133 grounding_loss_reg: 3.0789 detection_loss_cls: 0.0420 detection_loss_reg: 0.3601 semantic_segmentation_loss_cls: 0.0110 instance_segmentation_loss_cls: 0.0438 instance_segmentation_loss_reg: 0.3634 instance_segmentation_loss_poly: 0.9658 +2023/10/30 10:03:13 - mmengine - INFO - Saving checkpoint at 192000 iterations +2023/10/30 10:12:54 - mmengine - INFO - Iter(train) [192500/640000] base_lr: 1.5899e-04 lr: 1.6272e-05 eta: 5 days, 19:28:19 time: 1.1299 data_time: 0.0355 memory: 21513 grad_norm: 2.7960 loss: 1.4899 caption_loss_cls: 2.4132 grounding_loss_reg: 3.0789 detection_loss_cls: 0.0420 detection_loss_reg: 0.3600 semantic_segmentation_loss_cls: 0.0110 instance_segmentation_loss_cls: 0.0436 instance_segmentation_loss_reg: 0.3623 instance_segmentation_loss_poly: 0.9632 +2023/10/30 10:22:43 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231029_192652 +2023/10/30 10:22:43 - mmengine - INFO - Iter(train) [193000/640000] base_lr: 1.5880e-04 lr: 1.6254e-05 eta: 5 days, 19:23:24 time: 1.1426 data_time: 0.0358 memory: 21513 grad_norm: 2.7546 loss: 1.4688 caption_loss_cls: 2.4104 grounding_loss_reg: 3.0808 detection_loss_cls: 0.0421 detection_loss_reg: 0.3601 semantic_segmentation_loss_cls: 0.0110 instance_segmentation_loss_cls: 0.0438 instance_segmentation_loss_reg: 0.3623 instance_segmentation_loss_poly: 0.9628 +2023/10/30 10:22:43 - mmengine - INFO - Saving checkpoint at 193000 iterations +2023/10/30 10:32:57 - mmengine - INFO - Iter(train) [193500/640000] base_lr: 1.5860e-04 lr: 1.6236e-05 eta: 5 days, 19:22:32 time: 1.1576 data_time: 0.0380 memory: 21513 grad_norm: 2.7296 loss: 1.4564 caption_loss_cls: 2.4079 grounding_loss_reg: 3.0790 detection_loss_cls: 0.0420 detection_loss_reg: 0.3589 semantic_segmentation_loss_cls: 0.0110 instance_segmentation_loss_cls: 0.0439 instance_segmentation_loss_reg: 0.3626 instance_segmentation_loss_poly: 0.9648 +2023/10/30 10:42:39 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231029_192652 +2023/10/30 10:42:39 - mmengine - INFO - Iter(train) [194000/640000] base_lr: 1.5840e-04 lr: 1.6218e-05 eta: 5 days, 19:16:20 time: 1.1593 data_time: 0.0381 memory: 21513 grad_norm: 2.6783 loss: 1.4472 caption_loss_cls: 2.4112 grounding_loss_reg: 3.0809 detection_loss_cls: 0.0420 detection_loss_reg: 0.3588 semantic_segmentation_loss_cls: 0.0110 instance_segmentation_loss_cls: 0.0440 instance_segmentation_loss_reg: 0.3629 instance_segmentation_loss_poly: 0.9652 +2023/10/30 10:42:39 - mmengine - INFO - Saving checkpoint at 194000 iterations +2023/10/30 10:52:06 - mmengine - INFO - Iter(train) [194500/640000] base_lr: 1.5820e-04 lr: 1.6200e-05 eta: 5 days, 19:07:37 time: 1.1560 data_time: 0.0382 memory: 21513 grad_norm: 2.6723 loss: 1.4540 caption_loss_cls: 2.4151 grounding_loss_reg: 3.0808 detection_loss_cls: 0.0421 detection_loss_reg: 0.3584 semantic_segmentation_loss_cls: 0.0110 instance_segmentation_loss_cls: 0.0442 instance_segmentation_loss_reg: 0.3636 instance_segmentation_loss_poly: 0.9666 +2023/10/30 11:01:37 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231029_192652 +2023/10/30 11:01:37 - mmengine - INFO - Iter(train) [195000/640000] base_lr: 1.5801e-04 lr: 1.6182e-05 eta: 5 days, 18:59:37 time: 1.1572 data_time: 0.0384 memory: 21513 grad_norm: 2.6509 loss: 1.4539 caption_loss_cls: 2.4160 grounding_loss_reg: 3.0819 detection_loss_cls: 0.0422 detection_loss_reg: 0.3593 semantic_segmentation_loss_cls: 0.0110 instance_segmentation_loss_cls: 0.0443 instance_segmentation_loss_reg: 0.3633 instance_segmentation_loss_poly: 0.9654 +2023/10/30 11:01:37 - mmengine - INFO - Saving checkpoint at 195000 iterations +2023/10/30 11:11:07 - mmengine - INFO - Iter(train) [195500/640000] base_lr: 1.5781e-04 lr: 1.6164e-05 eta: 5 days, 18:51:26 time: 1.1563 data_time: 0.0384 memory: 21513 grad_norm: 2.6588 loss: 1.4633 caption_loss_cls: 2.4133 grounding_loss_reg: 3.0833 detection_loss_cls: 0.0422 detection_loss_reg: 0.3592 semantic_segmentation_loss_cls: 0.0110 instance_segmentation_loss_cls: 0.0444 instance_segmentation_loss_reg: 0.3637 instance_segmentation_loss_poly: 0.9655 +2023/10/30 11:20:36 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231029_192652 +2023/10/30 11:20:36 - mmengine - INFO - Iter(train) [196000/640000] base_lr: 1.5761e-04 lr: 1.6146e-05 eta: 5 days, 18:43:05 time: 1.1603 data_time: 0.0384 memory: 21513 grad_norm: 2.6119 loss: 1.4398 caption_loss_cls: 2.4175 grounding_loss_reg: 3.0810 detection_loss_cls: 0.0423 detection_loss_reg: 0.3594 semantic_segmentation_loss_cls: 0.0110 instance_segmentation_loss_cls: 0.0445 instance_segmentation_loss_reg: 0.3646 instance_segmentation_loss_poly: 0.9676 +2023/10/30 11:20:36 - mmengine - INFO - Saving checkpoint at 196000 iterations +2023/10/30 11:30:01 - mmengine - INFO - Iter(train) [196500/640000] base_lr: 1.5741e-04 lr: 1.6128e-05 eta: 5 days, 18:34:01 time: 1.1563 data_time: 0.0377 memory: 21513 grad_norm: 2.6313 loss: 1.4366 caption_loss_cls: 2.4172 grounding_loss_reg: 3.0812 detection_loss_cls: 0.0423 detection_loss_reg: 0.3599 semantic_segmentation_loss_cls: 0.0110 instance_segmentation_loss_cls: 0.0443 instance_segmentation_loss_reg: 0.3639 instance_segmentation_loss_poly: 0.9670 +2023/10/30 11:39:30 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231029_192652 +2023/10/30 11:39:30 - mmengine - INFO - Iter(train) [197000/640000] base_lr: 1.5721e-04 lr: 1.6110e-05 eta: 5 days, 18:25:39 time: 1.1515 data_time: 0.0375 memory: 21513 grad_norm: 2.6605 loss: 1.4432 caption_loss_cls: 2.4145 grounding_loss_reg: 3.0777 detection_loss_cls: 0.0423 detection_loss_reg: 0.3606 semantic_segmentation_loss_cls: 0.0110 instance_segmentation_loss_cls: 0.0440 instance_segmentation_loss_reg: 0.3623 instance_segmentation_loss_poly: 0.9641 +2023/10/30 11:39:30 - mmengine - INFO - Saving checkpoint at 197000 iterations +2023/10/30 11:48:53 - mmengine - INFO - Iter(train) [197500/640000] base_lr: 1.5701e-04 lr: 1.6092e-05 eta: 5 days, 18:16:11 time: 1.1384 data_time: 0.0355 memory: 21513 grad_norm: 2.6605 loss: 1.4432 caption_loss_cls: 2.4117 grounding_loss_reg: 3.0787 detection_loss_cls: 0.0422 detection_loss_reg: 0.3604 semantic_segmentation_loss_cls: 0.0110 instance_segmentation_loss_cls: 0.0440 instance_segmentation_loss_reg: 0.3626 instance_segmentation_loss_poly: 0.9633 +2023/10/30 11:57:50 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231029_192652 +2023/10/30 11:57:50 - mmengine - INFO - Iter(train) [198000/640000] base_lr: 1.5681e-04 lr: 1.6073e-05 eta: 5 days, 18:03:09 time: 1.1272 data_time: 0.0352 memory: 21513 grad_norm: 2.7222 loss: 1.4552 caption_loss_cls: 2.4167 grounding_loss_reg: 3.0761 detection_loss_cls: 0.0421 detection_loss_reg: 0.3595 semantic_segmentation_loss_cls: 0.0110 instance_segmentation_loss_cls: 0.0441 instance_segmentation_loss_reg: 0.3635 instance_segmentation_loss_poly: 0.9654 +2023/10/30 11:57:50 - mmengine - INFO - Saving checkpoint at 198000 iterations +2023/10/30 12:07:28 - mmengine - INFO - Iter(train) [198500/640000] base_lr: 1.5661e-04 lr: 1.6055e-05 eta: 5 days, 17:55:59 time: 1.1301 data_time: 0.0349 memory: 21513 grad_norm: 2.7080 loss: 1.4284 caption_loss_cls: 2.4156 grounding_loss_reg: 3.0765 detection_loss_cls: 0.0421 detection_loss_reg: 0.3593 semantic_segmentation_loss_cls: 0.0110 instance_segmentation_loss_cls: 0.0440 instance_segmentation_loss_reg: 0.3631 instance_segmentation_loss_poly: 0.9646 +2023/10/30 12:17:42 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231029_192652 +2023/10/30 12:17:42 - mmengine - INFO - Iter(train) [199000/640000] base_lr: 1.5641e-04 lr: 1.6037e-05 eta: 5 days, 17:53:59 time: 1.1410 data_time: 0.0399 memory: 21513 grad_norm: 2.7259 loss: 1.4343 caption_loss_cls: 2.4196 grounding_loss_reg: 3.0720 detection_loss_cls: 0.0421 detection_loss_reg: 0.3600 semantic_segmentation_loss_cls: 0.0109 instance_segmentation_loss_cls: 0.0440 instance_segmentation_loss_reg: 0.3629 instance_segmentation_loss_poly: 0.9639 +2023/10/30 12:17:42 - mmengine - INFO - Saving checkpoint at 199000 iterations +2023/10/30 12:26:42 - mmengine - INFO - Iter(train) [199500/640000] base_lr: 1.5620e-04 lr: 1.6019e-05 eta: 5 days, 17:41:23 time: 1.1334 data_time: 0.0397 memory: 21513 grad_norm: 2.7421 loss: 1.4378 caption_loss_cls: 2.4212 grounding_loss_reg: 3.0718 detection_loss_cls: 0.0421 detection_loss_reg: 0.3607 semantic_segmentation_loss_cls: 0.0109 instance_segmentation_loss_cls: 0.0439 instance_segmentation_loss_reg: 0.3624 instance_segmentation_loss_poly: 0.9625 +2023/10/30 12:36:38 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231029_192652 +2023/10/30 12:36:38 - mmengine - INFO - Iter(train) [200000/640000] base_lr: 1.5600e-04 lr: 1.6000e-05 eta: 5 days, 17:36:30 time: 1.1399 data_time: 0.0400 memory: 21513 grad_norm: 2.7403 loss: 1.4466 caption_loss_cls: 2.4201 grounding_loss_reg: 3.0712 detection_loss_cls: 0.0420 detection_loss_reg: 0.3606 semantic_segmentation_loss_cls: 0.0109 instance_segmentation_loss_cls: 0.0441 instance_segmentation_loss_reg: 0.3638 instance_segmentation_loss_poly: 0.9645 +2023/10/30 12:36:38 - mmengine - INFO - Saving checkpoint at 200000 iterations +2023/10/30 12:45:27 - mmengine - INFO - Evaluating bbox... +2023/10/30 12:46:24 - mmengine - INFO - bbox_mAP_copypaste: 0.395 0.567 0.430 0.240 0.435 0.516 +2023/10/30 12:46:24 - mmengine - INFO - Evaluating segm... +2023/10/30 12:47:34 - mmengine - INFO - segm_mAP_copypaste: 0.257 0.478 0.247 0.126 0.292 0.399 +2023/10/30 12:52:31 - mmengine - INFO - per class results: +2023/10/30 12:52:31 - mmengine - INFO - ++---------------------+-------+-------+ +| Class | IoU | Acc | ++---------------------+-------+-------+ +| wall | 72.81 | 87.64 | +| building | 79.75 | 92.74 | +| sky | 91.17 | 98.36 | +| floor | 78.37 | 86.56 | +| tree | 69.2 | 81.81 | +| ceiling | 81.14 | 90.37 | +| road | 79.98 | 86.8 | +| bed | 83.69 | 91.56 | +| windowpane | 56.78 | 79.0 | +| grass | 66.76 | 80.44 | +| cabinet | 55.94 | 77.93 | +| sidewalk | 60.93 | 78.47 | +| person | 75.52 | 87.26 | +| earth | 36.91 | 54.36 | +| door | 46.3 | 61.84 | +| table | 53.89 | 72.54 | +| mountain | 50.96 | 69.2 | +| plant | 45.3 | 52.95 | +| curtain | 68.86 | 78.93 | +| chair | 51.88 | 64.78 | +| car | 79.01 | 85.97 | +| water | 44.78 | 62.38 | +| painting | 67.36 | 80.81 | +| sofa | 61.07 | 75.8 | +| shelf | 36.27 | 45.88 | +| house | 41.76 | 48.23 | +| sea | 42.65 | 62.32 | +| mirror | 59.23 | 70.28 | +| rug | 60.55 | 65.43 | +| field | 27.48 | 40.26 | +| armchair | 39.6 | 55.16 | +| seat | 56.27 | 78.06 | +| fence | 37.5 | 49.45 | +| desk | 40.97 | 64.15 | +| rock | 29.62 | 40.03 | +| wardrobe | 44.12 | 49.52 | +| lamp | 52.8 | 63.18 | +| bathtub | 69.11 | 77.79 | +| railing | 28.54 | 44.61 | +| cushion | 49.04 | 62.87 | +| base | 27.63 | 39.55 | +| box | 19.44 | 28.17 | +| column | 47.65 | 53.44 | +| signboard | 31.18 | 49.17 | +| chest of drawers | 31.32 | 46.0 | +| counter | 22.89 | 29.79 | +| sand | 30.26 | 47.46 | +| sink | 65.8 | 74.8 | +| skyscraper | 41.23 | 48.42 | +| fireplace | 66.08 | 80.47 | +| refrigerator | 64.4 | 73.43 | +| grandstand | 33.65 | 45.34 | +| path | 21.7 | 26.68 | +| stairs | 26.01 | 32.42 | +| runway | 72.67 | 93.26 | +| case | 39.21 | 55.8 | +| pool table | 88.88 | 94.13 | +| pillow | 48.12 | 70.34 | +| screen door | 62.8 | 76.75 | +| stairway | 32.61 | 38.73 | +| river | 15.71 | 32.73 | +| bridge | 56.67 | 78.91 | +| bookcase | 31.99 | 48.52 | +| blind | 20.56 | 23.34 | +| coffee table | 51.23 | 76.89 | +| toilet | 80.01 | 82.9 | +| flower | 24.69 | 36.61 | +| book | 44.62 | 66.14 | +| hill | 5.14 | 7.88 | +| bench | 39.88 | 47.41 | +| countertop | 52.08 | 64.08 | +| stove | 69.81 | 82.49 | +| palm | 42.71 | 61.16 | +| kitchen island | 32.74 | 65.07 | +| computer | 65.2 | 73.68 | +| swivel chair | 40.01 | 51.48 | +| boat | 69.08 | 78.43 | +| bar | 17.41 | 22.65 | +| arcade machine | 41.07 | 42.6 | +| hovel | 19.22 | 27.98 | +| bus | 84.25 | 94.26 | +| towel | 51.48 | 57.97 | +| light | 42.56 | 51.6 | +| truck | 34.75 | 47.85 | +| tower | 26.65 | 37.45 | +| chandelier | 54.57 | 66.85 | +| awning | 4.29 | 4.47 | +| streetlight | 17.47 | 20.08 | +| booth | 37.29 | 38.03 | +| television receiver | 66.23 | 72.9 | +| airplane | 51.76 | 60.97 | +| dirt track | 0.9 | 1.77 | +| apparel | 30.04 | 51.23 | +| pole | 22.3 | 25.57 | +| land | 0.0 | 0.0 | +| bannister | 6.61 | 7.85 | +| escalator | 10.5 | 10.83 | +| ottoman | 37.45 | 50.48 | +| bottle | 18.79 | 22.63 | +| buffet | 37.24 | 38.22 | +| poster | 35.01 | 44.32 | +| stage | 11.13 | 21.9 | +| van | 37.37 | 58.62 | +| ship | 66.14 | 75.21 | +| fountain | 1.61 | 1.63 | +| conveyer belt | 56.68 | 64.03 | +| canopy | 23.2 | 34.77 | +| washer | 52.07 | 52.57 | +| plaything | 17.86 | 19.09 | +| swimming pool | 41.48 | 69.66 | +| stool | 28.87 | 33.94 | +| barrel | 17.56 | 46.87 | +| basket | 29.61 | 44.38 | +| waterfall | 46.14 | 51.94 | +| tent | 79.27 | 97.58 | +| bag | 16.82 | 19.84 | +| minibike | 63.38 | 71.26 | +| cradle | 63.51 | 83.06 | +| oven | 15.23 | 42.17 | +| ball | 10.56 | 11.33 | +| food | 56.2 | 75.53 | +| step | 16.18 | 20.93 | +| tank | 37.53 | 49.18 | +| trade name | 0.0 | 0.0 | +| microwave | 35.55 | 38.89 | +| pot | 42.03 | 46.27 | +| animal | 57.33 | 63.62 | +| bicycle | 52.47 | 71.9 | +| lake | 55.48 | 55.52 | +| dishwasher | 42.48 | 46.94 | +| screen | 47.67 | 89.48 | +| blanket | 1.67 | 1.85 | +| sculpture | 33.5 | 54.15 | +| hood | 50.05 | 55.61 | +| sconce | 17.65 | 18.65 | +| vase | 34.1 | 42.07 | +| traffic light | 29.97 | 41.51 | +| tray | 3.27 | 4.13 | +| ashcan | 27.15 | 32.62 | +| fan | 36.81 | 40.74 | +| pier | 26.41 | 33.88 | +| crt screen | 8.37 | 10.24 | +| plate | 49.5 | 56.88 | +| monitor | 66.2 | 76.63 | +| bulletin board | 28.54 | 38.85 | +| shower | 0.0 | 0.0 | +| radiator | 23.2 | 24.0 | +| glass | 10.51 | 11.02 | +| clock | 19.72 | 24.13 | +| flag | 24.99 | 28.57 | ++---------------------+-------+-------+ +2023/10/30 12:52:46 - mmengine - INFO - Iter(val) [209/209] coco/bbox_mAP: 0.3950 coco/bbox_mAP_50: 0.5670 coco/bbox_mAP_75: 0.4300 coco/bbox_mAP_s: 0.2400 coco/bbox_mAP_m: 0.4350 coco/bbox_mAP_l: 0.5160 coco/segm_mAP: 0.2570 coco/segm_mAP_50: 0.4780 coco/segm_mAP_75: 0.2470 coco/segm_mAP_s: 0.1260 coco/segm_mAP_m: 0.2920 coco/segm_mAP_l: 0.3990 Bleu_1: 0.7066 Bleu_2: 0.5309 Bleu_3: 0.3898 Bleu_4: 0.2852 METEOR: 0.2414 ROUGE_L: 0.5178 CIDEr: 0.8872 SPICE: 0.1706 aAcc: 80.0200 mIoU: 41.6700 mAcc: 52.2000 visual-grounding/miou: 0.7249 visual-grounding/acc: 0.8044 data_time: 0.0045 time: 0.5286 +2023/10/30 13:02:43 - mmengine - INFO - Iter(train) [200500/640000] base_lr: 1.5580e-04 lr: 1.5982e-05 eta: 5 days, 17:31:53 time: 1.1483 data_time: 0.0393 memory: 21513 grad_norm: 2.7408 loss: 1.4530 caption_loss_cls: 2.4171 grounding_loss_reg: 3.0658 detection_loss_cls: 0.0419 detection_loss_reg: 0.3600 semantic_segmentation_loss_cls: 0.0109 instance_segmentation_loss_cls: 0.0441 instance_segmentation_loss_reg: 0.3641 instance_segmentation_loss_poly: 0.9656 +2023/10/30 13:11:57 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231029_192652 +2023/10/30 13:11:57 - mmengine - INFO - Iter(train) [201000/640000] base_lr: 1.5560e-04 lr: 1.5963e-05 eta: 5 days, 17:21:14 time: 1.1444 data_time: 0.0392 memory: 21513 grad_norm: 2.7334 loss: 1.4540 caption_loss_cls: 2.4184 grounding_loss_reg: 3.0633 detection_loss_cls: 0.0420 detection_loss_reg: 0.3615 semantic_segmentation_loss_cls: 0.0109 instance_segmentation_loss_cls: 0.0440 instance_segmentation_loss_reg: 0.3629 instance_segmentation_loss_poly: 0.9629 +2023/10/30 13:11:57 - mmengine - INFO - Saving checkpoint at 201000 iterations +2023/10/30 13:21:02 - mmengine - INFO - Iter(train) [201500/640000] base_lr: 1.5539e-04 lr: 1.5945e-05 eta: 5 days, 17:09:25 time: 1.1402 data_time: 0.0389 memory: 21513 grad_norm: 2.7340 loss: 1.4498 caption_loss_cls: 2.4176 grounding_loss_reg: 3.0634 detection_loss_cls: 0.0420 detection_loss_reg: 0.3616 semantic_segmentation_loss_cls: 0.0109 instance_segmentation_loss_cls: 0.0440 instance_segmentation_loss_reg: 0.3637 instance_segmentation_loss_poly: 0.9639 +2023/10/30 13:30:22 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231029_192652 +2023/10/30 13:30:22 - mmengine - INFO - Iter(train) [202000/640000] base_lr: 1.5519e-04 lr: 1.5926e-05 eta: 5 days, 16:59:31 time: 1.1458 data_time: 0.0392 memory: 21513 grad_norm: 2.7226 loss: 1.4546 caption_loss_cls: 2.4161 grounding_loss_reg: 3.0627 detection_loss_cls: 0.0417 detection_loss_reg: 0.3597 semantic_segmentation_loss_cls: 0.0109 instance_segmentation_loss_cls: 0.0441 instance_segmentation_loss_reg: 0.3650 instance_segmentation_loss_poly: 0.9665 +2023/10/30 13:30:22 - mmengine - INFO - Saving checkpoint at 202000 iterations +2023/10/30 13:40:18 - mmengine - INFO - Iter(train) [202500/640000] base_lr: 1.5499e-04 lr: 1.5908e-05 eta: 5 days, 16:54:28 time: 1.1503 data_time: 0.0392 memory: 21513 grad_norm: 2.7404 loss: 1.4690 caption_loss_cls: 2.4120 grounding_loss_reg: 3.0652 detection_loss_cls: 0.0418 detection_loss_reg: 0.3613 semantic_segmentation_loss_cls: 0.0109 instance_segmentation_loss_cls: 0.0441 instance_segmentation_loss_reg: 0.3647 instance_segmentation_loss_poly: 0.9654 +2023/10/30 13:48:34 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231029_192652 +2023/10/30 13:48:34 - mmengine - INFO - Iter(train) [203000/640000] base_lr: 1.5478e-04 lr: 1.5889e-05 eta: 5 days, 16:36:17 time: 1.1206 data_time: 0.0336 memory: 21513 grad_norm: 2.7733 loss: 1.4704 caption_loss_cls: 2.4097 grounding_loss_reg: 3.0597 detection_loss_cls: 0.0418 detection_loss_reg: 0.3608 semantic_segmentation_loss_cls: 0.0109 instance_segmentation_loss_cls: 0.0440 instance_segmentation_loss_reg: 0.3644 instance_segmentation_loss_poly: 0.9649 +2023/10/30 13:48:34 - mmengine - INFO - Saving checkpoint at 203000 iterations +2023/10/30 13:58:35 - mmengine - INFO - Iter(train) [203500/640000] base_lr: 1.5458e-04 lr: 1.5871e-05 eta: 5 days, 16:31:55 time: 1.1361 data_time: 0.0341 memory: 21513 grad_norm: 2.7387 loss: 1.4538 caption_loss_cls: 2.4120 grounding_loss_reg: 3.0581 detection_loss_cls: 0.0419 detection_loss_reg: 0.3616 semantic_segmentation_loss_cls: 0.0109 instance_segmentation_loss_cls: 0.0439 instance_segmentation_loss_reg: 0.3635 instance_segmentation_loss_poly: 0.9635 +2023/10/30 14:07:43 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231029_192652 +2023/10/30 14:07:43 - mmengine - INFO - Iter(train) [204000/640000] base_lr: 1.5438e-04 lr: 1.5852e-05 eta: 5 days, 16:20:36 time: 1.1242 data_time: 0.0337 memory: 21513 grad_norm: 2.7899 loss: 1.4610 caption_loss_cls: 2.4107 grounding_loss_reg: 3.0571 detection_loss_cls: 0.0418 detection_loss_reg: 0.3611 semantic_segmentation_loss_cls: 0.0109 instance_segmentation_loss_cls: 0.0438 instance_segmentation_loss_reg: 0.3624 instance_segmentation_loss_poly: 0.9618 +2023/10/30 14:07:43 - mmengine - INFO - Saving checkpoint at 204000 iterations +2023/10/30 14:17:00 - mmengine - INFO - Iter(train) [204500/640000] base_lr: 1.5417e-04 lr: 1.5834e-05 eta: 5 days, 16:10:21 time: 1.1138 data_time: 0.0343 memory: 21513 grad_norm: 2.7831 loss: 1.4510 caption_loss_cls: 2.4109 grounding_loss_reg: 3.0549 detection_loss_cls: 0.0418 detection_loss_reg: 0.3608 semantic_segmentation_loss_cls: 0.0109 instance_segmentation_loss_cls: 0.0438 instance_segmentation_loss_reg: 0.3622 instance_segmentation_loss_poly: 0.9617 +2023/10/30 14:25:54 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231029_192652 +2023/10/30 14:25:54 - mmengine - INFO - Iter(train) [205000/640000] base_lr: 1.5397e-04 lr: 1.5815e-05 eta: 5 days, 15:57:25 time: 1.1089 data_time: 0.0341 memory: 21513 grad_norm: 2.8122 loss: 1.4534 caption_loss_cls: 2.4126 grounding_loss_reg: 3.0563 detection_loss_cls: 0.0416 detection_loss_reg: 0.3597 semantic_segmentation_loss_cls: 0.0109 instance_segmentation_loss_cls: 0.0439 instance_segmentation_loss_reg: 0.3618 instance_segmentation_loss_poly: 0.9618 +2023/10/30 14:25:54 - mmengine - INFO - Saving checkpoint at 205000 iterations +2023/10/30 14:36:07 - mmengine - INFO - Iter(train) [205500/640000] base_lr: 1.5376e-04 lr: 1.5796e-05 eta: 5 days, 15:54:16 time: 1.1259 data_time: 0.0350 memory: 21513 grad_norm: 2.7797 loss: 1.4517 caption_loss_cls: 2.4096 grounding_loss_reg: 3.0542 detection_loss_cls: 0.0416 detection_loss_reg: 0.3600 semantic_segmentation_loss_cls: 0.0109 instance_segmentation_loss_cls: 0.0438 instance_segmentation_loss_reg: 0.3616 instance_segmentation_loss_poly: 0.9621 +2023/10/30 14:45:25 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231029_192652 +2023/10/30 14:45:25 - mmengine - INFO - Iter(train) [206000/640000] base_lr: 1.5355e-04 lr: 1.5778e-05 eta: 5 days, 15:44:10 time: 1.1254 data_time: 0.0348 memory: 21513 grad_norm: 2.7803 loss: 1.4433 caption_loss_cls: 2.4083 grounding_loss_reg: 3.0511 detection_loss_cls: 0.0416 detection_loss_reg: 0.3592 semantic_segmentation_loss_cls: 0.0109 instance_segmentation_loss_cls: 0.0437 instance_segmentation_loss_reg: 0.3616 instance_segmentation_loss_poly: 0.9617 +2023/10/30 14:45:25 - mmengine - INFO - Saving checkpoint at 206000 iterations +2023/10/30 14:55:00 - mmengine - INFO - Iter(train) [206500/640000] base_lr: 1.5335e-04 lr: 1.5759e-05 eta: 5 days, 15:36:17 time: 1.1202 data_time: 0.0350 memory: 21513 grad_norm: 2.7673 loss: 1.4366 caption_loss_cls: 2.4080 grounding_loss_reg: 3.0504 detection_loss_cls: 0.0416 detection_loss_reg: 0.3594 semantic_segmentation_loss_cls: 0.0109 instance_segmentation_loss_cls: 0.0437 instance_segmentation_loss_reg: 0.3618 instance_segmentation_loss_poly: 0.9622 +2023/10/30 15:04:23 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231029_192652 +2023/10/30 15:04:23 - mmengine - INFO - Iter(train) [207000/640000] base_lr: 1.5314e-04 lr: 1.5740e-05 eta: 5 days, 15:26:49 time: 1.1369 data_time: 0.0354 memory: 21513 grad_norm: 2.7311 loss: 1.4275 caption_loss_cls: 2.4068 grounding_loss_reg: 3.0448 detection_loss_cls: 0.0415 detection_loss_reg: 0.3588 semantic_segmentation_loss_cls: 0.0109 instance_segmentation_loss_cls: 0.0438 instance_segmentation_loss_reg: 0.3625 instance_segmentation_loss_poly: 0.9631 +2023/10/30 15:04:23 - mmengine - INFO - Saving checkpoint at 207000 iterations +2023/10/30 15:14:10 - mmengine - INFO - Iter(train) [207500/640000] base_lr: 1.5293e-04 lr: 1.5721e-05 eta: 5 days, 15:20:15 time: 1.1332 data_time: 0.0352 memory: 21513 grad_norm: 2.7594 loss: 1.4410 caption_loss_cls: 2.4099 grounding_loss_reg: 3.0425 detection_loss_cls: 0.0415 detection_loss_reg: 0.3595 semantic_segmentation_loss_cls: 0.0109 instance_segmentation_loss_cls: 0.0440 instance_segmentation_loss_reg: 0.3636 instance_segmentation_loss_poly: 0.9647 +2023/10/30 15:23:48 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231029_192652 +2023/10/30 15:23:48 - mmengine - INFO - Iter(train) [208000/640000] base_lr: 1.5273e-04 lr: 1.5703e-05 eta: 5 days, 15:12:36 time: 1.1407 data_time: 0.0356 memory: 21513 grad_norm: 2.7362 loss: 1.4394 caption_loss_cls: 2.4103 grounding_loss_reg: 3.0386 detection_loss_cls: 0.0415 detection_loss_reg: 0.3599 semantic_segmentation_loss_cls: 0.0109 instance_segmentation_loss_cls: 0.0442 instance_segmentation_loss_reg: 0.3655 instance_segmentation_loss_poly: 0.9677 +2023/10/30 15:23:48 - mmengine - INFO - Saving checkpoint at 208000 iterations +2023/10/30 15:34:04 - mmengine - INFO - Iter(train) [208500/640000] base_lr: 1.5252e-04 lr: 1.5684e-05 eta: 5 days, 15:09:19 time: 1.1556 data_time: 0.0369 memory: 21513 grad_norm: 2.7281 loss: 1.4440 caption_loss_cls: 2.4108 grounding_loss_reg: 3.0396 detection_loss_cls: 0.0417 detection_loss_reg: 0.3603 semantic_segmentation_loss_cls: 0.0109 instance_segmentation_loss_cls: 0.0441 instance_segmentation_loss_reg: 0.3649 instance_segmentation_loss_poly: 0.9652 +2023/10/30 15:42:46 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231029_192652 +2023/10/30 15:42:46 - mmengine - INFO - Iter(train) [209000/640000] base_lr: 1.5231e-04 lr: 1.5665e-05 eta: 5 days, 14:55:07 time: 1.1526 data_time: 0.0368 memory: 21513 grad_norm: 2.6923 loss: 1.4380 caption_loss_cls: 2.4047 grounding_loss_reg: 3.0359 detection_loss_cls: 0.0420 detection_loss_reg: 0.3627 semantic_segmentation_loss_cls: 0.0109 instance_segmentation_loss_cls: 0.0441 instance_segmentation_loss_reg: 0.3655 instance_segmentation_loss_poly: 0.9665 +2023/10/30 15:42:46 - mmengine - INFO - Saving checkpoint at 209000 iterations +2023/10/30 15:52:14 - mmengine - INFO - Iter(train) [209500/640000] base_lr: 1.5210e-04 lr: 1.5646e-05 eta: 5 days, 14:46:12 time: 1.1413 data_time: 0.0361 memory: 21513 grad_norm: 2.7158 loss: 1.4468 caption_loss_cls: 2.4033 grounding_loss_reg: 3.0349 detection_loss_cls: 0.0419 detection_loss_reg: 0.3631 semantic_segmentation_loss_cls: 0.0109 instance_segmentation_loss_cls: 0.0441 instance_segmentation_loss_reg: 0.3658 instance_segmentation_loss_poly: 0.9668 +2023/10/30 16:01:14 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231029_192652 +2023/10/30 16:01:14 - mmengine - INFO - Iter(train) [210000/640000] base_lr: 1.5190e-04 lr: 1.5627e-05 eta: 5 days, 14:34:05 time: 1.1369 data_time: 0.0360 memory: 21513 grad_norm: 2.7264 loss: 1.4530 caption_loss_cls: 2.4042 grounding_loss_reg: 3.0340 detection_loss_cls: 0.0419 detection_loss_reg: 0.3628 semantic_segmentation_loss_cls: 0.0109 instance_segmentation_loss_cls: 0.0440 instance_segmentation_loss_reg: 0.3654 instance_segmentation_loss_poly: 0.9669 +2023/10/30 16:01:14 - mmengine - INFO - Saving checkpoint at 210000 iterations +2023/10/30 16:10:41 - mmengine - INFO - Iter(train) [210500/640000] base_lr: 1.5169e-04 lr: 1.5608e-05 eta: 5 days, 14:25:05 time: 1.1347 data_time: 0.0361 memory: 21513 grad_norm: 2.7396 loss: 1.4593 caption_loss_cls: 2.4028 grounding_loss_reg: 3.0318 detection_loss_cls: 0.0419 detection_loss_reg: 0.3631 semantic_segmentation_loss_cls: 0.0109 instance_segmentation_loss_cls: 0.0440 instance_segmentation_loss_reg: 0.3656 instance_segmentation_loss_poly: 0.9669 +2023/10/30 16:20:18 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231029_192652 +2023/10/30 16:20:18 - mmengine - INFO - Iter(train) [211000/640000] base_lr: 1.5148e-04 lr: 1.5589e-05 eta: 5 days, 14:17:14 time: 1.1384 data_time: 0.0364 memory: 21513 grad_norm: 2.7334 loss: 1.4631 caption_loss_cls: 2.4026 grounding_loss_reg: 3.0315 detection_loss_cls: 0.0418 detection_loss_reg: 0.3627 semantic_segmentation_loss_cls: 0.0109 instance_segmentation_loss_cls: 0.0439 instance_segmentation_loss_reg: 0.3648 instance_segmentation_loss_poly: 0.9657 +2023/10/30 16:20:18 - mmengine - INFO - Saving checkpoint at 211000 iterations +2023/10/30 16:29:47 - mmengine - INFO - Iter(train) [211500/640000] base_lr: 1.5127e-04 lr: 1.5570e-05 eta: 5 days, 14:08:28 time: 1.1340 data_time: 0.0359 memory: 21513 grad_norm: 2.7016 loss: 1.4386 caption_loss_cls: 2.4006 grounding_loss_reg: 3.0327 detection_loss_cls: 0.0418 detection_loss_reg: 0.3634 semantic_segmentation_loss_cls: 0.0109 instance_segmentation_loss_cls: 0.0438 instance_segmentation_loss_reg: 0.3646 instance_segmentation_loss_poly: 0.9646 +2023/10/30 16:40:09 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231029_192652 +2023/10/30 16:40:09 - mmengine - INFO - Iter(train) [212000/640000] base_lr: 1.5106e-04 lr: 1.5551e-05 eta: 5 days, 14:05:23 time: 1.1447 data_time: 0.0388 memory: 21513 grad_norm: 2.7110 loss: 1.4380 caption_loss_cls: 2.4012 grounding_loss_reg: 3.0310 detection_loss_cls: 0.0418 detection_loss_reg: 0.3632 semantic_segmentation_loss_cls: 0.0109 instance_segmentation_loss_cls: 0.0437 instance_segmentation_loss_reg: 0.3632 instance_segmentation_loss_poly: 0.9615 +2023/10/30 16:40:09 - mmengine - INFO - Saving checkpoint at 212000 iterations +2023/10/30 16:49:46 - mmengine - INFO - Iter(train) [212500/640000] base_lr: 1.5085e-04 lr: 1.5532e-05 eta: 5 days, 13:57:24 time: 1.1351 data_time: 0.0378 memory: 21513 grad_norm: 2.7127 loss: 1.4266 caption_loss_cls: 2.3979 grounding_loss_reg: 3.0285 detection_loss_cls: 0.0416 detection_loss_reg: 0.3616 semantic_segmentation_loss_cls: 0.0109 instance_segmentation_loss_cls: 0.0436 instance_segmentation_loss_reg: 0.3631 instance_segmentation_loss_poly: 0.9610 +2023/10/30 16:58:54 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231029_192652 +2023/10/30 16:58:54 - mmengine - INFO - Iter(train) [213000/640000] base_lr: 1.5064e-04 lr: 1.5513e-05 eta: 5 days, 13:46:20 time: 1.1417 data_time: 0.0379 memory: 21513 grad_norm: 2.7126 loss: 1.4166 caption_loss_cls: 2.3991 grounding_loss_reg: 3.0251 detection_loss_cls: 0.0415 detection_loss_reg: 0.3607 semantic_segmentation_loss_cls: 0.0108 instance_segmentation_loss_cls: 0.0435 instance_segmentation_loss_reg: 0.3629 instance_segmentation_loss_poly: 0.9603 +2023/10/30 16:58:54 - mmengine - INFO - Saving checkpoint at 213000 iterations +2023/10/30 17:08:07 - mmengine - INFO - Iter(train) [213500/640000] base_lr: 1.5043e-04 lr: 1.5494e-05 eta: 5 days, 13:35:43 time: 1.1379 data_time: 0.0378 memory: 21513 grad_norm: 2.6993 loss: 1.4103 caption_loss_cls: 2.3973 grounding_loss_reg: 3.0248 detection_loss_cls: 0.0413 detection_loss_reg: 0.3603 semantic_segmentation_loss_cls: 0.0108 instance_segmentation_loss_cls: 0.0435 instance_segmentation_loss_reg: 0.3624 instance_segmentation_loss_poly: 0.9589 +2023/10/30 17:17:22 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231029_192652 +2023/10/30 17:17:22 - mmengine - INFO - Iter(train) [214000/640000] base_lr: 1.5022e-04 lr: 1.5475e-05 eta: 5 days, 13:25:21 time: 1.1416 data_time: 0.0378 memory: 21513 grad_norm: 2.6730 loss: 1.4004 caption_loss_cls: 2.3942 grounding_loss_reg: 3.0223 detection_loss_cls: 0.0413 detection_loss_reg: 0.3603 semantic_segmentation_loss_cls: 0.0108 instance_segmentation_loss_cls: 0.0433 instance_segmentation_loss_reg: 0.3615 instance_segmentation_loss_poly: 0.9569 +2023/10/30 17:17:22 - mmengine - INFO - Saving checkpoint at 214000 iterations +2023/10/30 17:26:30 - mmengine - INFO - Iter(train) [214500/640000] base_lr: 1.5001e-04 lr: 1.5455e-05 eta: 5 days, 13:14:15 time: 1.1368 data_time: 0.0375 memory: 21513 grad_norm: 2.6762 loss: 1.3973 caption_loss_cls: 2.3927 grounding_loss_reg: 3.0213 detection_loss_cls: 0.0412 detection_loss_reg: 0.3596 semantic_segmentation_loss_cls: 0.0108 instance_segmentation_loss_cls: 0.0432 instance_segmentation_loss_reg: 0.3607 instance_segmentation_loss_poly: 0.9550 +2023/10/30 17:36:00 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231029_192652 +2023/10/30 17:36:00 - mmengine - INFO - Iter(train) [215000/640000] base_lr: 1.4980e-04 lr: 1.5436e-05 eta: 5 days, 13:05:32 time: 1.1351 data_time: 0.0375 memory: 21513 grad_norm: 2.6843 loss: 1.3906 caption_loss_cls: 2.3916 grounding_loss_reg: 3.0192 detection_loss_cls: 0.0411 detection_loss_reg: 0.3595 semantic_segmentation_loss_cls: 0.0108 instance_segmentation_loss_cls: 0.0431 instance_segmentation_loss_reg: 0.3607 instance_segmentation_loss_poly: 0.9550 +2023/10/30 17:36:00 - mmengine - INFO - Saving checkpoint at 215000 iterations +2023/10/30 17:45:29 - mmengine - INFO - Iter(train) [215500/640000] base_lr: 1.4959e-04 lr: 1.5417e-05 eta: 5 days, 12:56:39 time: 1.1350 data_time: 0.0377 memory: 21513 grad_norm: 2.7187 loss: 1.4101 caption_loss_cls: 2.3909 grounding_loss_reg: 3.0155 detection_loss_cls: 0.0411 detection_loss_reg: 0.3589 semantic_segmentation_loss_cls: 0.0108 instance_segmentation_loss_cls: 0.0430 instance_segmentation_loss_reg: 0.3596 instance_segmentation_loss_poly: 0.9531 +2023/10/30 17:55:01 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231029_192652 +2023/10/30 17:55:01 - mmengine - INFO - Iter(train) [216000/640000] base_lr: 1.4937e-04 lr: 1.5398e-05 eta: 5 days, 12:48:06 time: 1.1227 data_time: 0.0346 memory: 21513 grad_norm: 2.6931 loss: 1.4011 caption_loss_cls: 2.3902 grounding_loss_reg: 3.0134 detection_loss_cls: 0.0410 detection_loss_reg: 0.3584 semantic_segmentation_loss_cls: 0.0108 instance_segmentation_loss_cls: 0.0430 instance_segmentation_loss_reg: 0.3589 instance_segmentation_loss_poly: 0.9513 +2023/10/30 17:55:01 - mmengine - INFO - Saving checkpoint at 216000 iterations +2023/10/30 18:05:12 - mmengine - INFO - Iter(train) [216500/640000] base_lr: 1.4916e-04 lr: 1.5378e-05 eta: 5 days, 12:43:27 time: 1.1311 data_time: 0.0348 memory: 21513 grad_norm: 2.6994 loss: 1.4115 caption_loss_cls: 2.3902 grounding_loss_reg: 3.0144 detection_loss_cls: 0.0408 detection_loss_reg: 0.3574 semantic_segmentation_loss_cls: 0.0108 instance_segmentation_loss_cls: 0.0431 instance_segmentation_loss_reg: 0.3600 instance_segmentation_loss_poly: 0.9539 +2023/10/30 18:14:47 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231029_192652 +2023/10/30 18:14:47 - mmengine - INFO - Iter(train) [217000/640000] base_lr: 1.4895e-04 lr: 1.5359e-05 eta: 5 days, 12:35:07 time: 1.1377 data_time: 0.0352 memory: 21513 grad_norm: 2.6982 loss: 1.4269 caption_loss_cls: 2.3931 grounding_loss_reg: 3.0140 detection_loss_cls: 0.0408 detection_loss_reg: 0.3566 semantic_segmentation_loss_cls: 0.0108 instance_segmentation_loss_cls: 0.0433 instance_segmentation_loss_reg: 0.3614 instance_segmentation_loss_poly: 0.9559 +2023/10/30 18:14:47 - mmengine - INFO - Saving checkpoint at 217000 iterations +2023/10/30 18:23:51 - mmengine - INFO - Iter(train) [217500/640000] base_lr: 1.4874e-04 lr: 1.5340e-05 eta: 5 days, 12:23:42 time: 1.1355 data_time: 0.0352 memory: 21513 grad_norm: 2.7324 loss: 1.4320 caption_loss_cls: 2.3932 grounding_loss_reg: 3.0157 detection_loss_cls: 0.0410 detection_loss_reg: 0.3571 semantic_segmentation_loss_cls: 0.0108 instance_segmentation_loss_cls: 0.0433 instance_segmentation_loss_reg: 0.3614 instance_segmentation_loss_poly: 0.9561 +2023/10/30 18:33:19 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231029_192652 +2023/10/30 18:33:19 - mmengine - INFO - Iter(train) [218000/640000] base_lr: 1.4852e-04 lr: 1.5320e-05 eta: 5 days, 12:14:39 time: 1.1388 data_time: 0.0353 memory: 21513 grad_norm: 2.7494 loss: 1.4368 caption_loss_cls: 2.3936 grounding_loss_reg: 3.0170 detection_loss_cls: 0.0411 detection_loss_reg: 0.3580 semantic_segmentation_loss_cls: 0.0108 instance_segmentation_loss_cls: 0.0432 instance_segmentation_loss_reg: 0.3600 instance_segmentation_loss_poly: 0.9521 +2023/10/30 18:33:19 - mmengine - INFO - Saving checkpoint at 218000 iterations +2023/10/30 18:42:36 - mmengine - INFO - Iter(train) [218500/640000] base_lr: 1.4831e-04 lr: 1.5301e-05 eta: 5 days, 12:04:34 time: 1.1412 data_time: 0.0353 memory: 21513 grad_norm: 2.7330 loss: 1.4331 caption_loss_cls: 2.3943 grounding_loss_reg: 3.0146 detection_loss_cls: 0.0412 detection_loss_reg: 0.3583 semantic_segmentation_loss_cls: 0.0108 instance_segmentation_loss_cls: 0.0432 instance_segmentation_loss_reg: 0.3604 instance_segmentation_loss_poly: 0.9528 +2023/10/30 18:51:37 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231029_192652 +2023/10/30 18:51:37 - mmengine - INFO - Iter(train) [219000/640000] base_lr: 1.4810e-04 lr: 1.5282e-05 eta: 5 days, 11:52:51 time: 1.1337 data_time: 0.0350 memory: 21513 grad_norm: 2.7326 loss: 1.4332 caption_loss_cls: 2.3930 grounding_loss_reg: 3.0135 detection_loss_cls: 0.0411 detection_loss_reg: 0.3576 semantic_segmentation_loss_cls: 0.0108 instance_segmentation_loss_cls: 0.0432 instance_segmentation_loss_reg: 0.3599 instance_segmentation_loss_poly: 0.9515 +2023/10/30 18:51:37 - mmengine - INFO - Saving checkpoint at 219000 iterations +2023/10/30 19:01:06 - mmengine - INFO - Iter(train) [219500/640000] base_lr: 1.4788e-04 lr: 1.5262e-05 eta: 5 days, 11:43:58 time: 1.1338 data_time: 0.0352 memory: 21513 grad_norm: 2.7238 loss: 1.4315 caption_loss_cls: 2.3917 grounding_loss_reg: 3.0139 detection_loss_cls: 0.0412 detection_loss_reg: 0.3575 semantic_segmentation_loss_cls: 0.0108 instance_segmentation_loss_cls: 0.0432 instance_segmentation_loss_reg: 0.3596 instance_segmentation_loss_poly: 0.9506 +2023/10/30 19:10:35 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231029_192652 +2023/10/30 19:10:35 - mmengine - INFO - Iter(train) [220000/640000] base_lr: 1.4767e-04 lr: 1.5243e-05 eta: 5 days, 11:34:59 time: 1.1329 data_time: 0.0351 memory: 21513 grad_norm: 2.7374 loss: 1.4345 caption_loss_cls: 2.3935 grounding_loss_reg: 3.0112 detection_loss_cls: 0.0411 detection_loss_reg: 0.3568 semantic_segmentation_loss_cls: 0.0108 instance_segmentation_loss_cls: 0.0430 instance_segmentation_loss_reg: 0.3593 instance_segmentation_loss_poly: 0.9501 +2023/10/30 19:10:35 - mmengine - INFO - Saving checkpoint at 220000 iterations +2023/10/30 19:19:14 - mmengine - INFO - Evaluating bbox... +2023/10/30 19:20:09 - mmengine - INFO - bbox_mAP_copypaste: 0.403 0.575 0.438 0.235 0.459 0.528 +2023/10/30 19:20:09 - mmengine - INFO - Evaluating segm... +2023/10/30 19:21:20 - mmengine - INFO - segm_mAP_copypaste: 0.250 0.476 0.236 0.111 0.289 0.406 +2023/10/30 19:25:56 - mmengine - INFO - per class results: +2023/10/30 19:25:56 - mmengine - INFO - ++---------------------+-------+-------+ +| Class | IoU | Acc | ++---------------------+-------+-------+ +| wall | 75.24 | 85.91 | +| building | 80.31 | 86.31 | +| sky | 92.71 | 97.36 | +| floor | 79.21 | 87.54 | +| tree | 71.95 | 88.77 | +| ceiling | 79.52 | 93.84 | +| road | 80.7 | 90.87 | +| bed | 85.94 | 91.86 | +| windowpane | 57.0 | 75.89 | +| grass | 67.14 | 81.03 | +| cabinet | 56.66 | 71.05 | +| sidewalk | 63.23 | 75.6 | +| person | 78.04 | 91.94 | +| earth | 38.85 | 54.71 | +| door | 47.67 | 61.55 | +| table | 54.47 | 69.75 | +| mountain | 54.43 | 67.24 | +| plant | 49.03 | 60.12 | +| curtain | 69.89 | 79.73 | +| chair | 52.1 | 64.96 | +| car | 79.54 | 91.84 | +| water | 46.19 | 61.67 | +| painting | 67.66 | 85.76 | +| sofa | 63.28 | 80.23 | +| shelf | 39.63 | 67.3 | +| house | 44.4 | 73.21 | +| sea | 49.4 | 77.89 | +| mirror | 59.2 | 67.78 | +| rug | 60.29 | 68.22 | +| field | 36.11 | 51.46 | +| armchair | 39.72 | 62.29 | +| seat | 61.71 | 75.55 | +| fence | 40.31 | 63.19 | +| desk | 41.68 | 61.57 | +| rock | 29.98 | 33.44 | +| wardrobe | 49.14 | 72.04 | +| lamp | 55.94 | 70.55 | +| bathtub | 65.51 | 81.14 | +| railing | 32.73 | 58.1 | +| cushion | 51.47 | 67.33 | +| base | 23.13 | 35.98 | +| box | 24.01 | 36.09 | +| column | 46.26 | 59.62 | +| signboard | 36.07 | 53.18 | +| chest of drawers | 35.69 | 45.2 | +| counter | 23.17 | 37.15 | +| sand | 39.84 | 48.96 | +| sink | 65.81 | 76.03 | +| skyscraper | 63.57 | 87.8 | +| fireplace | 67.22 | 85.19 | +| refrigerator | 66.16 | 83.09 | +| grandstand | 28.6 | 75.92 | +| path | 16.93 | 21.09 | +| stairs | 28.11 | 38.12 | +| runway | 67.31 | 84.11 | +| case | 37.09 | 48.43 | +| pool table | 87.66 | 97.27 | +| pillow | 46.71 | 61.65 | +| screen door | 63.87 | 72.07 | +| stairway | 30.41 | 41.11 | +| river | 13.45 | 17.19 | +| bridge | 51.88 | 89.23 | +| bookcase | 33.63 | 55.59 | +| blind | 33.49 | 40.8 | +| coffee table | 46.35 | 88.37 | +| toilet | 80.92 | 86.17 | +| flower | 31.56 | 52.47 | +| book | 43.75 | 66.12 | +| hill | 9.91 | 25.36 | +| bench | 46.42 | 61.67 | +| countertop | 50.98 | 61.81 | +| stove | 68.13 | 83.39 | +| palm | 41.81 | 56.89 | +| kitchen island | 35.14 | 72.55 | +| computer | 70.86 | 81.53 | +| swivel chair | 42.59 | 60.02 | +| boat | 51.84 | 80.6 | +| bar | 39.96 | 56.09 | +| arcade machine | 27.42 | 28.05 | +| hovel | 7.27 | 8.55 | +| bus | 78.88 | 94.6 | +| towel | 58.7 | 69.43 | +| light | 31.79 | 34.04 | +| truck | 39.24 | 50.09 | +| tower | 28.63 | 50.97 | +| chandelier | 58.74 | 69.08 | +| awning | 21.04 | 24.38 | +| streetlight | 24.23 | 40.95 | +| booth | 40.21 | 41.47 | +| television receiver | 66.13 | 80.19 | +| airplane | 56.61 | 62.75 | +| dirt track | 0.0 | 0.0 | +| apparel | 31.71 | 36.24 | +| pole | 20.52 | 27.67 | +| land | 3.52 | 5.57 | +| bannister | 12.85 | 16.52 | +| escalator | 5.03 | 5.24 | +| ottoman | 48.09 | 64.65 | +| bottle | 19.5 | 23.69 | +| buffet | 33.02 | 38.42 | +| poster | 26.45 | 35.06 | +| stage | 11.91 | 27.05 | +| van | 20.29 | 24.83 | +| ship | 55.18 | 91.39 | +| fountain | 3.84 | 3.85 | +| conveyer belt | 29.71 | 96.61 | +| canopy | 11.02 | 17.33 | +| washer | 61.0 | 62.46 | +| plaything | 19.18 | 26.64 | +| swimming pool | 50.86 | 72.26 | +| stool | 38.57 | 53.16 | +| barrel | 14.84 | 75.75 | +| basket | 24.14 | 48.64 | +| waterfall | 58.23 | 75.13 | +| tent | 86.34 | 97.24 | +| bag | 10.73 | 11.75 | +| minibike | 69.83 | 87.91 | +| cradle | 62.25 | 80.48 | +| oven | 24.94 | 28.86 | +| ball | 30.7 | 35.77 | +| food | 42.36 | 46.87 | +| step | 14.54 | 15.77 | +| tank | 41.33 | 46.98 | +| trade name | 23.97 | 34.71 | +| microwave | 67.64 | 86.5 | +| pot | 38.49 | 47.16 | +| animal | 51.01 | 52.64 | +| bicycle | 55.15 | 73.11 | +| lake | 44.71 | 68.19 | +| dishwasher | 51.99 | 72.33 | +| screen | 56.41 | 68.67 | +| blanket | 19.48 | 29.77 | +| sculpture | 33.19 | 55.39 | +| hood | 53.21 | 68.51 | +| sconce | 28.83 | 32.61 | +| vase | 33.05 | 41.19 | +| traffic light | 31.4 | 38.23 | +| tray | 4.45 | 9.68 | +| ashcan | 33.39 | 44.14 | +| fan | 47.6 | 57.55 | +| pier | 51.75 | 61.77 | +| crt screen | 7.56 | 22.68 | +| plate | 48.57 | 73.89 | +| monitor | 9.3 | 9.96 | +| bulletin board | 34.26 | 49.33 | +| shower | 0.22 | 0.26 | +| radiator | 49.02 | 53.88 | +| glass | 10.97 | 11.45 | +| clock | 21.84 | 28.9 | +| flag | 31.78 | 36.53 | ++---------------------+-------+-------+ +2023/10/30 19:26:20 - mmengine - INFO - Iter(val) [209/209] coco/bbox_mAP: 0.4030 coco/bbox_mAP_50: 0.5750 coco/bbox_mAP_75: 0.4380 coco/bbox_mAP_s: 0.2350 coco/bbox_mAP_m: 0.4590 coco/bbox_mAP_l: 0.5280 coco/segm_mAP: 0.2500 coco/segm_mAP_50: 0.4760 coco/segm_mAP_75: 0.2360 coco/segm_mAP_s: 0.1110 coco/segm_mAP_m: 0.2890 coco/segm_mAP_l: 0.4060 Bleu_1: 0.7049 Bleu_2: 0.5340 Bleu_3: 0.3947 Bleu_4: 0.2912 METEOR: 0.2471 ROUGE_L: 0.5236 CIDEr: 0.9193 SPICE: 0.1748 aAcc: 80.7600 mIoU: 43.3300 mAcc: 56.8900 visual-grounding/miou: 0.7389 visual-grounding/acc: 0.8206 data_time: 0.0368 time: 0.5588 +2023/11/01 21:01:23 - mmengine - INFO - Iter(train) [220500/640000] base_lr: 1.4745e-04 lr: 1.5223e-05 eta: 5 days, 8:24:29 time: 1.1180 data_time: 0.0313 memory: 21520 grad_norm: 2.7408 loss: 1.4253 caption_loss_cls: 2.3882 grounding_loss_reg: 3.0093 detection_loss_cls: 0.0411 detection_loss_reg: 0.3558 semantic_segmentation_loss_cls: 0.0108 instance_segmentation_loss_cls: 0.0430 instance_segmentation_loss_reg: 0.3580 instance_segmentation_loss_poly: 0.9474 +2023/11/01 21:10:48 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231101_204912 +2023/11/01 21:10:48 - mmengine - INFO - Iter(train) [221000/640000] base_lr: 1.4724e-04 lr: 1.5204e-05 eta: 5 days, 9:50:50 time: 1.1155 data_time: 0.0335 memory: 21518 grad_norm: 2.7679 loss: 1.4117 caption_loss_cls: 2.3843 grounding_loss_reg: 3.0102 detection_loss_cls: 0.0408 detection_loss_reg: 0.3541 semantic_segmentation_loss_cls: 0.0108 instance_segmentation_loss_cls: 0.0430 instance_segmentation_loss_reg: 0.3584 instance_segmentation_loss_poly: 0.9476 +2023/11/01 21:10:48 - mmengine - INFO - Saving checkpoint at 221000 iterations +2023/11/01 21:20:08 - mmengine - INFO - Iter(train) [221500/640000] base_lr: 1.4702e-04 lr: 1.5184e-05 eta: 5 days, 9:49:44 time: 1.1194 data_time: 0.0333 memory: 21518 grad_norm: 2.7510 loss: 1.3937 caption_loss_cls: 2.3843 grounding_loss_reg: 3.0069 detection_loss_cls: 0.0408 detection_loss_reg: 0.3537 semantic_segmentation_loss_cls: 0.0107 instance_segmentation_loss_cls: 0.0428 instance_segmentation_loss_reg: 0.3578 instance_segmentation_loss_poly: 0.9470 +2023/11/01 21:28:43 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231101_204912 +2023/11/01 21:28:43 - mmengine - INFO - Iter(train) [222000/640000] base_lr: 1.4681e-04 lr: 1.5164e-05 eta: 5 days, 7:08:59 time: 1.1063 data_time: 0.0330 memory: 21518 grad_norm: 2.7630 loss: 1.3911 caption_loss_cls: 2.3815 grounding_loss_reg: 3.0056 detection_loss_cls: 0.0408 detection_loss_reg: 0.3533 semantic_segmentation_loss_cls: 0.0107 instance_segmentation_loss_cls: 0.0425 instance_segmentation_loss_reg: 0.3567 instance_segmentation_loss_poly: 0.9452 +2023/11/01 21:28:43 - mmengine - INFO - Saving checkpoint at 222000 iterations +2023/11/01 21:37:58 - mmengine - INFO - Iter(train) [222500/640000] base_lr: 1.4659e-04 lr: 1.5145e-05 eta: 5 days, 7:20:11 time: 1.1057 data_time: 0.0329 memory: 21518 grad_norm: 2.7325 loss: 1.3793 caption_loss_cls: 2.3774 grounding_loss_reg: 3.0050 detection_loss_cls: 0.0408 detection_loss_reg: 0.3537 semantic_segmentation_loss_cls: 0.0107 instance_segmentation_loss_cls: 0.0424 instance_segmentation_loss_reg: 0.3562 instance_segmentation_loss_poly: 0.9449 +2023/11/01 21:47:09 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231101_204912 +2023/11/01 21:47:09 - mmengine - INFO - Iter(train) [223000/640000] base_lr: 1.4638e-04 lr: 1.5125e-05 eta: 5 days, 7:14:11 time: 1.1082 data_time: 0.0329 memory: 21518 grad_norm: 2.7402 loss: 1.3728 caption_loss_cls: 2.3730 grounding_loss_reg: 2.9990 detection_loss_cls: 0.0407 detection_loss_reg: 0.3526 semantic_segmentation_loss_cls: 0.0107 instance_segmentation_loss_cls: 0.0423 instance_segmentation_loss_reg: 0.3562 instance_segmentation_loss_poly: 0.9451 +2023/11/01 21:47:09 - mmengine - INFO - Saving checkpoint at 223000 iterations +2023/11/01 21:56:37 - mmengine - INFO - Iter(train) [223500/640000] base_lr: 1.4616e-04 lr: 1.5106e-05 eta: 5 days, 7:42:37 time: 1.1079 data_time: 0.0327 memory: 21518 grad_norm: 2.7109 loss: 1.3548 caption_loss_cls: 2.3684 grounding_loss_reg: 2.9999 detection_loss_cls: 0.0408 detection_loss_reg: 0.3533 semantic_segmentation_loss_cls: 0.0107 instance_segmentation_loss_cls: 0.0422 instance_segmentation_loss_reg: 0.3563 instance_segmentation_loss_poly: 0.9458 +2023/11/01 22:05:44 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231101_204912 +2023/11/01 22:05:44 - mmengine - INFO - Iter(train) [224000/640000] base_lr: 1.4595e-04 lr: 1.5086e-05 eta: 5 days, 7:24:12 time: 1.1025 data_time: 0.0327 memory: 21518 grad_norm: 2.7404 loss: 1.3617 caption_loss_cls: 2.3649 grounding_loss_reg: 2.9979 detection_loss_cls: 0.0409 detection_loss_reg: 0.3546 semantic_segmentation_loss_cls: 0.0107 instance_segmentation_loss_cls: 0.0421 instance_segmentation_loss_reg: 0.3569 instance_segmentation_loss_poly: 0.9473 +2023/11/01 22:05:44 - mmengine - INFO - Saving checkpoint at 224000 iterations +2023/11/01 22:15:07 - mmengine - INFO - Iter(train) [224500/640000] base_lr: 1.4573e-04 lr: 1.5066e-05 eta: 5 days, 7:32:41 time: 1.1055 data_time: 0.0363 memory: 21518 grad_norm: 2.7524 loss: 1.3669 caption_loss_cls: 2.3612 grounding_loss_reg: 2.9969 detection_loss_cls: 0.0408 detection_loss_reg: 0.3541 semantic_segmentation_loss_cls: 0.0107 instance_segmentation_loss_cls: 0.0420 instance_segmentation_loss_reg: 0.3573 instance_segmentation_loss_poly: 0.9480 +2023/11/01 22:22:56 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231101_204912 +2023/11/01 22:22:56 - mmengine - INFO - Iter(train) [225000/640000] base_lr: 1.4551e-04 lr: 1.5047e-05 eta: 5 days, 5:27:48 time: 1.0815 data_time: 0.0334 memory: 21518 grad_norm: 2.7989 loss: 1.3937 caption_loss_cls: 2.3582 grounding_loss_reg: 2.9972 detection_loss_cls: 0.0409 detection_loss_reg: 0.3554 semantic_segmentation_loss_cls: 0.0107 instance_segmentation_loss_cls: 0.0420 instance_segmentation_loss_reg: 0.3577 instance_segmentation_loss_poly: 0.9482 +2023/11/01 22:22:56 - mmengine - INFO - Saving checkpoint at 225000 iterations +2023/11/01 22:32:18 - mmengine - INFO - Iter(train) [225500/640000] base_lr: 1.4529e-04 lr: 1.5027e-05 eta: 5 days, 5:40:26 time: 1.0820 data_time: 0.0335 memory: 21518 grad_norm: 2.8090 loss: 1.4040 caption_loss_cls: 2.3563 grounding_loss_reg: 2.9924 detection_loss_cls: 0.0409 detection_loss_reg: 0.3555 semantic_segmentation_loss_cls: 0.0106 instance_segmentation_loss_cls: 0.0421 instance_segmentation_loss_reg: 0.3585 instance_segmentation_loss_poly: 0.9501 +2023/11/01 22:41:53 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231101_204912 +2023/11/01 22:41:53 - mmengine - INFO - Iter(train) [226000/640000] base_lr: 1.4508e-04 lr: 1.5007e-05 eta: 5 days, 6:05:08 time: 1.0971 data_time: 0.0361 memory: 21518 grad_norm: 2.7682 loss: 1.3799 caption_loss_cls: 2.3544 grounding_loss_reg: 2.9915 detection_loss_cls: 0.0408 detection_loss_reg: 0.3548 semantic_segmentation_loss_cls: 0.0106 instance_segmentation_loss_cls: 0.0421 instance_segmentation_loss_reg: 0.3576 instance_segmentation_loss_poly: 0.9483 +2023/11/01 22:41:53 - mmengine - INFO - Saving checkpoint at 226000 iterations +2023/11/01 22:51:20 - mmengine - INFO - Iter(train) [226500/640000] base_lr: 1.4486e-04 lr: 1.4987e-05 eta: 5 days, 6:15:33 time: 1.1000 data_time: 0.0362 memory: 21518 grad_norm: 2.8156 loss: 1.3951 caption_loss_cls: 2.3499 grounding_loss_reg: 2.9906 detection_loss_cls: 0.0408 detection_loss_reg: 0.3554 semantic_segmentation_loss_cls: 0.0106 instance_segmentation_loss_cls: 0.0420 instance_segmentation_loss_reg: 0.3580 instance_segmentation_loss_poly: 0.9489 +2023/11/01 23:00:15 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231101_204912 +2023/11/01 23:00:15 - mmengine - INFO - Iter(train) [227000/640000] base_lr: 1.4464e-04 lr: 1.4967e-05 eta: 5 days, 5:51:20 time: 1.0960 data_time: 0.0361 memory: 21518 grad_norm: 2.8139 loss: 1.4023 caption_loss_cls: 2.3471 grounding_loss_reg: 2.9881 detection_loss_cls: 0.0408 detection_loss_reg: 0.3546 semantic_segmentation_loss_cls: 0.0106 instance_segmentation_loss_cls: 0.0419 instance_segmentation_loss_reg: 0.3575 instance_segmentation_loss_poly: 0.9491 +2023/11/01 23:00:15 - mmengine - INFO - Saving checkpoint at 227000 iterations +2023/11/01 23:08:33 - mmengine - INFO - Iter(train) [227500/640000] base_lr: 1.4442e-04 lr: 1.4948e-05 eta: 5 days, 4:56:08 time: 1.0785 data_time: 0.0357 memory: 21518 grad_norm: 2.8878 loss: 1.4145 caption_loss_cls: 2.3407 grounding_loss_reg: 2.9898 detection_loss_cls: 0.0408 detection_loss_reg: 0.3542 semantic_segmentation_loss_cls: 0.0106 instance_segmentation_loss_cls: 0.0417 instance_segmentation_loss_reg: 0.3554 instance_segmentation_loss_poly: 0.9457 +2023/11/01 23:17:02 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231101_204912 +2023/11/01 23:17:02 - mmengine - INFO - Iter(train) [228000/640000] base_lr: 1.4420e-04 lr: 1.4928e-05 eta: 5 days, 4:15:38 time: 1.0690 data_time: 0.0353 memory: 21518 grad_norm: 2.9161 loss: 1.4224 caption_loss_cls: 2.3364 grounding_loss_reg: 2.9877 detection_loss_cls: 0.0408 detection_loss_reg: 0.3549 semantic_segmentation_loss_cls: 0.0106 instance_segmentation_loss_cls: 0.0414 instance_segmentation_loss_reg: 0.3539 instance_segmentation_loss_poly: 0.9430 +2023/11/01 23:17:02 - mmengine - INFO - Saving checkpoint at 228000 iterations +2023/11/01 23:25:40 - mmengine - INFO - Iter(train) [228500/640000] base_lr: 1.4399e-04 lr: 1.4908e-05 eta: 5 days, 3:46:17 time: 1.0578 data_time: 0.0350 memory: 21518 grad_norm: 2.9404 loss: 1.4376 caption_loss_cls: 2.3381 grounding_loss_reg: 2.9849 detection_loss_cls: 0.0406 detection_loss_reg: 0.3537 semantic_segmentation_loss_cls: 0.0106 instance_segmentation_loss_cls: 0.0412 instance_segmentation_loss_reg: 0.3538 instance_segmentation_loss_poly: 0.9435 +2023/11/01 23:34:38 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231101_204912 +2023/11/01 23:34:38 - mmengine - INFO - Iter(train) [229000/640000] base_lr: 1.4377e-04 lr: 1.4888e-05 eta: 5 days, 3:34:57 time: 1.0751 data_time: 0.0355 memory: 21518 grad_norm: 2.8905 loss: 1.4224 caption_loss_cls: 2.3360 grounding_loss_reg: 2.9851 detection_loss_cls: 0.0405 detection_loss_reg: 0.3520 semantic_segmentation_loss_cls: 0.0105 instance_segmentation_loss_cls: 0.0410 instance_segmentation_loss_reg: 0.3531 instance_segmentation_loss_poly: 0.9422 +2023/11/01 23:34:38 - mmengine - INFO - Saving checkpoint at 229000 iterations +2023/11/01 23:43:36 - mmengine - INFO - Iter(train) [229500/640000] base_lr: 1.4355e-04 lr: 1.4868e-05 eta: 5 days, 3:23:07 time: 1.0691 data_time: 0.0353 memory: 21518 grad_norm: 2.8964 loss: 1.4175 caption_loss_cls: 2.3315 grounding_loss_reg: 2.9829 detection_loss_cls: 0.0403 detection_loss_reg: 0.3509 semantic_segmentation_loss_cls: 0.0105 instance_segmentation_loss_cls: 0.0409 instance_segmentation_loss_reg: 0.3521 instance_segmentation_loss_poly: 0.9404 +2023/11/01 23:52:20 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231101_204912 +2023/11/01 23:52:20 - mmengine - INFO - Iter(train) [230000/640000] base_lr: 1.4333e-04 lr: 1.4848e-05 eta: 5 days, 3:02:32 time: 1.0563 data_time: 0.0329 memory: 21518 grad_norm: 2.9693 loss: 1.4486 caption_loss_cls: 2.3304 grounding_loss_reg: 2.9808 detection_loss_cls: 0.0404 detection_loss_reg: 0.3512 semantic_segmentation_loss_cls: 0.0105 instance_segmentation_loss_cls: 0.0407 instance_segmentation_loss_reg: 0.3512 instance_segmentation_loss_poly: 0.9381 +2023/11/01 23:52:20 - mmengine - INFO - Saving checkpoint at 230000 iterations +2023/11/02 00:01:39 - mmengine - INFO - Iter(train) [230500/640000] base_lr: 1.4311e-04 lr: 1.4828e-05 eta: 5 days, 3:05:31 time: 1.0543 data_time: 0.0328 memory: 21518 grad_norm: 2.9822 loss: 1.4508 caption_loss_cls: 2.3310 grounding_loss_reg: 2.9783 detection_loss_cls: 0.0403 detection_loss_reg: 0.3511 semantic_segmentation_loss_cls: 0.0105 instance_segmentation_loss_cls: 0.0406 instance_segmentation_loss_reg: 0.3515 instance_segmentation_loss_poly: 0.9385 +2023/11/02 00:10:09 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231101_204912 +2023/11/02 00:10:09 - mmengine - INFO - Iter(train) [231000/640000] base_lr: 1.4289e-04 lr: 1.4808e-05 eta: 5 days, 2:37:11 time: 1.0482 data_time: 0.0327 memory: 21518 grad_norm: 3.0071 loss: 1.4587 caption_loss_cls: 2.3313 grounding_loss_reg: 2.9765 detection_loss_cls: 0.0402 detection_loss_reg: 0.3503 semantic_segmentation_loss_cls: 0.0105 instance_segmentation_loss_cls: 0.0405 instance_segmentation_loss_reg: 0.3506 instance_segmentation_loss_poly: 0.9366 +2023/11/02 00:10:09 - mmengine - INFO - Saving checkpoint at 231000 iterations +2023/11/02 00:19:08 - mmengine - INFO - Iter(train) [231500/640000] base_lr: 1.4267e-04 lr: 1.4788e-05 eta: 5 days, 2:27:20 time: 1.0582 data_time: 0.0331 memory: 21518 grad_norm: 2.9948 loss: 1.4684 caption_loss_cls: 2.3268 grounding_loss_reg: 2.9749 detection_loss_cls: 0.0402 detection_loss_reg: 0.3513 semantic_segmentation_loss_cls: 0.0105 instance_segmentation_loss_cls: 0.0405 instance_segmentation_loss_reg: 0.3519 instance_segmentation_loss_poly: 0.9397 +2023/11/02 00:28:04 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231101_204912 +2023/11/02 00:28:04 - mmengine - INFO - Iter(train) [232000/640000] base_lr: 1.4245e-04 lr: 1.4768e-05 eta: 5 days, 2:16:13 time: 1.0650 data_time: 0.0333 memory: 21518 grad_norm: 2.9475 loss: 1.4532 caption_loss_cls: 2.3278 grounding_loss_reg: 2.9752 detection_loss_cls: 0.0402 detection_loss_reg: 0.3513 semantic_segmentation_loss_cls: 0.0105 instance_segmentation_loss_cls: 0.0407 instance_segmentation_loss_reg: 0.3531 instance_segmentation_loss_poly: 0.9426 +2023/11/02 00:28:04 - mmengine - INFO - Saving checkpoint at 232000 iterations +2023/11/02 00:37:34 - mmengine - INFO - Iter(train) [232500/640000] base_lr: 1.4223e-04 lr: 1.4748e-05 eta: 5 days, 2:23:42 time: 1.0780 data_time: 0.0335 memory: 21518 grad_norm: 2.9238 loss: 1.4346 caption_loss_cls: 2.3279 grounding_loss_reg: 2.9770 detection_loss_cls: 0.0401 detection_loss_reg: 0.3516 semantic_segmentation_loss_cls: 0.0105 instance_segmentation_loss_cls: 0.0405 instance_segmentation_loss_reg: 0.3529 instance_segmentation_loss_poly: 0.9420 +2023/11/02 00:46:37 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231101_204912 +2023/11/02 00:46:37 - mmengine - INFO - Iter(train) [233000/640000] base_lr: 1.4201e-04 lr: 1.4728e-05 eta: 5 days, 2:15:51 time: 1.0791 data_time: 0.0334 memory: 21518 grad_norm: 2.9268 loss: 1.4239 caption_loss_cls: 2.3250 grounding_loss_reg: 2.9714 detection_loss_cls: 0.0400 detection_loss_reg: 0.3510 semantic_segmentation_loss_cls: 0.0105 instance_segmentation_loss_cls: 0.0404 instance_segmentation_loss_reg: 0.3526 instance_segmentation_loss_poly: 0.9415 +2023/11/02 00:46:37 - mmengine - INFO - Saving checkpoint at 233000 iterations +2023/11/02 00:56:04 - mmengine - INFO - Iter(train) [233500/640000] base_lr: 1.4178e-04 lr: 1.4708e-05 eta: 5 days, 2:20:17 time: 1.0867 data_time: 0.0339 memory: 21518 grad_norm: 2.9066 loss: 1.4305 caption_loss_cls: 2.3235 grounding_loss_reg: 2.9700 detection_loss_cls: 0.0400 detection_loss_reg: 0.3517 semantic_segmentation_loss_cls: 0.0105 instance_segmentation_loss_cls: 0.0404 instance_segmentation_loss_reg: 0.3527 instance_segmentation_loss_poly: 0.9407 +2023/11/02 01:04:56 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231101_204912 +2023/11/02 01:04:56 - mmengine - INFO - Iter(train) [234000/640000] base_lr: 1.4156e-04 lr: 1.4688e-05 eta: 5 days, 2:06:31 time: 1.0887 data_time: 0.0338 memory: 21518 grad_norm: 2.8710 loss: 1.4165 caption_loss_cls: 2.3240 grounding_loss_reg: 2.9688 detection_loss_cls: 0.0398 detection_loss_reg: 0.3509 semantic_segmentation_loss_cls: 0.0105 instance_segmentation_loss_cls: 0.0404 instance_segmentation_loss_reg: 0.3527 instance_segmentation_loss_poly: 0.9402 +2023/11/02 01:04:57 - mmengine - INFO - Saving checkpoint at 234000 iterations +2023/11/02 01:14:15 - mmengine - INFO - Iter(train) [234500/640000] base_lr: 1.4134e-04 lr: 1.4667e-05 eta: 5 days, 2:05:37 time: 1.0887 data_time: 0.0338 memory: 21518 grad_norm: 2.8280 loss: 1.4006 caption_loss_cls: 2.3227 grounding_loss_reg: 2.9660 detection_loss_cls: 0.0398 detection_loss_reg: 0.3516 semantic_segmentation_loss_cls: 0.0105 instance_segmentation_loss_cls: 0.0405 instance_segmentation_loss_reg: 0.3541 instance_segmentation_loss_poly: 0.9429 +2023/11/02 01:23:01 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231101_204912 +2023/11/02 01:23:01 - mmengine - INFO - Iter(train) [235000/640000] base_lr: 1.4112e-04 lr: 1.4647e-05 eta: 5 days, 1:49:09 time: 1.0926 data_time: 0.0339 memory: 21518 grad_norm: 2.8173 loss: 1.3986 caption_loss_cls: 2.3171 grounding_loss_reg: 2.9635 detection_loss_cls: 0.0398 detection_loss_reg: 0.3517 semantic_segmentation_loss_cls: 0.0105 instance_segmentation_loss_cls: 0.0404 instance_segmentation_loss_reg: 0.3532 instance_segmentation_loss_poly: 0.9416 +2023/11/02 01:23:01 - mmengine - INFO - Saving checkpoint at 235000 iterations +2023/11/02 01:32:10 - mmengine - INFO - Iter(train) [235500/640000] base_lr: 1.4090e-04 lr: 1.4627e-05 eta: 5 days, 1:43:22 time: 1.0952 data_time: 0.0339 memory: 21518 grad_norm: 2.8274 loss: 1.3974 caption_loss_cls: 2.3165 grounding_loss_reg: 2.9616 detection_loss_cls: 0.0397 detection_loss_reg: 0.3509 semantic_segmentation_loss_cls: 0.0105 instance_segmentation_loss_cls: 0.0403 instance_segmentation_loss_reg: 0.3536 instance_segmentation_loss_poly: 0.9420 +2023/11/02 01:41:18 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231101_204912 +2023/11/02 01:41:18 - mmengine - INFO - Iter(train) [236000/640000] base_lr: 1.4067e-04 lr: 1.4607e-05 eta: 5 days, 1:36:54 time: 1.0982 data_time: 0.0339 memory: 21518 grad_norm: 2.8475 loss: 1.3969 caption_loss_cls: 2.3174 grounding_loss_reg: 2.9590 detection_loss_cls: 0.0396 detection_loss_reg: 0.3506 semantic_segmentation_loss_cls: 0.0105 instance_segmentation_loss_cls: 0.0402 instance_segmentation_loss_reg: 0.3533 instance_segmentation_loss_poly: 0.9415 +2023/11/02 01:41:18 - mmengine - INFO - Saving checkpoint at 236000 iterations +2023/11/02 01:50:04 - mmengine - INFO - Iter(train) [236500/640000] base_lr: 1.4045e-04 lr: 1.4587e-05 eta: 5 days, 1:21:11 time: 1.0872 data_time: 0.0336 memory: 21518 grad_norm: 2.8783 loss: 1.4046 caption_loss_cls: 2.3139 grounding_loss_reg: 2.9558 detection_loss_cls: 0.0396 detection_loss_reg: 0.3504 semantic_segmentation_loss_cls: 0.0105 instance_segmentation_loss_cls: 0.0402 instance_segmentation_loss_reg: 0.3529 instance_segmentation_loss_poly: 0.9396 +2023/11/02 01:58:41 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231101_204912 +2023/11/02 01:58:41 - mmengine - INFO - Iter(train) [237000/640000] base_lr: 1.4023e-04 lr: 1.4566e-05 eta: 5 days, 1:02:42 time: 1.0808 data_time: 0.0332 memory: 21518 grad_norm: 2.8776 loss: 1.4008 caption_loss_cls: 2.3109 grounding_loss_reg: 2.9539 detection_loss_cls: 0.0395 detection_loss_reg: 0.3502 semantic_segmentation_loss_cls: 0.0105 instance_segmentation_loss_cls: 0.0400 instance_segmentation_loss_reg: 0.3513 instance_segmentation_loss_poly: 0.9362 +2023/11/02 01:58:41 - mmengine - INFO - Saving checkpoint at 237000 iterations +2023/11/02 02:07:49 - mmengine - INFO - Iter(train) [237500/640000] base_lr: 1.4001e-04 lr: 1.4546e-05 eta: 5 days, 0:56:23 time: 1.0758 data_time: 0.0328 memory: 21518 grad_norm: 2.8728 loss: 1.3884 caption_loss_cls: 2.3034 grounding_loss_reg: 2.9513 detection_loss_cls: 0.0393 detection_loss_reg: 0.3493 semantic_segmentation_loss_cls: 0.0105 instance_segmentation_loss_cls: 0.0399 instance_segmentation_loss_reg: 0.3502 instance_segmentation_loss_poly: 0.9343 +2023/11/02 02:16:40 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231101_204912 +2023/11/02 02:16:40 - mmengine - INFO - Iter(train) [238000/640000] base_lr: 1.3978e-04 lr: 1.4526e-05 eta: 5 days, 0:43:22 time: 1.0754 data_time: 0.0329 memory: 21518 grad_norm: 2.9066 loss: 1.4006 caption_loss_cls: 2.3050 grounding_loss_reg: 2.9486 detection_loss_cls: 0.0393 detection_loss_reg: 0.3497 semantic_segmentation_loss_cls: 0.0104 instance_segmentation_loss_cls: 0.0400 instance_segmentation_loss_reg: 0.3512 instance_segmentation_loss_poly: 0.9359 +2023/11/02 02:16:40 - mmengine - INFO - Saving checkpoint at 238000 iterations +2023/11/02 02:25:55 - mmengine - INFO - Iter(train) [238500/640000] base_lr: 1.3956e-04 lr: 1.4505e-05 eta: 5 days, 0:39:45 time: 1.0745 data_time: 0.0328 memory: 21518 grad_norm: 2.9283 loss: 1.4025 caption_loss_cls: 2.3002 grounding_loss_reg: 2.9478 detection_loss_cls: 0.0391 detection_loss_reg: 0.3481 semantic_segmentation_loss_cls: 0.0104 instance_segmentation_loss_cls: 0.0398 instance_segmentation_loss_reg: 0.3507 instance_segmentation_loss_poly: 0.9357 +2023/11/02 02:35:02 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231101_204912 +2023/11/02 02:35:02 - mmengine - INFO - Iter(train) [239000/640000] base_lr: 1.3933e-04 lr: 1.4485e-05 eta: 5 days, 0:32:34 time: 1.0797 data_time: 0.0330 memory: 21518 grad_norm: 2.9216 loss: 1.3950 caption_loss_cls: 2.3018 grounding_loss_reg: 2.9420 detection_loss_cls: 0.0390 detection_loss_reg: 0.3477 semantic_segmentation_loss_cls: 0.0104 instance_segmentation_loss_cls: 0.0397 instance_segmentation_loss_reg: 0.3499 instance_segmentation_loss_poly: 0.9349 +2023/11/02 02:35:02 - mmengine - INFO - Saving checkpoint at 239000 iterations +2023/11/02 02:43:55 - mmengine - INFO - Iter(train) [239500/640000] base_lr: 1.3911e-04 lr: 1.4465e-05 eta: 5 days, 0:20:53 time: 1.0758 data_time: 0.0325 memory: 21518 grad_norm: 2.9010 loss: 1.3836 caption_loss_cls: 2.3015 grounding_loss_reg: 2.9384 detection_loss_cls: 0.0390 detection_loss_reg: 0.3483 semantic_segmentation_loss_cls: 0.0104 instance_segmentation_loss_cls: 0.0397 instance_segmentation_loss_reg: 0.3503 instance_segmentation_loss_poly: 0.9357 +2023/11/02 02:52:52 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231101_204912 +2023/11/02 02:52:52 - mmengine - INFO - Iter(train) [240000/640000] base_lr: 1.3889e-04 lr: 1.4444e-05 eta: 5 days, 0:10:34 time: 1.0731 data_time: 0.0323 memory: 21518 grad_norm: 2.8959 loss: 1.3852 caption_loss_cls: 2.2999 grounding_loss_reg: 2.9385 detection_loss_cls: 0.0390 detection_loss_reg: 0.3483 semantic_segmentation_loss_cls: 0.0104 instance_segmentation_loss_cls: 0.0396 instance_segmentation_loss_reg: 0.3496 instance_segmentation_loss_poly: 0.9346 +2023/11/02 02:52:52 - mmengine - INFO - Saving checkpoint at 240000 iterations +2023/11/02 03:01:20 - mmengine - INFO - Evaluating bbox... +2023/11/02 03:02:16 - mmengine - INFO - bbox_mAP_copypaste: 0.403 0.574 0.441 0.242 0.456 0.531 +2023/11/02 03:02:16 - mmengine - INFO - Evaluating segm... +2023/11/02 03:03:28 - mmengine - INFO - segm_mAP_copypaste: 0.268 0.495 0.259 0.126 0.312 0.420 +2023/11/02 03:08:35 - mmengine - INFO - per class results: +2023/11/02 03:08:35 - mmengine - INFO - ++---------------------+-------+-------+ +| Class | IoU | Acc | ++---------------------+-------+-------+ +| wall | 73.19 | 88.68 | +| building | 80.27 | 89.69 | +| sky | 92.62 | 97.7 | +| floor | 78.95 | 87.9 | +| tree | 71.87 | 85.14 | +| ceiling | 80.89 | 93.72 | +| road | 81.6 | 89.59 | +| bed | 83.77 | 94.12 | +| windowpane | 56.97 | 71.18 | +| grass | 68.22 | 82.97 | +| cabinet | 53.27 | 64.51 | +| sidewalk | 63.36 | 72.84 | +| person | 77.12 | 88.29 | +| earth | 38.08 | 56.09 | +| door | 41.46 | 57.72 | +| table | 53.76 | 66.31 | +| mountain | 55.89 | 70.54 | +| plant | 48.75 | 65.02 | +| curtain | 67.92 | 85.06 | +| chair | 51.68 | 64.24 | +| car | 81.26 | 91.67 | +| water | 47.96 | 68.8 | +| painting | 65.8 | 85.78 | +| sofa | 59.29 | 73.74 | +| shelf | 40.14 | 53.49 | +| house | 38.19 | 56.73 | +| sea | 40.62 | 54.81 | +| mirror | 60.99 | 72.94 | +| rug | 61.71 | 67.97 | +| field | 36.66 | 50.3 | +| armchair | 38.82 | 62.27 | +| seat | 58.22 | 71.92 | +| fence | 43.37 | 56.68 | +| desk | 39.22 | 49.12 | +| rock | 19.0 | 23.16 | +| wardrobe | 45.58 | 70.02 | +| lamp | 54.37 | 66.11 | +| bathtub | 69.11 | 81.32 | +| railing | 32.94 | 43.83 | +| cushion | 49.61 | 66.42 | +| base | 24.7 | 30.91 | +| box | 22.67 | 33.84 | +| column | 41.05 | 49.08 | +| signboard | 35.92 | 46.14 | +| chest of drawers | 39.44 | 64.14 | +| counter | 31.8 | 36.46 | +| sand | 36.33 | 45.15 | +| sink | 64.33 | 74.3 | +| skyscraper | 50.09 | 64.34 | +| fireplace | 57.97 | 64.49 | +| refrigerator | 72.55 | 75.09 | +| grandstand | 36.18 | 69.62 | +| path | 17.38 | 20.21 | +| stairs | 30.98 | 46.92 | +| runway | 69.52 | 80.39 | +| case | 48.99 | 55.35 | +| pool table | 85.76 | 95.81 | +| pillow | 48.21 | 63.66 | +| screen door | 45.95 | 51.69 | +| stairway | 31.55 | 34.54 | +| river | 13.87 | 29.6 | +| bridge | 64.67 | 80.75 | +| bookcase | 33.74 | 59.95 | +| blind | 30.44 | 38.49 | +| coffee table | 46.75 | 83.62 | +| toilet | 80.75 | 87.56 | +| flower | 30.3 | 48.05 | +| book | 42.42 | 68.51 | +| hill | 12.83 | 24.98 | +| bench | 40.28 | 46.2 | +| countertop | 48.19 | 60.73 | +| stove | 68.34 | 79.05 | +| palm | 41.05 | 54.08 | +| kitchen island | 36.66 | 64.28 | +| computer | 65.79 | 76.54 | +| swivel chair | 35.59 | 47.03 | +| boat | 47.26 | 54.08 | +| bar | 50.25 | 68.45 | +| arcade machine | 32.81 | 36.52 | +| hovel | 11.33 | 13.79 | +| bus | 79.86 | 88.72 | +| towel | 57.4 | 63.46 | +| light | 32.04 | 34.25 | +| truck | 34.37 | 40.2 | +| tower | 11.18 | 14.51 | +| chandelier | 49.69 | 55.4 | +| awning | 21.41 | 40.33 | +| streetlight | 19.4 | 22.46 | +| booth | 46.72 | 50.38 | +| television receiver | 68.05 | 83.44 | +| airplane | 50.6 | 66.55 | +| dirt track | 0.0 | 0.0 | +| apparel | 29.19 | 52.3 | +| pole | 25.23 | 33.94 | +| land | 3.97 | 5.4 | +| bannister | 10.44 | 13.14 | +| escalator | 20.78 | 21.55 | +| ottoman | 35.26 | 50.33 | +| bottle | 30.11 | 36.5 | +| buffet | 41.22 | 46.41 | +| poster | 3.45 | 3.47 | +| stage | 9.01 | 18.51 | +| van | 19.54 | 30.02 | +| ship | 34.95 | 48.53 | +| fountain | 3.54 | 3.81 | +| conveyer belt | 66.84 | 81.08 | +| canopy | 28.62 | 41.74 | +| washer | 56.95 | 62.57 | +| plaything | 20.42 | 24.56 | +| swimming pool | 48.21 | 50.5 | +| stool | 40.33 | 50.92 | +| barrel | 17.08 | 51.18 | +| basket | 30.2 | 40.13 | +| waterfall | 63.13 | 86.48 | +| tent | 53.35 | 98.16 | +| bag | 11.28 | 13.5 | +| minibike | 69.7 | 77.29 | +| cradle | 54.86 | 78.11 | +| oven | 26.1 | 32.16 | +| ball | 26.96 | 31.17 | +| food | 51.2 | 63.3 | +| step | 14.13 | 17.51 | +| tank | 32.57 | 38.87 | +| trade name | 27.63 | 35.24 | +| microwave | 72.37 | 79.19 | +| pot | 43.68 | 49.62 | +| animal | 62.16 | 65.14 | +| bicycle | 50.77 | 76.79 | +| lake | 57.11 | 59.85 | +| dishwasher | 54.35 | 72.25 | +| screen | 69.98 | 85.68 | +| blanket | 5.56 | 6.33 | +| sculpture | 47.45 | 54.33 | +| hood | 48.7 | 51.5 | +| sconce | 19.43 | 21.0 | +| vase | 34.92 | 46.93 | +| traffic light | 32.82 | 42.44 | +| tray | 3.37 | 4.19 | +| ashcan | 33.45 | 42.95 | +| fan | 44.69 | 52.52 | +| pier | 54.65 | 77.81 | +| crt screen | 2.04 | 4.77 | +| plate | 49.83 | 68.09 | +| monitor | 1.5 | 1.58 | +| bulletin board | 15.54 | 18.46 | +| shower | 3.1 | 3.26 | +| radiator | 38.32 | 43.02 | +| glass | 10.12 | 10.54 | +| clock | 16.31 | 17.64 | +| flag | 32.93 | 40.41 | ++---------------------+-------+-------+ +2023/11/02 03:08:51 - mmengine - INFO - Iter(val) [209/209] coco/bbox_mAP: 0.4030 coco/bbox_mAP_50: 0.5740 coco/bbox_mAP_75: 0.4410 coco/bbox_mAP_s: 0.2420 coco/bbox_mAP_m: 0.4560 coco/bbox_mAP_l: 0.5310 coco/segm_mAP: 0.2680 coco/segm_mAP_50: 0.4950 coco/segm_mAP_75: 0.2590 coco/segm_mAP_s: 0.1260 coco/segm_mAP_m: 0.3120 coco/segm_mAP_l: 0.4200 Bleu_1: 0.7203 Bleu_2: 0.5480 Bleu_3: 0.4069 Bleu_4: 0.3007 METEOR: 0.2497 ROUGE_L: 0.5267 CIDEr: 0.9424 SPICE: 0.1828 aAcc: 80.5600 mIoU: 42.7300 mAcc: 53.7100 visual-grounding/miou: 0.7387 visual-grounding/acc: 0.8180 data_time: 0.0093 time: 0.5256 +2023/11/02 03:18:03 - mmengine - INFO - Iter(train) [240500/640000] base_lr: 1.3866e-04 lr: 1.4424e-05 eta: 5 days, 0:05:31 time: 1.0800 data_time: 0.0300 memory: 21516 grad_norm: 2.8873 loss: 1.3846 caption_loss_cls: 2.3025 grounding_loss_reg: 2.9378 detection_loss_cls: 0.0389 detection_loss_reg: 0.3491 semantic_segmentation_loss_cls: 0.0104 instance_segmentation_loss_cls: 0.0396 instance_segmentation_loss_reg: 0.3502 instance_segmentation_loss_poly: 0.9359 +2023/11/02 03:27:00 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231101_204912 +2023/11/02 03:27:00 - mmengine - INFO - Iter(train) [241000/640000] base_lr: 1.3844e-04 lr: 1.4403e-05 eta: 4 days, 23:55:06 time: 1.0848 data_time: 0.0305 memory: 21516 grad_norm: 2.8615 loss: 1.3883 caption_loss_cls: 2.3050 grounding_loss_reg: 2.9403 detection_loss_cls: 0.0390 detection_loss_reg: 0.3497 semantic_segmentation_loss_cls: 0.0104 instance_segmentation_loss_cls: 0.0396 instance_segmentation_loss_reg: 0.3504 instance_segmentation_loss_poly: 0.9370 +2023/11/02 03:27:00 - mmengine - INFO - Saving checkpoint at 241000 iterations +2023/11/02 03:35:40 - mmengine - INFO - Iter(train) [241500/640000] base_lr: 1.3821e-04 lr: 1.4383e-05 eta: 4 days, 23:39:41 time: 1.0780 data_time: 0.0306 memory: 21516 grad_norm: 2.9240 loss: 1.4059 caption_loss_cls: 2.3099 grounding_loss_reg: 2.9387 detection_loss_cls: 0.0390 detection_loss_reg: 0.3492 semantic_segmentation_loss_cls: 0.0104 instance_segmentation_loss_cls: 0.0395 instance_segmentation_loss_reg: 0.3494 instance_segmentation_loss_poly: 0.9351 +2023/11/02 03:44:44 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231101_204912 +2023/11/02 03:44:44 - mmengine - INFO - Iter(train) [242000/640000] base_lr: 1.3799e-04 lr: 1.4362e-05 eta: 4 days, 23:31:45 time: 1.0815 data_time: 0.0309 memory: 21516 grad_norm: 2.8894 loss: 1.4011 caption_loss_cls: 2.3095 grounding_loss_reg: 2.9374 detection_loss_cls: 0.0391 detection_loss_reg: 0.3497 semantic_segmentation_loss_cls: 0.0104 instance_segmentation_loss_cls: 0.0397 instance_segmentation_loss_reg: 0.3499 instance_segmentation_loss_poly: 0.9359 +2023/11/02 03:44:44 - mmengine - INFO - Saving checkpoint at 242000 iterations +2023/11/02 03:53:59 - mmengine - INFO - Iter(train) [242500/640000] base_lr: 1.3776e-04 lr: 1.4342e-05 eta: 4 days, 23:26:43 time: 1.0811 data_time: 0.0312 memory: 21516 grad_norm: 2.9173 loss: 1.4139 caption_loss_cls: 2.3115 grounding_loss_reg: 2.9379 detection_loss_cls: 0.0391 detection_loss_reg: 0.3500 semantic_segmentation_loss_cls: 0.0104 instance_segmentation_loss_cls: 0.0400 instance_segmentation_loss_reg: 0.3508 instance_segmentation_loss_poly: 0.9376 +2023/11/02 04:03:12 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231101_204912 +2023/11/02 04:03:12 - mmengine - INFO - Iter(train) [243000/640000] base_lr: 1.3754e-04 lr: 1.4321e-05 eta: 4 days, 23:21:21 time: 1.0830 data_time: 0.0314 memory: 21516 grad_norm: 2.8967 loss: 1.4074 caption_loss_cls: 2.3123 grounding_loss_reg: 2.9360 detection_loss_cls: 0.0390 detection_loss_reg: 0.3499 semantic_segmentation_loss_cls: 0.0104 instance_segmentation_loss_cls: 0.0401 instance_segmentation_loss_reg: 0.3515 instance_segmentation_loss_poly: 0.9377 +2023/11/02 04:03:12 - mmengine - INFO - Saving checkpoint at 243000 iterations +2023/11/02 04:12:39 - mmengine - INFO - Iter(train) [243500/640000] base_lr: 1.3731e-04 lr: 1.4301e-05 eta: 4 days, 23:19:21 time: 1.0912 data_time: 0.0323 memory: 21516 grad_norm: 2.8893 loss: 1.4168 caption_loss_cls: 2.3183 grounding_loss_reg: 2.9358 detection_loss_cls: 0.0391 detection_loss_reg: 0.3508 semantic_segmentation_loss_cls: 0.0103 instance_segmentation_loss_cls: 0.0403 instance_segmentation_loss_reg: 0.3521 instance_segmentation_loss_poly: 0.9381 +2023/11/02 04:21:23 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231101_204912 +2023/11/02 04:21:23 - mmengine - INFO - Iter(train) [244000/640000] base_lr: 1.3708e-04 lr: 1.4280e-05 eta: 4 days, 23:05:20 time: 1.0878 data_time: 0.0326 memory: 21516 grad_norm: 2.9127 loss: 1.4255 caption_loss_cls: 2.3186 grounding_loss_reg: 2.9352 detection_loss_cls: 0.0391 detection_loss_reg: 0.3503 semantic_segmentation_loss_cls: 0.0103 instance_segmentation_loss_cls: 0.0403 instance_segmentation_loss_reg: 0.3516 instance_segmentation_loss_poly: 0.9366 +2023/11/02 04:21:23 - mmengine - INFO - Saving checkpoint at 244000 iterations +2023/11/02 04:31:02 - mmengine - INFO - Iter(train) [244500/640000] base_lr: 1.3686e-04 lr: 1.4260e-05 eta: 4 days, 23:06:30 time: 1.0944 data_time: 0.0356 memory: 21516 grad_norm: 2.8473 loss: 1.4113 caption_loss_cls: 2.3185 grounding_loss_reg: 2.9355 detection_loss_cls: 0.0391 detection_loss_reg: 0.3505 semantic_segmentation_loss_cls: 0.0103 instance_segmentation_loss_cls: 0.0404 instance_segmentation_loss_reg: 0.3524 instance_segmentation_loss_poly: 0.9380 +2023/11/02 04:40:40 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231101_204912 +2023/11/02 04:40:40 - mmengine - INFO - Iter(train) [245000/640000] base_lr: 1.3663e-04 lr: 1.4239e-05 eta: 4 days, 23:06:55 time: 1.1047 data_time: 0.0360 memory: 21516 grad_norm: 2.8325 loss: 1.4045 caption_loss_cls: 2.3192 grounding_loss_reg: 2.9360 detection_loss_cls: 0.0391 detection_loss_reg: 0.3506 semantic_segmentation_loss_cls: 0.0103 instance_segmentation_loss_cls: 0.0402 instance_segmentation_loss_reg: 0.3516 instance_segmentation_loss_poly: 0.9364 +2023/11/02 04:40:40 - mmengine - INFO - Saving checkpoint at 245000 iterations +2023/11/02 04:49:58 - mmengine - INFO - Iter(train) [245500/640000] base_lr: 1.3640e-04 lr: 1.4218e-05 eta: 4 days, 23:01:45 time: 1.1141 data_time: 0.0364 memory: 21516 grad_norm: 2.7979 loss: 1.3987 caption_loss_cls: 2.3190 grounding_loss_reg: 2.9362 detection_loss_cls: 0.0390 detection_loss_reg: 0.3502 semantic_segmentation_loss_cls: 0.0103 instance_segmentation_loss_cls: 0.0400 instance_segmentation_loss_reg: 0.3506 instance_segmentation_loss_poly: 0.9352 +2023/11/02 04:59:30 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231101_204912 +2023/11/02 04:59:30 - mmengine - INFO - Iter(train) [246000/640000] base_lr: 1.3618e-04 lr: 1.4198e-05 eta: 4 days, 22:59:48 time: 1.1209 data_time: 0.0363 memory: 21516 grad_norm: 2.7732 loss: 1.3837 caption_loss_cls: 2.3198 grounding_loss_reg: 2.9349 detection_loss_cls: 0.0389 detection_loss_reg: 0.3497 semantic_segmentation_loss_cls: 0.0103 instance_segmentation_loss_cls: 0.0400 instance_segmentation_loss_reg: 0.3508 instance_segmentation_loss_poly: 0.9349 +2023/11/02 04:59:30 - mmengine - INFO - Saving checkpoint at 246000 iterations +2023/11/02 05:08:32 - mmengine - INFO - Iter(train) [246500/640000] base_lr: 1.3595e-04 lr: 1.4177e-05 eta: 4 days, 22:50:24 time: 1.1179 data_time: 0.0361 memory: 21516 grad_norm: 2.7224 loss: 1.3659 caption_loss_cls: 2.3212 grounding_loss_reg: 2.9335 detection_loss_cls: 0.0390 detection_loss_reg: 0.3502 semantic_segmentation_loss_cls: 0.0103 instance_segmentation_loss_cls: 0.0399 instance_segmentation_loss_reg: 0.3502 instance_segmentation_loss_poly: 0.9338 +2023/11/02 05:17:33 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231101_204912 +2023/11/02 05:17:33 - mmengine - INFO - Iter(train) [247000/640000] base_lr: 1.3572e-04 lr: 1.4157e-05 eta: 4 days, 22:40:38 time: 1.1147 data_time: 0.0359 memory: 21516 grad_norm: 2.7647 loss: 1.3714 caption_loss_cls: 2.3162 grounding_loss_reg: 2.9331 detection_loss_cls: 0.0389 detection_loss_reg: 0.3496 semantic_segmentation_loss_cls: 0.0103 instance_segmentation_loss_cls: 0.0399 instance_segmentation_loss_reg: 0.3509 instance_segmentation_loss_poly: 0.9345 +2023/11/02 05:17:33 - mmengine - INFO - Saving checkpoint at 247000 iterations +2023/11/02 05:26:46 - mmengine - INFO - Iter(train) [247500/640000] base_lr: 1.3549e-04 lr: 1.4136e-05 eta: 4 days, 22:33:43 time: 1.1113 data_time: 0.0354 memory: 21516 grad_norm: 2.7572 loss: 1.3614 caption_loss_cls: 2.3220 grounding_loss_reg: 2.9295 detection_loss_cls: 0.0389 detection_loss_reg: 0.3498 semantic_segmentation_loss_cls: 0.0103 instance_segmentation_loss_cls: 0.0399 instance_segmentation_loss_reg: 0.3512 instance_segmentation_loss_poly: 0.9356 +2023/11/02 05:35:54 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231101_204912 +2023/11/02 05:35:54 - mmengine - INFO - Iter(train) [248000/640000] base_lr: 1.3527e-04 lr: 1.4115e-05 eta: 4 days, 22:25:35 time: 1.1174 data_time: 0.0354 memory: 21516 grad_norm: 2.7327 loss: 1.3546 caption_loss_cls: 2.3228 grounding_loss_reg: 2.9287 detection_loss_cls: 0.0388 detection_loss_reg: 0.3504 semantic_segmentation_loss_cls: 0.0103 instance_segmentation_loss_cls: 0.0400 instance_segmentation_loss_reg: 0.3516 instance_segmentation_loss_poly: 0.9360 +2023/11/02 05:35:54 - mmengine - INFO - Saving checkpoint at 248000 iterations +2023/11/02 05:44:57 - mmengine - INFO - Iter(train) [248500/640000] base_lr: 1.3504e-04 lr: 1.4094e-05 eta: 4 days, 22:16:11 time: 1.1081 data_time: 0.0350 memory: 21516 grad_norm: 2.7998 loss: 1.3687 caption_loss_cls: 2.3261 grounding_loss_reg: 2.9257 detection_loss_cls: 0.0387 detection_loss_reg: 0.3501 semantic_segmentation_loss_cls: 0.0103 instance_segmentation_loss_cls: 0.0402 instance_segmentation_loss_reg: 0.3516 instance_segmentation_loss_poly: 0.9356 +2023/11/02 05:53:19 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231101_204912 +2023/11/02 05:53:19 - mmengine - INFO - Iter(train) [249000/640000] base_lr: 1.3481e-04 lr: 1.4074e-05 eta: 4 days, 21:57:43 time: 1.0892 data_time: 0.0344 memory: 21516 grad_norm: 2.8683 loss: 1.3842 caption_loss_cls: 2.3223 grounding_loss_reg: 2.9261 detection_loss_cls: 0.0386 detection_loss_reg: 0.3500 semantic_segmentation_loss_cls: 0.0103 instance_segmentation_loss_cls: 0.0400 instance_segmentation_loss_reg: 0.3515 instance_segmentation_loss_poly: 0.9347 +2023/11/02 05:53:19 - mmengine - INFO - Saving checkpoint at 249000 iterations +2023/11/02 06:02:29 - mmengine - INFO - Iter(train) [249500/640000] base_lr: 1.3458e-04 lr: 1.4053e-05 eta: 4 days, 21:50:08 time: 1.0871 data_time: 0.0344 memory: 21516 grad_norm: 2.8842 loss: 1.3851 caption_loss_cls: 2.3202 grounding_loss_reg: 2.9285 detection_loss_cls: 0.0385 detection_loss_reg: 0.3493 semantic_segmentation_loss_cls: 0.0103 instance_segmentation_loss_cls: 0.0400 instance_segmentation_loss_reg: 0.3511 instance_segmentation_loss_poly: 0.9340 +2023/11/02 06:11:15 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231101_204912 +2023/11/02 06:11:15 - mmengine - INFO - Iter(train) [250000/640000] base_lr: 1.3435e-04 lr: 1.4032e-05 eta: 4 days, 21:37:28 time: 1.0759 data_time: 0.0342 memory: 21516 grad_norm: 2.9418 loss: 1.3999 caption_loss_cls: 2.3164 grounding_loss_reg: 2.9276 detection_loss_cls: 0.0385 detection_loss_reg: 0.3490 semantic_segmentation_loss_cls: 0.0103 instance_segmentation_loss_cls: 0.0400 instance_segmentation_loss_reg: 0.3513 instance_segmentation_loss_poly: 0.9351 +2023/11/02 06:11:15 - mmengine - INFO - Saving checkpoint at 250000 iterations +2023/11/02 06:20:28 - mmengine - INFO - Iter(train) [250500/640000] base_lr: 1.3412e-04 lr: 1.4011e-05 eta: 4 days, 21:30:23 time: 1.0784 data_time: 0.0344 memory: 21516 grad_norm: 2.9576 loss: 1.4106 caption_loss_cls: 2.3180 grounding_loss_reg: 2.9244 detection_loss_cls: 0.0385 detection_loss_reg: 0.3487 semantic_segmentation_loss_cls: 0.0103 instance_segmentation_loss_cls: 0.0401 instance_segmentation_loss_reg: 0.3516 instance_segmentation_loss_poly: 0.9357 +2023/11/02 06:29:43 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231101_204912 +2023/11/02 06:29:43 - mmengine - INFO - Iter(train) [251000/640000] base_lr: 1.3389e-04 lr: 1.3990e-05 eta: 4 days, 21:23:50 time: 1.0820 data_time: 0.0347 memory: 21516 grad_norm: 2.9369 loss: 1.4140 caption_loss_cls: 2.3163 grounding_loss_reg: 2.9242 detection_loss_cls: 0.0386 detection_loss_reg: 0.3497 semantic_segmentation_loss_cls: 0.0103 instance_segmentation_loss_cls: 0.0400 instance_segmentation_loss_reg: 0.3509 instance_segmentation_loss_poly: 0.9338 +2023/11/02 06:29:43 - mmengine - INFO - Saving checkpoint at 251000 iterations +2023/11/02 06:38:47 - mmengine - INFO - Iter(train) [251500/640000] base_lr: 1.3367e-04 lr: 1.3970e-05 eta: 4 days, 21:14:56 time: 1.0798 data_time: 0.0347 memory: 21516 grad_norm: 2.9207 loss: 1.3965 caption_loss_cls: 2.3116 grounding_loss_reg: 2.9221 detection_loss_cls: 0.0384 detection_loss_reg: 0.3477 semantic_segmentation_loss_cls: 0.0102 instance_segmentation_loss_cls: 0.0399 instance_segmentation_loss_reg: 0.3502 instance_segmentation_loss_poly: 0.9319 +2023/11/02 06:47:47 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231101_204912 +2023/11/02 06:47:47 - mmengine - INFO - Iter(train) [252000/640000] base_lr: 1.3344e-04 lr: 1.3949e-05 eta: 4 days, 21:05:07 time: 1.0777 data_time: 0.0347 memory: 21516 grad_norm: 2.9315 loss: 1.4010 caption_loss_cls: 2.3167 grounding_loss_reg: 2.9218 detection_loss_cls: 0.0383 detection_loss_reg: 0.3472 semantic_segmentation_loss_cls: 0.0102 instance_segmentation_loss_cls: 0.0398 instance_segmentation_loss_reg: 0.3491 instance_segmentation_loss_poly: 0.9294 +2023/11/02 06:47:47 - mmengine - INFO - Saving checkpoint at 252000 iterations +2023/11/02 06:57:17 - mmengine - INFO - Iter(train) [252500/640000] base_lr: 1.3321e-04 lr: 1.3928e-05 eta: 4 days, 21:01:17 time: 1.0845 data_time: 0.0349 memory: 21516 grad_norm: 2.8867 loss: 1.3931 caption_loss_cls: 2.3188 grounding_loss_reg: 2.9206 detection_loss_cls: 0.0383 detection_loss_reg: 0.3477 semantic_segmentation_loss_cls: 0.0102 instance_segmentation_loss_cls: 0.0399 instance_segmentation_loss_reg: 0.3494 instance_segmentation_loss_poly: 0.9304 +2023/11/02 07:06:09 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231101_204912 +2023/11/02 07:06:09 - mmengine - INFO - Iter(train) [253000/640000] base_lr: 1.3298e-04 lr: 1.3907e-05 eta: 4 days, 20:49:57 time: 1.0920 data_time: 0.0351 memory: 21516 grad_norm: 2.8569 loss: 1.3817 caption_loss_cls: 2.3186 grounding_loss_reg: 2.9227 detection_loss_cls: 0.0384 detection_loss_reg: 0.3481 semantic_segmentation_loss_cls: 0.0102 instance_segmentation_loss_cls: 0.0398 instance_segmentation_loss_reg: 0.3495 instance_segmentation_loss_poly: 0.9305 +2023/11/02 07:06:09 - mmengine - INFO - Saving checkpoint at 253000 iterations +2023/11/02 07:14:59 - mmengine - INFO - Iter(train) [253500/640000] base_lr: 1.3275e-04 lr: 1.3886e-05 eta: 4 days, 20:38:13 time: 1.0870 data_time: 0.0349 memory: 21516 grad_norm: 2.8707 loss: 1.3854 caption_loss_cls: 2.3198 grounding_loss_reg: 2.9224 detection_loss_cls: 0.0383 detection_loss_reg: 0.3475 semantic_segmentation_loss_cls: 0.0102 instance_segmentation_loss_cls: 0.0397 instance_segmentation_loss_reg: 0.3484 instance_segmentation_loss_poly: 0.9294 +2023/11/02 07:24:05 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231101_204912 +2023/11/02 07:24:05 - mmengine - INFO - Iter(train) [254000/640000] base_lr: 1.3252e-04 lr: 1.3865e-05 eta: 4 days, 20:29:41 time: 1.0918 data_time: 0.0352 memory: 21516 grad_norm: 2.8433 loss: 1.3885 caption_loss_cls: 2.3198 grounding_loss_reg: 2.9229 detection_loss_cls: 0.0382 detection_loss_reg: 0.3465 semantic_segmentation_loss_cls: 0.0102 instance_segmentation_loss_cls: 0.0397 instance_segmentation_loss_reg: 0.3493 instance_segmentation_loss_poly: 0.9323 +2023/11/02 07:24:05 - mmengine - INFO - Saving checkpoint at 254000 iterations +2023/11/02 07:33:24 - mmengine - INFO - Iter(train) [254500/640000] base_lr: 1.3229e-04 lr: 1.3844e-05 eta: 4 days, 20:23:39 time: 1.0937 data_time: 0.0354 memory: 21516 grad_norm: 2.8480 loss: 1.3970 caption_loss_cls: 2.3190 grounding_loss_reg: 2.9248 detection_loss_cls: 0.0383 detection_loss_reg: 0.3478 semantic_segmentation_loss_cls: 0.0102 instance_segmentation_loss_cls: 0.0396 instance_segmentation_loss_reg: 0.3484 instance_segmentation_loss_poly: 0.9306 +2023/11/02 07:42:19 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231101_204912 +2023/11/02 07:42:19 - mmengine - INFO - Iter(train) [255000/640000] base_lr: 1.3205e-04 lr: 1.3823e-05 eta: 4 days, 20:12:53 time: 1.0885 data_time: 0.0353 memory: 21516 grad_norm: 2.8494 loss: 1.3963 caption_loss_cls: 2.3203 grounding_loss_reg: 2.9217 detection_loss_cls: 0.0383 detection_loss_reg: 0.3472 semantic_segmentation_loss_cls: 0.0102 instance_segmentation_loss_cls: 0.0396 instance_segmentation_loss_reg: 0.3490 instance_segmentation_loss_poly: 0.9312 +2023/11/02 07:42:19 - mmengine - INFO - Saving checkpoint at 255000 iterations +2023/11/02 07:51:18 - mmengine - INFO - Iter(train) [255500/640000] base_lr: 1.3182e-04 lr: 1.3802e-05 eta: 4 days, 20:03:06 time: 1.0873 data_time: 0.0353 memory: 21516 grad_norm: 2.8805 loss: 1.4132 caption_loss_cls: 2.3200 grounding_loss_reg: 2.9253 detection_loss_cls: 0.0384 detection_loss_reg: 0.3480 semantic_segmentation_loss_cls: 0.0102 instance_segmentation_loss_cls: 0.0397 instance_segmentation_loss_reg: 0.3489 instance_segmentation_loss_poly: 0.9307 +2023/11/02 08:00:14 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231101_204912 +2023/11/02 08:00:14 - mmengine - INFO - Iter(train) [256000/640000] base_lr: 1.3159e-04 lr: 1.3781e-05 eta: 4 days, 19:52:33 time: 1.0862 data_time: 0.0353 memory: 21516 grad_norm: 2.8680 loss: 1.4017 caption_loss_cls: 2.3202 grounding_loss_reg: 2.9256 detection_loss_cls: 0.0384 detection_loss_reg: 0.3477 semantic_segmentation_loss_cls: 0.0102 instance_segmentation_loss_cls: 0.0396 instance_segmentation_loss_reg: 0.3489 instance_segmentation_loss_poly: 0.9308 +2023/11/02 08:00:14 - mmengine - INFO - Saving checkpoint at 256000 iterations +2023/11/02 08:09:39 - mmengine - INFO - Iter(train) [256500/640000] base_lr: 1.3136e-04 lr: 1.3760e-05 eta: 4 days, 19:47:18 time: 1.0850 data_time: 0.0355 memory: 21516 grad_norm: 2.8993 loss: 1.4131 caption_loss_cls: 2.3194 grounding_loss_reg: 2.9263 detection_loss_cls: 0.0385 detection_loss_reg: 0.3483 semantic_segmentation_loss_cls: 0.0102 instance_segmentation_loss_cls: 0.0396 instance_segmentation_loss_reg: 0.3495 instance_segmentation_loss_poly: 0.9334 +2023/11/02 08:18:59 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231101_204912 +2023/11/02 08:18:59 - mmengine - INFO - Iter(train) [257000/640000] base_lr: 1.3113e-04 lr: 1.3739e-05 eta: 4 days, 19:41:11 time: 1.0922 data_time: 0.0358 memory: 21516 grad_norm: 2.9132 loss: 1.4216 caption_loss_cls: 2.3218 grounding_loss_reg: 2.9253 detection_loss_cls: 0.0385 detection_loss_reg: 0.3478 semantic_segmentation_loss_cls: 0.0102 instance_segmentation_loss_cls: 0.0396 instance_segmentation_loss_reg: 0.3500 instance_segmentation_loss_poly: 0.9351 +2023/11/02 08:18:59 - mmengine - INFO - Saving checkpoint at 257000 iterations +2023/11/02 08:27:31 - mmengine - INFO - Iter(train) [257500/640000] base_lr: 1.3090e-04 lr: 1.3718e-05 eta: 4 days, 19:26:40 time: 1.0877 data_time: 0.0358 memory: 21516 grad_norm: 2.9293 loss: 1.4325 caption_loss_cls: 2.3267 grounding_loss_reg: 2.9254 detection_loss_cls: 0.0386 detection_loss_reg: 0.3487 semantic_segmentation_loss_cls: 0.0102 instance_segmentation_loss_cls: 0.0395 instance_segmentation_loss_reg: 0.3489 instance_segmentation_loss_poly: 0.9331 +2023/11/02 08:36:48 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231101_204912 +2023/11/02 08:36:48 - mmengine - INFO - Iter(train) [258000/640000] base_lr: 1.3067e-04 lr: 1.3697e-05 eta: 4 days, 19:19:53 time: 1.0904 data_time: 0.0358 memory: 21516 grad_norm: 2.9189 loss: 1.4279 caption_loss_cls: 2.3279 grounding_loss_reg: 2.9277 detection_loss_cls: 0.0385 detection_loss_reg: 0.3484 semantic_segmentation_loss_cls: 0.0102 instance_segmentation_loss_cls: 0.0395 instance_segmentation_loss_reg: 0.3489 instance_segmentation_loss_poly: 0.9332 +2023/11/02 08:36:48 - mmengine - INFO - Saving checkpoint at 258000 iterations +2023/11/02 08:46:28 - mmengine - INFO - Iter(train) [258500/640000] base_lr: 1.3044e-04 lr: 1.3676e-05 eta: 4 days, 19:16:44 time: 1.0954 data_time: 0.0358 memory: 21516 grad_norm: 2.9049 loss: 1.4094 caption_loss_cls: 2.3259 grounding_loss_reg: 2.9265 detection_loss_cls: 0.0385 detection_loss_reg: 0.3481 semantic_segmentation_loss_cls: 0.0102 instance_segmentation_loss_cls: 0.0395 instance_segmentation_loss_reg: 0.3492 instance_segmentation_loss_poly: 0.9324 +2023/11/02 08:55:16 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231101_204912 +2023/11/02 08:55:16 - mmengine - INFO - Iter(train) [259000/640000] base_lr: 1.3020e-04 lr: 1.3655e-05 eta: 4 days, 19:05:06 time: 1.0939 data_time: 0.0357 memory: 21516 grad_norm: 2.9131 loss: 1.4021 caption_loss_cls: 2.3217 grounding_loss_reg: 2.9293 detection_loss_cls: 0.0386 detection_loss_reg: 0.3489 semantic_segmentation_loss_cls: 0.0102 instance_segmentation_loss_cls: 0.0394 instance_segmentation_loss_reg: 0.3486 instance_segmentation_loss_poly: 0.9312 +2023/11/02 08:55:16 - mmengine - INFO - Saving checkpoint at 259000 iterations +2023/11/02 09:04:22 - mmengine - INFO - Iter(train) [259500/640000] base_lr: 1.2997e-04 lr: 1.3634e-05 eta: 4 days, 18:56:17 time: 1.0953 data_time: 0.0359 memory: 21516 grad_norm: 2.8996 loss: 1.4022 caption_loss_cls: 2.3164 grounding_loss_reg: 2.9305 detection_loss_cls: 0.0384 detection_loss_reg: 0.3481 semantic_segmentation_loss_cls: 0.0102 instance_segmentation_loss_cls: 0.0394 instance_segmentation_loss_reg: 0.3485 instance_segmentation_loss_poly: 0.9306 +2023/11/02 09:13:10 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231101_204912 +2023/11/02 09:13:10 - mmengine - INFO - Iter(train) [260000/640000] base_lr: 1.2974e-04 lr: 1.3613e-05 eta: 4 days, 18:44:47 time: 1.0937 data_time: 0.0358 memory: 21516 grad_norm: 2.9157 loss: 1.4042 caption_loss_cls: 2.3157 grounding_loss_reg: 2.9280 detection_loss_cls: 0.0384 detection_loss_reg: 0.3482 semantic_segmentation_loss_cls: 0.0102 instance_segmentation_loss_cls: 0.0394 instance_segmentation_loss_reg: 0.3475 instance_segmentation_loss_poly: 0.9284 +2023/11/02 09:13:10 - mmengine - INFO - Saving checkpoint at 260000 iterations +2023/11/02 09:21:58 - mmengine - INFO - Evaluating bbox... +2023/11/02 09:22:53 - mmengine - INFO - bbox_mAP_copypaste: 0.416 0.585 0.454 0.245 0.464 0.558 +2023/11/02 09:22:53 - mmengine - INFO - Evaluating segm... +2023/11/02 09:24:02 - mmengine - INFO - segm_mAP_copypaste: 0.273 0.495 0.265 0.129 0.308 0.431 +2023/11/02 09:29:10 - mmengine - INFO - per class results: +2023/11/02 09:29:10 - mmengine - INFO - ++---------------------+-------+-------+ +| Class | IoU | Acc | ++---------------------+-------+-------+ +| wall | 75.27 | 87.3 | +| building | 80.65 | 91.66 | +| sky | 93.14 | 97.13 | +| floor | 78.31 | 89.5 | +| tree | 72.86 | 85.11 | +| ceiling | 82.3 | 93.44 | +| road | 82.08 | 91.5 | +| bed | 86.0 | 95.61 | +| windowpane | 58.91 | 74.5 | +| grass | 67.31 | 85.27 | +| cabinet | 59.3 | 77.94 | +| sidewalk | 63.53 | 73.81 | +| person | 78.74 | 88.98 | +| earth | 34.32 | 43.38 | +| door | 47.94 | 61.39 | +| table | 56.83 | 77.98 | +| mountain | 51.18 | 61.82 | +| plant | 50.84 | 72.61 | +| curtain | 68.25 | 86.72 | +| chair | 53.49 | 69.2 | +| car | 81.76 | 91.89 | +| water | 49.86 | 62.46 | +| painting | 66.63 | 79.84 | +| sofa | 64.57 | 79.12 | +| shelf | 39.83 | 55.03 | +| house | 36.12 | 47.03 | +| sea | 49.88 | 74.77 | +| mirror | 61.61 | 76.36 | +| rug | 64.67 | 78.03 | +| field | 34.51 | 48.48 | +| armchair | 42.38 | 61.04 | +| seat | 51.73 | 79.43 | +| fence | 39.48 | 59.21 | +| desk | 44.2 | 64.38 | +| rock | 37.32 | 54.37 | +| wardrobe | 51.31 | 63.34 | +| lamp | 56.97 | 72.75 | +| bathtub | 68.24 | 86.15 | +| railing | 27.7 | 39.51 | +| cushion | 53.08 | 64.2 | +| base | 20.12 | 33.9 | +| box | 20.76 | 26.3 | +| column | 45.98 | 61.42 | +| signboard | 33.6 | 41.45 | +| chest of drawers | 25.52 | 29.55 | +| counter | 29.98 | 36.46 | +| sand | 37.59 | 52.85 | +| sink | 67.77 | 75.81 | +| skyscraper | 48.21 | 59.09 | +| fireplace | 69.27 | 86.84 | +| refrigerator | 64.31 | 68.54 | +| grandstand | 44.17 | 73.56 | +| path | 20.05 | 28.8 | +| stairs | 22.63 | 32.31 | +| runway | 68.83 | 88.68 | +| case | 39.11 | 53.86 | +| pool table | 88.11 | 96.06 | +| pillow | 48.5 | 59.06 | +| screen door | 61.1 | 66.0 | +| stairway | 25.99 | 36.2 | +| river | 10.38 | 17.06 | +| bridge | 50.1 | 63.27 | +| bookcase | 35.03 | 49.79 | +| blind | 23.55 | 26.89 | +| coffee table | 55.79 | 65.79 | +| toilet | 82.02 | 90.47 | +| flower | 21.95 | 23.86 | +| book | 42.2 | 54.62 | +| hill | 10.27 | 20.21 | +| bench | 41.31 | 53.65 | +| countertop | 51.56 | 68.91 | +| stove | 72.31 | 83.63 | +| palm | 46.53 | 62.23 | +| kitchen island | 20.2 | 26.6 | +| computer | 58.38 | 63.66 | +| swivel chair | 41.69 | 62.41 | +| boat | 40.3 | 49.88 | +| bar | 17.4 | 21.13 | +| arcade machine | 49.1 | 66.77 | +| hovel | 10.79 | 12.35 | +| bus | 85.56 | 96.5 | +| towel | 55.25 | 62.41 | +| light | 48.65 | 59.86 | +| truck | 32.23 | 42.32 | +| tower | 26.38 | 35.27 | +| chandelier | 57.74 | 66.45 | +| awning | 19.08 | 23.1 | +| streetlight | 20.81 | 30.37 | +| booth | 41.0 | 44.49 | +| television receiver | 65.44 | 66.96 | +| airplane | 50.3 | 63.75 | +| dirt track | 0.0 | 0.0 | +| apparel | 28.1 | 39.06 | +| pole | 10.91 | 11.98 | +| land | 1.85 | 2.59 | +| bannister | 12.55 | 19.32 | +| escalator | 32.22 | 42.04 | +| ottoman | 40.69 | 53.46 | +| bottle | 25.18 | 31.16 | +| buffet | 47.08 | 54.15 | +| poster | 29.33 | 38.66 | +| stage | 10.89 | 22.24 | +| van | 33.45 | 44.38 | +| ship | 38.11 | 92.9 | +| fountain | 21.58 | 31.26 | +| conveyer belt | 70.71 | 85.74 | +| canopy | 26.51 | 29.94 | +| washer | 60.47 | 69.99 | +| plaything | 21.84 | 36.98 | +| swimming pool | 59.09 | 74.88 | +| stool | 36.81 | 43.84 | +| barrel | 7.44 | 9.52 | +| basket | 26.15 | 38.0 | +| waterfall | 68.04 | 83.54 | +| tent | 91.97 | 97.86 | +| bag | 9.7 | 11.05 | +| minibike | 66.96 | 79.49 | +| cradle | 63.53 | 91.22 | +| oven | 44.99 | 57.71 | +| ball | 15.57 | 16.97 | +| food | 42.73 | 45.09 | +| step | 11.01 | 17.45 | +| tank | 31.13 | 33.11 | +| trade name | 6.76 | 6.86 | +| microwave | 70.61 | 76.11 | +| pot | 44.67 | 53.1 | +| animal | 51.8 | 54.43 | +| bicycle | 50.72 | 62.41 | +| lake | 49.62 | 67.9 | +| dishwasher | 47.75 | 65.81 | +| screen | 71.37 | 81.82 | +| blanket | 2.99 | 3.24 | +| sculpture | 42.16 | 49.94 | +| hood | 41.36 | 42.84 | +| sconce | 39.92 | 52.4 | +| vase | 40.59 | 52.53 | +| traffic light | 26.67 | 30.33 | +| tray | 6.29 | 8.03 | +| ashcan | 34.86 | 53.29 | +| fan | 52.44 | 64.03 | +| pier | 32.03 | 34.16 | +| crt screen | 10.27 | 31.44 | +| plate | 53.15 | 64.64 | +| monitor | 10.77 | 12.34 | +| bulletin board | 21.13 | 35.56 | +| shower | 0.83 | 1.08 | +| radiator | 49.82 | 61.04 | +| glass | 7.88 | 8.06 | +| clock | 17.61 | 20.76 | +| flag | 30.22 | 33.9 | ++---------------------+-------+-------+ +2023/11/02 09:29:25 - mmengine - INFO - Iter(val) [209/209] coco/bbox_mAP: 0.4160 coco/bbox_mAP_50: 0.5850 coco/bbox_mAP_75: 0.4540 coco/bbox_mAP_s: 0.2450 coco/bbox_mAP_m: 0.4640 coco/bbox_mAP_l: 0.5580 coco/segm_mAP: 0.2730 coco/segm_mAP_50: 0.4950 coco/segm_mAP_75: 0.2650 coco/segm_mAP_s: 0.1290 coco/segm_mAP_m: 0.3080 coco/segm_mAP_l: 0.4310 Bleu_1: 0.7140 Bleu_2: 0.5435 Bleu_3: 0.4038 Bleu_4: 0.2988 METEOR: 0.2481 ROUGE_L: 0.5261 CIDEr: 0.9290 SPICE: 0.1790 aAcc: 81.2800 mIoU: 43.5300 mAcc: 54.3800 visual-grounding/miou: 0.7418 visual-grounding/acc: 0.8198 data_time: 0.0046 time: 0.5204 +2023/11/02 09:37:45 - mmengine - INFO - Iter(train) [260500/640000] base_lr: 1.2951e-04 lr: 1.3591e-05 eta: 4 days, 18:29:16 time: 1.0780 data_time: 0.0323 memory: 21516 grad_norm: 2.9319 loss: 1.3925 caption_loss_cls: 2.3122 grounding_loss_reg: 2.9260 detection_loss_cls: 0.0383 detection_loss_reg: 0.3474 semantic_segmentation_loss_cls: 0.0102 instance_segmentation_loss_cls: 0.0394 instance_segmentation_loss_reg: 0.3476 instance_segmentation_loss_poly: 0.9284 +2023/11/02 09:46:33 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231101_204912 +2023/11/02 09:46:33 - mmengine - INFO - Iter(train) [261000/640000] base_lr: 1.2927e-04 lr: 1.3570e-05 eta: 4 days, 18:17:52 time: 1.0698 data_time: 0.0320 memory: 21516 grad_norm: 2.9023 loss: 1.3860 caption_loss_cls: 2.3104 grounding_loss_reg: 2.9242 detection_loss_cls: 0.0383 detection_loss_reg: 0.3461 semantic_segmentation_loss_cls: 0.0102 instance_segmentation_loss_cls: 0.0393 instance_segmentation_loss_reg: 0.3474 instance_segmentation_loss_poly: 0.9278 +2023/11/02 09:46:33 - mmengine - INFO - Saving checkpoint at 261000 iterations +2023/11/02 09:55:23 - mmengine - INFO - Iter(train) [261500/640000] base_lr: 1.2904e-04 lr: 1.3549e-05 eta: 4 days, 18:06:44 time: 1.0742 data_time: 0.0319 memory: 21516 grad_norm: 2.8795 loss: 1.3723 caption_loss_cls: 2.3091 grounding_loss_reg: 2.9256 detection_loss_cls: 0.0383 detection_loss_reg: 0.3462 semantic_segmentation_loss_cls: 0.0101 instance_segmentation_loss_cls: 0.0393 instance_segmentation_loss_reg: 0.3477 instance_segmentation_loss_poly: 0.9276 +2023/11/02 10:04:03 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231101_204912 +2023/11/02 10:04:03 - mmengine - INFO - Iter(train) [262000/640000] base_lr: 1.2881e-04 lr: 1.3528e-05 eta: 4 days, 17:54:16 time: 1.0650 data_time: 0.0317 memory: 21516 grad_norm: 2.9178 loss: 1.3731 caption_loss_cls: 2.3066 grounding_loss_reg: 2.9222 detection_loss_cls: 0.0384 detection_loss_reg: 0.3471 semantic_segmentation_loss_cls: 0.0102 instance_segmentation_loss_cls: 0.0393 instance_segmentation_loss_reg: 0.3479 instance_segmentation_loss_poly: 0.9275 +2023/11/02 10:04:03 - mmengine - INFO - Saving checkpoint at 262000 iterations +2023/11/02 10:12:59 - mmengine - INFO - Iter(train) [262500/640000] base_lr: 1.2857e-04 lr: 1.3507e-05 eta: 4 days, 17:44:16 time: 1.0541 data_time: 0.0313 memory: 21516 grad_norm: 2.9695 loss: 1.3862 caption_loss_cls: 2.3027 grounding_loss_reg: 2.9194 detection_loss_cls: 0.0384 detection_loss_reg: 0.3470 semantic_segmentation_loss_cls: 0.0101 instance_segmentation_loss_cls: 0.0393 instance_segmentation_loss_reg: 0.3478 instance_segmentation_loss_poly: 0.9279 +2023/11/02 10:22:17 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231101_204912 +2023/11/02 10:22:17 - mmengine - INFO - Iter(train) [263000/640000] base_lr: 1.2834e-04 lr: 1.3485e-05 eta: 4 days, 17:37:27 time: 1.0615 data_time: 0.0313 memory: 21516 grad_norm: 2.9459 loss: 1.3822 caption_loss_cls: 2.3034 grounding_loss_reg: 2.9200 detection_loss_cls: 0.0384 detection_loss_reg: 0.3465 semantic_segmentation_loss_cls: 0.0101 instance_segmentation_loss_cls: 0.0391 instance_segmentation_loss_reg: 0.3461 instance_segmentation_loss_poly: 0.9235 +2023/11/02 10:22:17 - mmengine - INFO - Saving checkpoint at 263000 iterations +2023/11/02 10:31:24 - mmengine - INFO - Iter(train) [263500/640000] base_lr: 1.2811e-04 lr: 1.3464e-05 eta: 4 days, 17:29:04 time: 1.0619 data_time: 0.0314 memory: 21516 grad_norm: 2.9655 loss: 1.3912 caption_loss_cls: 2.2994 grounding_loss_reg: 2.9208 detection_loss_cls: 0.0382 detection_loss_reg: 0.3456 semantic_segmentation_loss_cls: 0.0102 instance_segmentation_loss_cls: 0.0392 instance_segmentation_loss_reg: 0.3470 instance_segmentation_loss_poly: 0.9241 +2023/11/02 10:40:21 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231101_204912 +2023/11/02 10:40:21 - mmengine - INFO - Iter(train) [264000/640000] base_lr: 1.2787e-04 lr: 1.3443e-05 eta: 4 days, 17:19:12 time: 1.0641 data_time: 0.0316 memory: 21516 grad_norm: 2.9600 loss: 1.3991 caption_loss_cls: 2.3036 grounding_loss_reg: 2.9167 detection_loss_cls: 0.0381 detection_loss_reg: 0.3459 semantic_segmentation_loss_cls: 0.0102 instance_segmentation_loss_cls: 0.0392 instance_segmentation_loss_reg: 0.3471 instance_segmentation_loss_poly: 0.9252 +2023/11/02 10:40:21 - mmengine - INFO - Saving checkpoint at 264000 iterations +2023/11/02 10:49:37 - mmengine - INFO - Iter(train) [264500/640000] base_lr: 1.2764e-04 lr: 1.3422e-05 eta: 4 days, 17:12:03 time: 1.0775 data_time: 0.0348 memory: 21516 grad_norm: 2.9477 loss: 1.4085 caption_loss_cls: 2.3052 grounding_loss_reg: 2.9199 detection_loss_cls: 0.0381 detection_loss_reg: 0.3457 semantic_segmentation_loss_cls: 0.0102 instance_segmentation_loss_cls: 0.0393 instance_segmentation_loss_reg: 0.3470 instance_segmentation_loss_poly: 0.9245 +2023/11/02 10:58:34 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231101_204912 +2023/11/02 10:58:34 - mmengine - INFO - Iter(train) [265000/640000] base_lr: 1.2741e-04 lr: 1.3400e-05 eta: 4 days, 17:02:07 time: 1.0796 data_time: 0.0350 memory: 21516 grad_norm: 2.9790 loss: 1.4206 caption_loss_cls: 2.3071 grounding_loss_reg: 2.9173 detection_loss_cls: 0.0381 detection_loss_reg: 0.3453 semantic_segmentation_loss_cls: 0.0102 instance_segmentation_loss_cls: 0.0394 instance_segmentation_loss_reg: 0.3478 instance_segmentation_loss_poly: 0.9252 +2023/11/02 10:58:34 - mmengine - INFO - Saving checkpoint at 265000 iterations +2023/11/02 11:07:51 - mmengine - INFO - Iter(train) [265500/640000] base_lr: 1.2717e-04 lr: 1.3379e-05 eta: 4 days, 16:55:01 time: 1.0865 data_time: 0.0355 memory: 21516 grad_norm: 2.9328 loss: 1.4134 caption_loss_cls: 2.3066 grounding_loss_reg: 2.9153 detection_loss_cls: 0.0381 detection_loss_reg: 0.3454 semantic_segmentation_loss_cls: 0.0101 instance_segmentation_loss_cls: 0.0395 instance_segmentation_loss_reg: 0.3481 instance_segmentation_loss_poly: 0.9252 +2023/11/02 11:17:23 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231101_204912 +2023/11/02 11:17:23 - mmengine - INFO - Iter(train) [266000/640000] base_lr: 1.2694e-04 lr: 1.3358e-05 eta: 4 days, 16:49:56 time: 1.0995 data_time: 0.0359 memory: 21516 grad_norm: 2.8921 loss: 1.4091 caption_loss_cls: 2.3103 grounding_loss_reg: 2.9136 detection_loss_cls: 0.0382 detection_loss_reg: 0.3459 semantic_segmentation_loss_cls: 0.0101 instance_segmentation_loss_cls: 0.0396 instance_segmentation_loss_reg: 0.3490 instance_segmentation_loss_poly: 0.9283 +2023/11/02 11:17:23 - mmengine - INFO - Saving checkpoint at 266000 iterations +2023/11/02 11:26:40 - mmengine - INFO - Iter(train) [266500/640000] base_lr: 1.2670e-04 lr: 1.3337e-05 eta: 4 days, 16:42:45 time: 1.1048 data_time: 0.0361 memory: 21516 grad_norm: 2.8657 loss: 1.3976 caption_loss_cls: 2.3097 grounding_loss_reg: 2.9120 detection_loss_cls: 0.0382 detection_loss_reg: 0.3460 semantic_segmentation_loss_cls: 0.0101 instance_segmentation_loss_cls: 0.0397 instance_segmentation_loss_reg: 0.3491 instance_segmentation_loss_poly: 0.9272 +2023/11/02 11:36:03 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231101_204912 +2023/11/02 11:36:03 - mmengine - INFO - Iter(train) [267000/640000] base_lr: 1.2647e-04 lr: 1.3315e-05 eta: 4 days, 16:36:17 time: 1.1061 data_time: 0.0362 memory: 21516 grad_norm: 2.8154 loss: 1.3941 caption_loss_cls: 2.3124 grounding_loss_reg: 2.9106 detection_loss_cls: 0.0382 detection_loss_reg: 0.3466 semantic_segmentation_loss_cls: 0.0101 instance_segmentation_loss_cls: 0.0398 instance_segmentation_loss_reg: 0.3500 instance_segmentation_loss_poly: 0.9286 +2023/11/02 11:36:03 - mmengine - INFO - Saving checkpoint at 267000 iterations +2023/11/02 11:45:12 - mmengine - INFO - Iter(train) [267500/640000] base_lr: 1.2623e-04 lr: 1.3294e-05 eta: 4 days, 16:27:53 time: 1.1065 data_time: 0.0362 memory: 21516 grad_norm: 2.8134 loss: 1.3921 caption_loss_cls: 2.3099 grounding_loss_reg: 2.9117 detection_loss_cls: 0.0382 detection_loss_reg: 0.3466 semantic_segmentation_loss_cls: 0.0101 instance_segmentation_loss_cls: 0.0398 instance_segmentation_loss_reg: 0.3490 instance_segmentation_loss_poly: 0.9261 +2023/11/02 11:54:25 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231101_204912 +2023/11/02 11:54:25 - mmengine - INFO - Iter(train) [268000/640000] base_lr: 1.2600e-04 lr: 1.3272e-05 eta: 4 days, 16:20:05 time: 1.1105 data_time: 0.0363 memory: 21516 grad_norm: 2.7975 loss: 1.3843 caption_loss_cls: 2.3056 grounding_loss_reg: 2.9117 detection_loss_cls: 0.0383 detection_loss_reg: 0.3474 semantic_segmentation_loss_cls: 0.0101 instance_segmentation_loss_cls: 0.0399 instance_segmentation_loss_reg: 0.3498 instance_segmentation_loss_poly: 0.9283 +2023/11/02 11:54:25 - mmengine - INFO - Saving checkpoint at 268000 iterations +2023/11/02 12:03:47 - mmengine - INFO - Iter(train) [268500/640000] base_lr: 1.2576e-04 lr: 1.3251e-05 eta: 4 days, 16:13:16 time: 1.1118 data_time: 0.0368 memory: 21516 grad_norm: 2.7977 loss: 1.3793 caption_loss_cls: 2.3017 grounding_loss_reg: 2.9101 detection_loss_cls: 0.0383 detection_loss_reg: 0.3464 semantic_segmentation_loss_cls: 0.0101 instance_segmentation_loss_cls: 0.0400 instance_segmentation_loss_reg: 0.3499 instance_segmentation_loss_poly: 0.9287 +2023/11/02 12:13:19 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231101_204912 +2023/11/02 12:13:19 - mmengine - INFO - Iter(train) [269000/640000] base_lr: 1.2553e-04 lr: 1.3230e-05 eta: 4 days, 16:07:50 time: 1.1209 data_time: 0.0366 memory: 21516 grad_norm: 2.7501 loss: 1.3556 caption_loss_cls: 2.3078 grounding_loss_reg: 2.9062 detection_loss_cls: 0.0384 detection_loss_reg: 0.3473 semantic_segmentation_loss_cls: 0.0101 instance_segmentation_loss_cls: 0.0401 instance_segmentation_loss_reg: 0.3504 instance_segmentation_loss_poly: 0.9296 +2023/11/02 12:13:19 - mmengine - INFO - Saving checkpoint at 269000 iterations +2023/11/02 12:22:31 - mmengine - INFO - Iter(train) [269500/640000] base_lr: 1.2529e-04 lr: 1.3208e-05 eta: 4 days, 15:59:43 time: 1.1196 data_time: 0.0363 memory: 21516 grad_norm: 2.7721 loss: 1.3575 caption_loss_cls: 2.3106 grounding_loss_reg: 2.9050 detection_loss_cls: 0.0383 detection_loss_reg: 0.3473 semantic_segmentation_loss_cls: 0.0101 instance_segmentation_loss_cls: 0.0401 instance_segmentation_loss_reg: 0.3510 instance_segmentation_loss_poly: 0.9294 +2023/11/02 12:31:44 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231101_204912 +2023/11/02 12:31:44 - mmengine - INFO - Iter(train) [270000/640000] base_lr: 1.2506e-04 lr: 1.3187e-05 eta: 4 days, 15:51:41 time: 1.1148 data_time: 0.0361 memory: 21516 grad_norm: 2.7995 loss: 1.3642 caption_loss_cls: 2.3138 grounding_loss_reg: 2.9042 detection_loss_cls: 0.0384 detection_loss_reg: 0.3479 semantic_segmentation_loss_cls: 0.0101 instance_segmentation_loss_cls: 0.0399 instance_segmentation_loss_reg: 0.3503 instance_segmentation_loss_poly: 0.9280 +2023/11/02 12:31:44 - mmengine - INFO - Saving checkpoint at 270000 iterations +2023/11/02 12:40:48 - mmengine - INFO - Iter(train) [270500/640000] base_lr: 1.2482e-04 lr: 1.3165e-05 eta: 4 days, 15:42:34 time: 1.1115 data_time: 0.0360 memory: 21516 grad_norm: 2.7933 loss: 1.3664 caption_loss_cls: 2.3132 grounding_loss_reg: 2.9029 detection_loss_cls: 0.0384 detection_loss_reg: 0.3480 semantic_segmentation_loss_cls: 0.0101 instance_segmentation_loss_cls: 0.0399 instance_segmentation_loss_reg: 0.3498 instance_segmentation_loss_poly: 0.9261 +2023/11/02 12:49:31 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231101_204912 +2023/11/02 12:49:31 - mmengine - INFO - Iter(train) [271000/640000] base_lr: 1.2458e-04 lr: 1.3144e-05 eta: 4 days, 15:30:54 time: 1.1014 data_time: 0.0358 memory: 21516 grad_norm: 2.8700 loss: 1.3768 caption_loss_cls: 2.3132 grounding_loss_reg: 2.9012 detection_loss_cls: 0.0382 detection_loss_reg: 0.3474 semantic_segmentation_loss_cls: 0.0101 instance_segmentation_loss_cls: 0.0399 instance_segmentation_loss_reg: 0.3504 instance_segmentation_loss_poly: 0.9270 +2023/11/02 12:49:31 - mmengine - INFO - Saving checkpoint at 271000 iterations +2023/11/02 12:58:40 - mmengine - INFO - Iter(train) [271500/640000] base_lr: 1.2435e-04 lr: 1.3123e-05 eta: 4 days, 15:22:21 time: 1.1014 data_time: 0.0356 memory: 21516 grad_norm: 2.8516 loss: 1.3605 caption_loss_cls: 2.3136 grounding_loss_reg: 2.9020 detection_loss_cls: 0.0382 detection_loss_reg: 0.3471 semantic_segmentation_loss_cls: 0.0101 instance_segmentation_loss_cls: 0.0398 instance_segmentation_loss_reg: 0.3510 instance_segmentation_loss_poly: 0.9280 +2023/11/02 13:07:45 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231101_204912 +2023/11/02 13:07:45 - mmengine - INFO - Iter(train) [272000/640000] base_lr: 1.2411e-04 lr: 1.3101e-05 eta: 4 days, 15:13:22 time: 1.0993 data_time: 0.0356 memory: 21516 grad_norm: 2.8845 loss: 1.3670 caption_loss_cls: 2.3091 grounding_loss_reg: 2.8985 detection_loss_cls: 0.0383 detection_loss_reg: 0.3477 semantic_segmentation_loss_cls: 0.0101 instance_segmentation_loss_cls: 0.0398 instance_segmentation_loss_reg: 0.3515 instance_segmentation_loss_poly: 0.9289 +2023/11/02 13:07:45 - mmengine - INFO - Saving checkpoint at 272000 iterations +2023/11/02 13:16:21 - mmengine - INFO - Iter(train) [272500/640000] base_lr: 1.2388e-04 lr: 1.3080e-05 eta: 4 days, 15:01:03 time: 1.0881 data_time: 0.0347 memory: 21516 grad_norm: 2.9129 loss: 1.3759 caption_loss_cls: 2.3086 grounding_loss_reg: 2.8990 detection_loss_cls: 0.0383 detection_loss_reg: 0.3485 semantic_segmentation_loss_cls: 0.0100 instance_segmentation_loss_cls: 0.0397 instance_segmentation_loss_reg: 0.3505 instance_segmentation_loss_poly: 0.9271 +2023/11/02 13:26:01 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231101_204912 +2023/11/02 13:26:01 - mmengine - INFO - Iter(train) [273000/640000] base_lr: 1.2364e-04 lr: 1.3058e-05 eta: 4 days, 14:56:07 time: 1.0898 data_time: 0.0351 memory: 21516 grad_norm: 2.9225 loss: 1.3861 caption_loss_cls: 2.3126 grounding_loss_reg: 2.8959 detection_loss_cls: 0.0382 detection_loss_reg: 0.3482 semantic_segmentation_loss_cls: 0.0100 instance_segmentation_loss_cls: 0.0399 instance_segmentation_loss_reg: 0.3525 instance_segmentation_loss_poly: 0.9312 +2023/11/02 13:26:01 - mmengine - INFO - Saving checkpoint at 273000 iterations +2023/11/02 13:35:07 - mmengine - INFO - Iter(train) [273500/640000] base_lr: 1.2340e-04 lr: 1.3037e-05 eta: 4 days, 14:47:16 time: 1.0884 data_time: 0.0353 memory: 21516 grad_norm: 2.9274 loss: 1.3902 caption_loss_cls: 2.3094 grounding_loss_reg: 2.8943 detection_loss_cls: 0.0382 detection_loss_reg: 0.3476 semantic_segmentation_loss_cls: 0.0100 instance_segmentation_loss_cls: 0.0400 instance_segmentation_loss_reg: 0.3528 instance_segmentation_loss_poly: 0.9305 +2023/11/02 13:44:06 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231101_204912 +2023/11/02 13:44:06 - mmengine - INFO - Iter(train) [274000/640000] base_lr: 1.2317e-04 lr: 1.3015e-05 eta: 4 days, 14:37:35 time: 1.0850 data_time: 0.0352 memory: 21516 grad_norm: 2.9256 loss: 1.3895 caption_loss_cls: 2.3128 grounding_loss_reg: 2.8894 detection_loss_cls: 0.0384 detection_loss_reg: 0.3490 semantic_segmentation_loss_cls: 0.0100 instance_segmentation_loss_cls: 0.0399 instance_segmentation_loss_reg: 0.3520 instance_segmentation_loss_poly: 0.9284 +2023/11/02 13:44:06 - mmengine - INFO - Saving checkpoint at 274000 iterations +2023/11/02 13:52:57 - mmengine - INFO - Iter(train) [274500/640000] base_lr: 1.2293e-04 lr: 1.2994e-05 eta: 4 days, 14:27:01 time: 1.0817 data_time: 0.0351 memory: 21516 grad_norm: 2.9351 loss: 1.3900 caption_loss_cls: 2.3165 grounding_loss_reg: 2.8879 detection_loss_cls: 0.0384 detection_loss_reg: 0.3498 semantic_segmentation_loss_cls: 0.0100 instance_segmentation_loss_cls: 0.0398 instance_segmentation_loss_reg: 0.3518 instance_segmentation_loss_poly: 0.9280 +2023/11/02 14:01:57 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231101_204912 +2023/11/02 14:01:57 - mmengine - INFO - Iter(train) [275000/640000] base_lr: 1.2269e-04 lr: 1.2972e-05 eta: 4 days, 14:17:26 time: 1.0858 data_time: 0.0354 memory: 21516 grad_norm: 2.9167 loss: 1.3981 caption_loss_cls: 2.3134 grounding_loss_reg: 2.8883 detection_loss_cls: 0.0383 detection_loss_reg: 0.3486 semantic_segmentation_loss_cls: 0.0100 instance_segmentation_loss_cls: 0.0399 instance_segmentation_loss_reg: 0.3524 instance_segmentation_loss_poly: 0.9294 +2023/11/02 14:01:57 - mmengine - INFO - Saving checkpoint at 275000 iterations +2023/11/02 14:10:53 - mmengine - INFO - Iter(train) [275500/640000] base_lr: 1.2245e-04 lr: 1.2950e-05 eta: 4 days, 14:07:33 time: 1.0829 data_time: 0.0354 memory: 21516 grad_norm: 2.9406 loss: 1.4090 caption_loss_cls: 2.3120 grounding_loss_reg: 2.8868 detection_loss_cls: 0.0381 detection_loss_reg: 0.3481 semantic_segmentation_loss_cls: 0.0100 instance_segmentation_loss_cls: 0.0397 instance_segmentation_loss_reg: 0.3517 instance_segmentation_loss_poly: 0.9278 +2023/11/02 14:18:52 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231101_204912 +2023/11/02 14:18:52 - mmengine - INFO - Iter(train) [276000/640000] base_lr: 1.2222e-04 lr: 1.2929e-05 eta: 4 days, 13:51:25 time: 1.0663 data_time: 0.0347 memory: 21516 grad_norm: 2.9712 loss: 1.4142 caption_loss_cls: 2.3100 grounding_loss_reg: 2.8850 detection_loss_cls: 0.0381 detection_loss_reg: 0.3486 semantic_segmentation_loss_cls: 0.0100 instance_segmentation_loss_cls: 0.0397 instance_segmentation_loss_reg: 0.3520 instance_segmentation_loss_poly: 0.9284 +2023/11/02 14:18:52 - mmengine - INFO - Saving checkpoint at 276000 iterations +2023/11/02 14:28:16 - mmengine - INFO - Iter(train) [276500/640000] base_lr: 1.2198e-04 lr: 1.2907e-05 eta: 4 days, 13:44:36 time: 1.0783 data_time: 0.0352 memory: 21516 grad_norm: 2.9222 loss: 1.3993 caption_loss_cls: 2.3114 grounding_loss_reg: 2.8839 detection_loss_cls: 0.0381 detection_loss_reg: 0.3481 semantic_segmentation_loss_cls: 0.0099 instance_segmentation_loss_cls: 0.0397 instance_segmentation_loss_reg: 0.3517 instance_segmentation_loss_poly: 0.9260 +2023/11/02 14:37:13 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231101_204912 +2023/11/02 14:37:13 - mmengine - INFO - Iter(train) [277000/640000] base_lr: 1.2174e-04 lr: 1.2886e-05 eta: 4 days, 13:34:49 time: 1.0676 data_time: 0.0347 memory: 21516 grad_norm: 2.9697 loss: 1.4070 caption_loss_cls: 2.3088 grounding_loss_reg: 2.8817 detection_loss_cls: 0.0380 detection_loss_reg: 0.3476 semantic_segmentation_loss_cls: 0.0099 instance_segmentation_loss_cls: 0.0396 instance_segmentation_loss_reg: 0.3517 instance_segmentation_loss_poly: 0.9252 +2023/11/02 14:37:13 - mmengine - INFO - Saving checkpoint at 277000 iterations +2023/11/02 14:46:41 - mmengine - INFO - Iter(train) [277500/640000] base_lr: 1.2150e-04 lr: 1.2864e-05 eta: 4 days, 13:28:19 time: 1.0730 data_time: 0.0366 memory: 21516 grad_norm: 2.9644 loss: 1.4043 caption_loss_cls: 2.3039 grounding_loss_reg: 2.8821 detection_loss_cls: 0.0380 detection_loss_reg: 0.3480 semantic_segmentation_loss_cls: 0.0100 instance_segmentation_loss_cls: 0.0398 instance_segmentation_loss_reg: 0.3532 instance_segmentation_loss_poly: 0.9281 +2023/11/02 14:55:22 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231101_204912 +2023/11/02 14:55:22 - mmengine - INFO - Iter(train) [278000/640000] base_lr: 1.2127e-04 lr: 1.2842e-05 eta: 4 days, 13:16:49 time: 1.0684 data_time: 0.0363 memory: 21516 grad_norm: 2.9916 loss: 1.3988 caption_loss_cls: 2.2999 grounding_loss_reg: 2.8801 detection_loss_cls: 0.0380 detection_loss_reg: 0.3478 semantic_segmentation_loss_cls: 0.0099 instance_segmentation_loss_cls: 0.0398 instance_segmentation_loss_reg: 0.3529 instance_segmentation_loss_poly: 0.9283 +2023/11/02 14:55:22 - mmengine - INFO - Saving checkpoint at 278000 iterations +2023/11/02 15:05:07 - mmengine - INFO - Iter(train) [278500/640000] base_lr: 1.2103e-04 lr: 1.2821e-05 eta: 4 days, 13:12:02 time: 1.0819 data_time: 0.0370 memory: 21516 grad_norm: 2.9546 loss: 1.3988 caption_loss_cls: 2.3041 grounding_loss_reg: 2.8777 detection_loss_cls: 0.0380 detection_loss_reg: 0.3490 semantic_segmentation_loss_cls: 0.0099 instance_segmentation_loss_cls: 0.0399 instance_segmentation_loss_reg: 0.3545 instance_segmentation_loss_poly: 0.9315 +2023/11/02 15:14:10 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231101_204912 +2023/11/02 15:14:10 - mmengine - INFO - Iter(train) [279000/640000] base_lr: 1.2079e-04 lr: 1.2799e-05 eta: 4 days, 13:02:50 time: 1.0827 data_time: 0.0369 memory: 21516 grad_norm: 2.9489 loss: 1.3910 caption_loss_cls: 2.3025 grounding_loss_reg: 2.8778 detection_loss_cls: 0.0381 detection_loss_reg: 0.3497 semantic_segmentation_loss_cls: 0.0099 instance_segmentation_loss_cls: 0.0400 instance_segmentation_loss_reg: 0.3553 instance_segmentation_loss_poly: 0.9324 +2023/11/02 15:14:10 - mmengine - INFO - Saving checkpoint at 279000 iterations +2023/11/02 15:23:26 - mmengine - INFO - Iter(train) [279500/640000] base_lr: 1.2055e-04 lr: 1.2778e-05 eta: 4 days, 12:55:01 time: 1.0876 data_time: 0.0370 memory: 21516 grad_norm: 2.9380 loss: 1.3933 caption_loss_cls: 2.3072 grounding_loss_reg: 2.8758 detection_loss_cls: 0.0383 detection_loss_reg: 0.3513 semantic_segmentation_loss_cls: 0.0099 instance_segmentation_loss_cls: 0.0401 instance_segmentation_loss_reg: 0.3562 instance_segmentation_loss_poly: 0.9340 +2023/11/02 15:32:22 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231101_204912 +2023/11/02 15:32:22 - mmengine - INFO - Iter(train) [280000/640000] base_lr: 1.2031e-04 lr: 1.2756e-05 eta: 4 days, 12:45:12 time: 1.1021 data_time: 0.0375 memory: 21516 grad_norm: 2.8908 loss: 1.3862 caption_loss_cls: 2.3103 grounding_loss_reg: 2.8756 detection_loss_cls: 0.0382 detection_loss_reg: 0.3505 semantic_segmentation_loss_cls: 0.0099 instance_segmentation_loss_cls: 0.0400 instance_segmentation_loss_reg: 0.3560 instance_segmentation_loss_poly: 0.9347 +2023/11/02 15:32:22 - mmengine - INFO - Saving checkpoint at 280000 iterations +2023/11/02 15:40:54 - mmengine - INFO - Evaluating bbox... +2023/11/02 15:41:49 - mmengine - INFO - bbox_mAP_copypaste: 0.422 0.594 0.457 0.257 0.474 0.555 +2023/11/02 15:41:49 - mmengine - INFO - Evaluating segm... +2023/11/02 15:43:00 - mmengine - INFO - segm_mAP_copypaste: 0.281 0.512 0.274 0.138 0.324 0.430 +2023/11/02 15:47:39 - mmengine - INFO - per class results: +2023/11/02 15:47:39 - mmengine - INFO - ++---------------------+-------+-------+ +| Class | IoU | Acc | ++---------------------+-------+-------+ +| wall | 75.98 | 88.33 | +| building | 79.06 | 93.44 | +| sky | 92.6 | 96.87 | +| floor | 78.47 | 87.37 | +| tree | 71.79 | 85.7 | +| ceiling | 81.73 | 90.46 | +| road | 81.98 | 89.52 | +| bed | 83.31 | 94.92 | +| windowpane | 58.22 | 71.25 | +| grass | 67.35 | 77.56 | +| cabinet | 56.84 | 71.06 | +| sidewalk | 63.36 | 74.16 | +| person | 78.26 | 88.83 | +| earth | 39.07 | 64.17 | +| door | 48.63 | 68.38 | +| table | 51.86 | 79.28 | +| mountain | 55.96 | 72.21 | +| plant | 51.7 | 66.62 | +| curtain | 68.39 | 79.6 | +| chair | 53.6 | 70.41 | +| car | 79.38 | 87.21 | +| water | 47.1 | 61.1 | +| painting | 67.55 | 85.79 | +| sofa | 62.02 | 76.6 | +| shelf | 40.24 | 52.98 | +| house | 34.63 | 47.83 | +| sea | 43.12 | 71.45 | +| mirror | 62.89 | 70.21 | +| rug | 54.87 | 58.57 | +| field | 34.42 | 47.99 | +| armchair | 41.52 | 59.89 | +| seat | 63.74 | 77.5 | +| fence | 36.7 | 54.96 | +| desk | 39.9 | 63.24 | +| rock | 30.18 | 38.73 | +| wardrobe | 44.27 | 52.21 | +| lamp | 57.12 | 69.82 | +| bathtub | 69.78 | 84.4 | +| railing | 25.39 | 33.1 | +| cushion | 47.33 | 55.18 | +| base | 28.67 | 50.1 | +| box | 17.57 | 22.14 | +| column | 49.88 | 56.99 | +| signboard | 32.5 | 40.67 | +| chest of drawers | 34.03 | 62.38 | +| counter | 22.44 | 34.59 | +| sand | 42.02 | 55.06 | +| sink | 63.48 | 76.51 | +| skyscraper | 35.29 | 41.26 | +| fireplace | 69.76 | 85.18 | +| refrigerator | 70.59 | 86.67 | +| grandstand | 41.93 | 72.94 | +| path | 16.27 | 22.6 | +| stairs | 24.17 | 31.6 | +| runway | 72.71 | 77.39 | +| case | 28.8 | 34.25 | +| pool table | 88.81 | 94.9 | +| pillow | 42.84 | 47.04 | +| screen door | 53.44 | 54.17 | +| stairway | 33.49 | 41.23 | +| river | 12.52 | 15.33 | +| bridge | 35.96 | 49.13 | +| bookcase | 35.32 | 52.84 | +| blind | 13.03 | 13.55 | +| coffee table | 44.66 | 46.8 | +| toilet | 81.8 | 87.64 | +| flower | 35.35 | 46.02 | +| book | 42.84 | 64.19 | +| hill | 11.5 | 21.86 | +| bench | 42.5 | 48.43 | +| countertop | 44.48 | 56.3 | +| stove | 68.7 | 80.18 | +| palm | 46.2 | 62.54 | +| kitchen island | 33.51 | 70.29 | +| computer | 68.89 | 85.02 | +| swivel chair | 32.03 | 38.28 | +| boat | 60.22 | 79.35 | +| bar | 22.34 | 33.76 | +| arcade machine | 62.35 | 67.59 | +| hovel | 14.73 | 16.16 | +| bus | 84.13 | 93.26 | +| towel | 53.77 | 76.35 | +| light | 37.93 | 42.22 | +| truck | 31.65 | 55.02 | +| tower | 14.03 | 18.61 | +| chandelier | 60.4 | 68.32 | +| awning | 18.98 | 21.76 | +| streetlight | 23.34 | 29.7 | +| booth | 35.9 | 75.16 | +| television receiver | 70.16 | 78.06 | +| airplane | 46.89 | 63.31 | +| dirt track | 0.0 | 0.0 | +| apparel | 24.98 | 47.47 | +| pole | 24.22 | 30.26 | +| land | 1.87 | 2.28 | +| bannister | 10.05 | 12.31 | +| escalator | 25.18 | 28.09 | +| ottoman | 43.65 | 51.96 | +| bottle | 20.29 | 23.47 | +| buffet | 40.64 | 49.63 | +| poster | 26.03 | 34.47 | +| stage | 13.2 | 23.16 | +| van | 26.73 | 33.85 | +| ship | 41.79 | 45.84 | +| fountain | 27.94 | 29.87 | +| conveyer belt | 71.11 | 77.36 | +| canopy | 15.89 | 17.24 | +| washer | 61.84 | 75.25 | +| plaything | 18.76 | 22.79 | +| swimming pool | 50.96 | 78.81 | +| stool | 38.98 | 52.55 | +| barrel | 9.21 | 13.55 | +| basket | 27.57 | 40.62 | +| waterfall | 43.98 | 58.32 | +| tent | 77.34 | 97.79 | +| bag | 12.69 | 14.73 | +| minibike | 69.38 | 76.81 | +| cradle | 65.71 | 76.24 | +| oven | 15.93 | 20.02 | +| ball | 27.56 | 31.46 | +| food | 55.47 | 66.92 | +| step | 10.15 | 10.76 | +| tank | 21.54 | 24.38 | +| trade name | 14.97 | 15.56 | +| microwave | 68.96 | 76.06 | +| pot | 37.58 | 41.12 | +| animal | 51.71 | 52.84 | +| bicycle | 54.09 | 69.58 | +| lake | 36.35 | 38.2 | +| dishwasher | 52.92 | 67.9 | +| screen | 56.2 | 68.66 | +| blanket | 10.71 | 14.19 | +| sculpture | 40.2 | 63.44 | +| hood | 43.89 | 45.58 | +| sconce | 23.11 | 24.6 | +| vase | 37.61 | 52.3 | +| traffic light | 34.46 | 51.43 | +| tray | 6.26 | 15.52 | +| ashcan | 33.39 | 38.05 | +| fan | 47.64 | 69.8 | +| pier | 28.24 | 37.55 | +| crt screen | 14.06 | 46.98 | +| plate | 55.19 | 68.63 | +| monitor | 7.85 | 8.71 | +| bulletin board | 30.38 | 39.89 | +| shower | 1.09 | 4.18 | +| radiator | 32.08 | 33.39 | +| glass | 12.73 | 13.56 | +| clock | 22.29 | 29.46 | +| flag | 30.18 | 34.04 | ++---------------------+-------+-------+ +2023/11/02 15:47:54 - mmengine - INFO - Iter(val) [209/209] coco/bbox_mAP: 0.4220 coco/bbox_mAP_50: 0.5940 coco/bbox_mAP_75: 0.4570 coco/bbox_mAP_s: 0.2570 coco/bbox_mAP_m: 0.4740 coco/bbox_mAP_l: 0.5550 coco/segm_mAP: 0.2810 coco/segm_mAP_50: 0.5120 coco/segm_mAP_75: 0.2740 coco/segm_mAP_s: 0.1380 coco/segm_mAP_m: 0.3240 coco/segm_mAP_l: 0.4300 Bleu_1: 0.7240 Bleu_2: 0.5556 Bleu_3: 0.4131 Bleu_4: 0.3039 METEOR: 0.2529 ROUGE_L: 0.5315 CIDEr: 0.9715 SPICE: 0.1832 aAcc: 80.8400 mIoU: 42.5300 mAcc: 53.2900 visual-grounding/miou: 0.7412 visual-grounding/acc: 0.8177 data_time: 0.0045 time: 0.5192 +2023/11/02 15:57:01 - mmengine - INFO - Iter(train) [280500/640000] base_lr: 1.2008e-04 lr: 1.2734e-05 eta: 4 days, 12:36:34 time: 1.0980 data_time: 0.0347 memory: 21516 grad_norm: 2.9077 loss: 1.4014 caption_loss_cls: 2.3121 grounding_loss_reg: 2.8790 detection_loss_cls: 0.0384 detection_loss_reg: 0.3519 semantic_segmentation_loss_cls: 0.0099 instance_segmentation_loss_cls: 0.0402 instance_segmentation_loss_reg: 0.3576 instance_segmentation_loss_poly: 0.9374 +2023/11/02 16:06:25 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231101_204912 +2023/11/02 16:06:25 - mmengine - INFO - Iter(train) [281000/640000] base_lr: 1.1984e-04 lr: 1.2713e-05 eta: 4 days, 12:29:31 time: 1.1050 data_time: 0.0349 memory: 21516 grad_norm: 2.8732 loss: 1.3918 caption_loss_cls: 2.3124 grounding_loss_reg: 2.8793 detection_loss_cls: 0.0384 detection_loss_reg: 0.3528 semantic_segmentation_loss_cls: 0.0099 instance_segmentation_loss_cls: 0.0400 instance_segmentation_loss_reg: 0.3567 instance_segmentation_loss_poly: 0.9350 +2023/11/02 16:06:25 - mmengine - INFO - Saving checkpoint at 281000 iterations +2023/11/02 16:15:56 - mmengine - INFO - Iter(train) [281500/640000] base_lr: 1.1960e-04 lr: 1.2691e-05 eta: 4 days, 12:23:02 time: 1.1057 data_time: 0.0333 memory: 21516 grad_norm: 2.8611 loss: 1.3850 caption_loss_cls: 2.3098 grounding_loss_reg: 2.8773 detection_loss_cls: 0.0383 detection_loss_reg: 0.3523 semantic_segmentation_loss_cls: 0.0099 instance_segmentation_loss_cls: 0.0399 instance_segmentation_loss_reg: 0.3564 instance_segmentation_loss_poly: 0.9338 +2023/11/02 16:24:23 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231101_204912 +2023/11/02 16:24:23 - mmengine - INFO - Iter(train) [282000/640000] base_lr: 1.1936e-04 lr: 1.2669e-05 eta: 4 days, 12:10:23 time: 1.1024 data_time: 0.0331 memory: 21516 grad_norm: 2.8280 loss: 1.3792 caption_loss_cls: 2.3079 grounding_loss_reg: 2.8770 detection_loss_cls: 0.0383 detection_loss_reg: 0.3523 semantic_segmentation_loss_cls: 0.0099 instance_segmentation_loss_cls: 0.0399 instance_segmentation_loss_reg: 0.3566 instance_segmentation_loss_poly: 0.9341 +2023/11/02 16:24:23 - mmengine - INFO - Saving checkpoint at 282000 iterations +2023/11/02 16:33:24 - mmengine - INFO - Iter(train) [282500/640000] base_lr: 1.1912e-04 lr: 1.2647e-05 eta: 4 days, 12:00:58 time: 1.0912 data_time: 0.0325 memory: 21516 grad_norm: 2.8526 loss: 1.3792 caption_loss_cls: 2.3113 grounding_loss_reg: 2.8766 detection_loss_cls: 0.0382 detection_loss_reg: 0.3521 semantic_segmentation_loss_cls: 0.0099 instance_segmentation_loss_cls: 0.0399 instance_segmentation_loss_reg: 0.3566 instance_segmentation_loss_poly: 0.9343 +2023/11/02 16:42:03 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231101_204912 +2023/11/02 16:42:03 - mmengine - INFO - Iter(train) [283000/640000] base_lr: 1.1888e-04 lr: 1.2626e-05 eta: 4 days, 11:49:35 time: 1.0855 data_time: 0.0322 memory: 21516 grad_norm: 2.8687 loss: 1.3771 caption_loss_cls: 2.3121 grounding_loss_reg: 2.8742 detection_loss_cls: 0.0381 detection_loss_reg: 0.3518 semantic_segmentation_loss_cls: 0.0099 instance_segmentation_loss_cls: 0.0398 instance_segmentation_loss_reg: 0.3556 instance_segmentation_loss_poly: 0.9329 +2023/11/02 16:42:03 - mmengine - INFO - Saving checkpoint at 283000 iterations +2023/11/02 16:51:14 - mmengine - INFO - Iter(train) [283500/640000] base_lr: 1.1864e-04 lr: 1.2604e-05 eta: 4 days, 11:41:10 time: 1.0841 data_time: 0.0323 memory: 21516 grad_norm: 2.9010 loss: 1.3807 caption_loss_cls: 2.3118 grounding_loss_reg: 2.8715 detection_loss_cls: 0.0381 detection_loss_reg: 0.3519 semantic_segmentation_loss_cls: 0.0099 instance_segmentation_loss_cls: 0.0397 instance_segmentation_loss_reg: 0.3549 instance_segmentation_loss_poly: 0.9309 +2023/11/02 17:00:36 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231101_204912 +2023/11/02 17:00:36 - mmengine - INFO - Iter(train) [284000/640000] base_lr: 1.1840e-04 lr: 1.2582e-05 eta: 4 days, 11:33:48 time: 1.0905 data_time: 0.0325 memory: 21516 grad_norm: 2.9023 loss: 1.3787 caption_loss_cls: 2.3141 grounding_loss_reg: 2.8704 detection_loss_cls: 0.0381 detection_loss_reg: 0.3513 semantic_segmentation_loss_cls: 0.0099 instance_segmentation_loss_cls: 0.0396 instance_segmentation_loss_reg: 0.3543 instance_segmentation_loss_poly: 0.9293 +2023/11/02 17:00:36 - mmengine - INFO - Saving checkpoint at 284000 iterations +2023/11/02 17:10:05 - mmengine - INFO - Iter(train) [284500/640000] base_lr: 1.1817e-04 lr: 1.2560e-05 eta: 4 days, 11:26:58 time: 1.0955 data_time: 0.0352 memory: 21516 grad_norm: 2.8814 loss: 1.3542 caption_loss_cls: 2.3104 grounding_loss_reg: 2.8695 detection_loss_cls: 0.0381 detection_loss_reg: 0.3506 semantic_segmentation_loss_cls: 0.0099 instance_segmentation_loss_cls: 0.0395 instance_segmentation_loss_reg: 0.3538 instance_segmentation_loss_poly: 0.9288 +2023/11/02 17:19:08 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231101_204912 +2023/11/02 17:19:08 - mmengine - INFO - Iter(train) [285000/640000] base_lr: 1.1793e-04 lr: 1.2539e-05 eta: 4 days, 11:17:47 time: 1.0901 data_time: 0.0352 memory: 21516 grad_norm: 2.8989 loss: 1.3559 caption_loss_cls: 2.3081 grounding_loss_reg: 2.8636 detection_loss_cls: 0.0380 detection_loss_reg: 0.3505 semantic_segmentation_loss_cls: 0.0099 instance_segmentation_loss_cls: 0.0394 instance_segmentation_loss_reg: 0.3529 instance_segmentation_loss_poly: 0.9255 +2023/11/02 17:19:08 - mmengine - INFO - Saving checkpoint at 285000 iterations +2023/11/02 17:28:29 - mmengine - INFO - Iter(train) [285500/640000] base_lr: 1.1769e-04 lr: 1.2517e-05 eta: 4 days, 11:10:16 time: 1.0878 data_time: 0.0350 memory: 21516 grad_norm: 2.8973 loss: 1.3551 caption_loss_cls: 2.3050 grounding_loss_reg: 2.8623 detection_loss_cls: 0.0380 detection_loss_reg: 0.3502 semantic_segmentation_loss_cls: 0.0099 instance_segmentation_loss_cls: 0.0393 instance_segmentation_loss_reg: 0.3529 instance_segmentation_loss_poly: 0.9248 +2023/11/02 17:37:26 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231101_204912 +2023/11/02 17:37:26 - mmengine - INFO - Iter(train) [286000/640000] base_lr: 1.1745e-04 lr: 1.2495e-05 eta: 4 days, 11:00:29 time: 1.0951 data_time: 0.0353 memory: 21516 grad_norm: 2.8861 loss: 1.3544 caption_loss_cls: 2.3084 grounding_loss_reg: 2.8621 detection_loss_cls: 0.0379 detection_loss_reg: 0.3489 semantic_segmentation_loss_cls: 0.0099 instance_segmentation_loss_cls: 0.0393 instance_segmentation_loss_reg: 0.3527 instance_segmentation_loss_poly: 0.9236 +2023/11/02 17:37:26 - mmengine - INFO - Saving checkpoint at 286000 iterations +2023/11/02 17:46:24 - mmengine - INFO - Iter(train) [286500/640000] base_lr: 1.1721e-04 lr: 1.2473e-05 eta: 4 days, 10:50:51 time: 1.0945 data_time: 0.0353 memory: 21516 grad_norm: 2.8765 loss: 1.3541 caption_loss_cls: 2.3093 grounding_loss_reg: 2.8620 detection_loss_cls: 0.0379 detection_loss_reg: 0.3491 semantic_segmentation_loss_cls: 0.0099 instance_segmentation_loss_cls: 0.0392 instance_segmentation_loss_reg: 0.3525 instance_segmentation_loss_poly: 0.9238 +2023/11/02 17:55:22 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231101_204912 +2023/11/02 17:55:22 - mmengine - INFO - Iter(train) [287000/640000] base_lr: 1.1697e-04 lr: 1.2452e-05 eta: 4 days, 10:41:15 time: 1.0991 data_time: 0.0353 memory: 21516 grad_norm: 2.8537 loss: 1.3492 caption_loss_cls: 2.3083 grounding_loss_reg: 2.8614 detection_loss_cls: 0.0379 detection_loss_reg: 0.3491 semantic_segmentation_loss_cls: 0.0099 instance_segmentation_loss_cls: 0.0392 instance_segmentation_loss_reg: 0.3522 instance_segmentation_loss_poly: 0.9229 +2023/11/02 17:55:22 - mmengine - INFO - Saving checkpoint at 287000 iterations +2023/11/02 18:04:18 - mmengine - INFO - Iter(train) [287500/640000] base_lr: 1.1673e-04 lr: 1.2430e-05 eta: 4 days, 10:31:28 time: 1.0955 data_time: 0.0352 memory: 21516 grad_norm: 2.8348 loss: 1.3452 caption_loss_cls: 2.3074 grounding_loss_reg: 2.8601 detection_loss_cls: 0.0379 detection_loss_reg: 0.3493 semantic_segmentation_loss_cls: 0.0099 instance_segmentation_loss_cls: 0.0392 instance_segmentation_loss_reg: 0.3529 instance_segmentation_loss_poly: 0.9235 +2023/11/02 18:13:35 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231101_204912 +2023/11/02 18:13:35 - mmengine - INFO - Iter(train) [288000/640000] base_lr: 1.1649e-04 lr: 1.2408e-05 eta: 4 days, 10:23:28 time: 1.0940 data_time: 0.0352 memory: 21516 grad_norm: 2.8243 loss: 1.3369 caption_loss_cls: 2.3078 grounding_loss_reg: 2.8569 detection_loss_cls: 0.0378 detection_loss_reg: 0.3485 semantic_segmentation_loss_cls: 0.0099 instance_segmentation_loss_cls: 0.0391 instance_segmentation_loss_reg: 0.3531 instance_segmentation_loss_poly: 0.9227 +2023/11/02 18:13:35 - mmengine - INFO - Saving checkpoint at 288000 iterations +2023/11/02 18:22:50 - mmengine - INFO - Iter(train) [288500/640000] base_lr: 1.1625e-04 lr: 1.2386e-05 eta: 4 days, 10:15:19 time: 1.0907 data_time: 0.0353 memory: 21516 grad_norm: 2.8671 loss: 1.3583 caption_loss_cls: 2.3081 grounding_loss_reg: 2.8543 detection_loss_cls: 0.0379 detection_loss_reg: 0.3495 semantic_segmentation_loss_cls: 0.0099 instance_segmentation_loss_cls: 0.0393 instance_segmentation_loss_reg: 0.3541 instance_segmentation_loss_poly: 0.9237 +2023/11/02 18:32:04 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231101_204912 +2023/11/02 18:32:04 - mmengine - INFO - Iter(train) [289000/640000] base_lr: 1.1601e-04 lr: 1.2364e-05 eta: 4 days, 10:07:04 time: 1.0935 data_time: 0.0353 memory: 21516 grad_norm: 2.8337 loss: 1.3526 caption_loss_cls: 2.3083 grounding_loss_reg: 2.8537 detection_loss_cls: 0.0379 detection_loss_reg: 0.3499 semantic_segmentation_loss_cls: 0.0099 instance_segmentation_loss_cls: 0.0393 instance_segmentation_loss_reg: 0.3540 instance_segmentation_loss_poly: 0.9229 +2023/11/02 18:32:04 - mmengine - INFO - Saving checkpoint at 289000 iterations +2023/11/02 18:41:17 - mmengine - INFO - Iter(train) [289500/640000] base_lr: 1.1577e-04 lr: 1.2342e-05 eta: 4 days, 9:58:42 time: 1.0913 data_time: 0.0352 memory: 21516 grad_norm: 2.8486 loss: 1.3564 caption_loss_cls: 2.3037 grounding_loss_reg: 2.8549 detection_loss_cls: 0.0380 detection_loss_reg: 0.3509 semantic_segmentation_loss_cls: 0.0099 instance_segmentation_loss_cls: 0.0393 instance_segmentation_loss_reg: 0.3539 instance_segmentation_loss_poly: 0.9232 +2023/11/02 18:50:40 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231101_204912 +2023/11/02 18:50:40 - mmengine - INFO - Iter(train) [290000/640000] base_lr: 1.1553e-04 lr: 1.2321e-05 eta: 4 days, 9:51:10 time: 1.0979 data_time: 0.0355 memory: 21516 grad_norm: 2.8502 loss: 1.3633 caption_loss_cls: 2.3024 grounding_loss_reg: 2.8541 detection_loss_cls: 0.0380 detection_loss_reg: 0.3505 semantic_segmentation_loss_cls: 0.0099 instance_segmentation_loss_cls: 0.0394 instance_segmentation_loss_reg: 0.3541 instance_segmentation_loss_poly: 0.9234 +2023/11/02 18:50:40 - mmengine - INFO - Saving checkpoint at 290000 iterations +2023/11/02 18:59:27 - mmengine - INFO - Iter(train) [290500/640000] base_lr: 1.1529e-04 lr: 1.2299e-05 eta: 4 days, 9:40:37 time: 1.0951 data_time: 0.0353 memory: 21516 grad_norm: 2.8813 loss: 1.3624 caption_loss_cls: 2.3043 grounding_loss_reg: 2.8537 detection_loss_cls: 0.0381 detection_loss_reg: 0.3510 semantic_segmentation_loss_cls: 0.0098 instance_segmentation_loss_cls: 0.0393 instance_segmentation_loss_reg: 0.3536 instance_segmentation_loss_poly: 0.9223 +2023/11/02 19:08:38 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231101_204912 +2023/11/02 19:08:38 - mmengine - INFO - Iter(train) [291000/640000] base_lr: 1.1505e-04 lr: 1.2277e-05 eta: 4 days, 9:32:08 time: 1.0985 data_time: 0.0355 memory: 21516 grad_norm: 2.9073 loss: 1.3705 caption_loss_cls: 2.3071 grounding_loss_reg: 2.8531 detection_loss_cls: 0.0380 detection_loss_reg: 0.3509 semantic_segmentation_loss_cls: 0.0098 instance_segmentation_loss_cls: 0.0393 instance_segmentation_loss_reg: 0.3527 instance_segmentation_loss_poly: 0.9210 +2023/11/02 19:08:38 - mmengine - INFO - Saving checkpoint at 291000 iterations +2023/11/02 19:17:40 - mmengine - INFO - Iter(train) [291500/640000] base_lr: 1.1481e-04 lr: 1.2255e-05 eta: 4 days, 9:22:49 time: 1.0998 data_time: 0.0353 memory: 21516 grad_norm: 2.8936 loss: 1.3586 caption_loss_cls: 2.3065 grounding_loss_reg: 2.8529 detection_loss_cls: 0.0381 detection_loss_reg: 0.3508 semantic_segmentation_loss_cls: 0.0098 instance_segmentation_loss_cls: 0.0393 instance_segmentation_loss_reg: 0.3522 instance_segmentation_loss_poly: 0.9192 +2023/11/02 19:26:28 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231101_204912 +2023/11/02 19:26:28 - mmengine - INFO - Iter(train) [292000/640000] base_lr: 1.1456e-04 lr: 1.2233e-05 eta: 4 days, 9:12:25 time: 1.0927 data_time: 0.0351 memory: 21516 grad_norm: 2.9113 loss: 1.3645 caption_loss_cls: 2.3030 grounding_loss_reg: 2.8526 detection_loss_cls: 0.0379 detection_loss_reg: 0.3486 semantic_segmentation_loss_cls: 0.0098 instance_segmentation_loss_cls: 0.0394 instance_segmentation_loss_reg: 0.3529 instance_segmentation_loss_poly: 0.9201 +2023/11/02 19:26:28 - mmengine - INFO - Saving checkpoint at 292000 iterations +2023/11/02 19:35:46 - mmengine - INFO - Iter(train) [292500/640000] base_lr: 1.1432e-04 lr: 1.2211e-05 eta: 4 days, 9:04:27 time: 1.0935 data_time: 0.0353 memory: 21516 grad_norm: 2.9000 loss: 1.3595 caption_loss_cls: 2.2999 grounding_loss_reg: 2.8535 detection_loss_cls: 0.0379 detection_loss_reg: 0.3484 semantic_segmentation_loss_cls: 0.0098 instance_segmentation_loss_cls: 0.0396 instance_segmentation_loss_reg: 0.3542 instance_segmentation_loss_poly: 0.9214 +2023/11/02 19:45:07 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231101_204912 +2023/11/02 19:45:07 - mmengine - INFO - Iter(train) [293000/640000] base_lr: 1.1408e-04 lr: 1.2189e-05 eta: 4 days, 8:56:43 time: 1.0953 data_time: 0.0362 memory: 21516 grad_norm: 2.9203 loss: 1.3639 caption_loss_cls: 2.3009 grounding_loss_reg: 2.8545 detection_loss_cls: 0.0380 detection_loss_reg: 0.3490 semantic_segmentation_loss_cls: 0.0098 instance_segmentation_loss_cls: 0.0394 instance_segmentation_loss_reg: 0.3523 instance_segmentation_loss_poly: 0.9178 +2023/11/02 19:45:07 - mmengine - INFO - Saving checkpoint at 293000 iterations +2023/11/02 19:54:25 - mmengine - INFO - Iter(train) [293500/640000] base_lr: 1.1384e-04 lr: 1.2167e-05 eta: 4 days, 8:48:38 time: 1.0965 data_time: 0.0361 memory: 21516 grad_norm: 2.9023 loss: 1.3530 caption_loss_cls: 2.2954 grounding_loss_reg: 2.8528 detection_loss_cls: 0.0383 detection_loss_reg: 0.3507 semantic_segmentation_loss_cls: 0.0098 instance_segmentation_loss_cls: 0.0393 instance_segmentation_loss_reg: 0.3518 instance_segmentation_loss_poly: 0.9173 +2023/11/02 20:03:27 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231101_204912 +2023/11/02 20:03:27 - mmengine - INFO - Iter(train) [294000/640000] base_lr: 1.1360e-04 lr: 1.2146e-05 eta: 4 days, 8:39:21 time: 1.0912 data_time: 0.0360 memory: 21516 grad_norm: 2.9237 loss: 1.3468 caption_loss_cls: 2.2897 grounding_loss_reg: 2.8492 detection_loss_cls: 0.0380 detection_loss_reg: 0.3487 semantic_segmentation_loss_cls: 0.0098 instance_segmentation_loss_cls: 0.0393 instance_segmentation_loss_reg: 0.3520 instance_segmentation_loss_poly: 0.9177 +2023/11/02 20:03:27 - mmengine - INFO - Saving checkpoint at 294000 iterations +2023/11/02 20:12:33 - mmengine - INFO - Iter(train) [294500/640000] base_lr: 1.1336e-04 lr: 1.2124e-05 eta: 4 days, 8:30:22 time: 1.0960 data_time: 0.0365 memory: 21516 grad_norm: 2.9374 loss: 1.3472 caption_loss_cls: 2.2878 grounding_loss_reg: 2.8498 detection_loss_cls: 0.0379 detection_loss_reg: 0.3476 semantic_segmentation_loss_cls: 0.0098 instance_segmentation_loss_cls: 0.0393 instance_segmentation_loss_reg: 0.3528 instance_segmentation_loss_poly: 0.9181 +2023/11/02 20:21:45 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231101_204912 +2023/11/02 20:21:45 - mmengine - INFO - Iter(train) [295000/640000] base_lr: 1.1312e-04 lr: 1.2102e-05 eta: 4 days, 8:21:51 time: 1.0961 data_time: 0.0364 memory: 21516 grad_norm: 2.9337 loss: 1.3392 caption_loss_cls: 2.2862 grounding_loss_reg: 2.8484 detection_loss_cls: 0.0380 detection_loss_reg: 0.3490 semantic_segmentation_loss_cls: 0.0098 instance_segmentation_loss_cls: 0.0393 instance_segmentation_loss_reg: 0.3521 instance_segmentation_loss_poly: 0.9172 +2023/11/02 20:21:45 - mmengine - INFO - Saving checkpoint at 295000 iterations +2023/11/02 20:30:53 - mmengine - INFO - Iter(train) [295500/640000] base_lr: 1.1288e-04 lr: 1.2080e-05 eta: 4 days, 8:13:02 time: 1.0977 data_time: 0.0366 memory: 21516 grad_norm: 2.9503 loss: 1.3439 caption_loss_cls: 2.2817 grounding_loss_reg: 2.8445 detection_loss_cls: 0.0381 detection_loss_reg: 0.3497 semantic_segmentation_loss_cls: 0.0098 instance_segmentation_loss_cls: 0.0393 instance_segmentation_loss_reg: 0.3530 instance_segmentation_loss_poly: 0.9187 +2023/11/02 20:39:44 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231101_204912 +2023/11/02 20:39:44 - mmengine - INFO - Iter(train) [296000/640000] base_lr: 1.1264e-04 lr: 1.2058e-05 eta: 4 days, 8:02:54 time: 1.0984 data_time: 0.0366 memory: 21516 grad_norm: 2.9658 loss: 1.3442 caption_loss_cls: 2.2849 grounding_loss_reg: 2.8400 detection_loss_cls: 0.0379 detection_loss_reg: 0.3487 semantic_segmentation_loss_cls: 0.0098 instance_segmentation_loss_cls: 0.0393 instance_segmentation_loss_reg: 0.3527 instance_segmentation_loss_poly: 0.9187 +2023/11/02 20:39:44 - mmengine - INFO - Saving checkpoint at 296000 iterations +2023/11/03 07:21:33 - mmengine - INFO - Iter(train) [296500/640000] base_lr: 1.1240e-04 lr: 1.2036e-05 eta: 4 days, 11:24:51 time: 1.0996 data_time: 0.0329 memory: 21520 grad_norm: 2.9586 loss: 1.3286 caption_loss_cls: 2.2822 grounding_loss_reg: 2.8370 detection_loss_cls: 0.0379 detection_loss_reg: 0.3496 semantic_segmentation_loss_cls: 0.0098 instance_segmentation_loss_cls: 0.0392 instance_segmentation_loss_reg: 0.3524 instance_segmentation_loss_poly: 0.9184 +2023/11/03 07:30:44 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231103_070902 +2023/11/03 07:30:44 - mmengine - INFO - Iter(train) [297000/640000] base_lr: 1.1215e-04 lr: 1.2014e-05 eta: 4 days, 10:05:53 time: 1.0970 data_time: 0.0316 memory: 21520 grad_norm: 2.9894 loss: 1.3311 caption_loss_cls: 2.2816 grounding_loss_reg: 2.8365 detection_loss_cls: 0.0379 detection_loss_reg: 0.3507 semantic_segmentation_loss_cls: 0.0098 instance_segmentation_loss_cls: 0.0391 instance_segmentation_loss_reg: 0.3519 instance_segmentation_loss_poly: 0.9173 +2023/11/03 07:30:44 - mmengine - INFO - Saving checkpoint at 297000 iterations +2023/11/03 07:40:11 - mmengine - INFO - Iter(train) [297500/640000] base_lr: 1.1191e-04 lr: 1.1992e-05 eta: 4 days, 10:34:04 time: 1.0994 data_time: 0.0315 memory: 21520 grad_norm: 3.0085 loss: 1.3330 caption_loss_cls: 2.2784 grounding_loss_reg: 2.8342 detection_loss_cls: 0.0378 detection_loss_reg: 0.3504 semantic_segmentation_loss_cls: 0.0098 instance_segmentation_loss_cls: 0.0390 instance_segmentation_loss_reg: 0.3522 instance_segmentation_loss_poly: 0.9176 +2023/11/03 07:48:58 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231103_070902 +2023/11/03 07:48:58 - mmengine - INFO - Iter(train) [298000/640000] base_lr: 1.1167e-04 lr: 1.1970e-05 eta: 4 days, 8:50:56 time: 1.0958 data_time: 0.0310 memory: 21520 grad_norm: 3.0112 loss: 1.3340 caption_loss_cls: 2.2770 grounding_loss_reg: 2.8297 detection_loss_cls: 0.0378 detection_loss_reg: 0.3498 semantic_segmentation_loss_cls: 0.0098 instance_segmentation_loss_cls: 0.0389 instance_segmentation_loss_reg: 0.3512 instance_segmentation_loss_poly: 0.9165 +2023/11/03 07:48:58 - mmengine - INFO - Saving checkpoint at 298000 iterations +2023/11/03 07:58:30 - mmengine - INFO - Iter(train) [298500/640000] base_lr: 1.1143e-04 lr: 1.1948e-05 eta: 4 days, 9:27:42 time: 1.1023 data_time: 0.0307 memory: 21520 grad_norm: 2.9668 loss: 1.3233 caption_loss_cls: 2.2729 grounding_loss_reg: 2.8296 detection_loss_cls: 0.0378 detection_loss_reg: 0.3498 semantic_segmentation_loss_cls: 0.0098 instance_segmentation_loss_cls: 0.0387 instance_segmentation_loss_reg: 0.3500 instance_segmentation_loss_poly: 0.9135 +2023/11/03 08:07:56 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231103_070902 +2023/11/03 08:07:56 - mmengine - INFO - Iter(train) [299000/640000] base_lr: 1.1119e-04 lr: 1.1926e-05 eta: 4 days, 9:37:04 time: 1.1059 data_time: 0.0306 memory: 21520 grad_norm: 2.9771 loss: 1.3251 caption_loss_cls: 2.2723 grounding_loss_reg: 2.8304 detection_loss_cls: 0.0376 detection_loss_reg: 0.3477 semantic_segmentation_loss_cls: 0.0098 instance_segmentation_loss_cls: 0.0384 instance_segmentation_loss_reg: 0.3489 instance_segmentation_loss_poly: 0.9127 +2023/11/03 08:07:56 - mmengine - INFO - Saving checkpoint at 299000 iterations +2023/11/03 08:17:44 - mmengine - INFO - Iter(train) [299500/640000] base_lr: 1.1095e-04 lr: 1.1904e-05 eta: 4 days, 10:16:49 time: 1.1158 data_time: 0.0304 memory: 21520 grad_norm: 2.9306 loss: 1.3118 caption_loss_cls: 2.2662 grounding_loss_reg: 2.8288 detection_loss_cls: 0.0376 detection_loss_reg: 0.3469 semantic_segmentation_loss_cls: 0.0098 instance_segmentation_loss_cls: 0.0382 instance_segmentation_loss_reg: 0.3478 instance_segmentation_loss_poly: 0.9107 +2023/11/03 08:27:13 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231103_070902 +2023/11/03 08:27:13 - mmengine - INFO - Iter(train) [300000/640000] base_lr: 1.1070e-04 lr: 1.1882e-05 eta: 4 days, 10:16:04 time: 1.1252 data_time: 0.0314 memory: 21520 grad_norm: 2.9271 loss: 1.3136 caption_loss_cls: 2.2619 grounding_loss_reg: 2.8260 detection_loss_cls: 0.0376 detection_loss_reg: 0.3473 semantic_segmentation_loss_cls: 0.0098 instance_segmentation_loss_cls: 0.0382 instance_segmentation_loss_reg: 0.3487 instance_segmentation_loss_poly: 0.9116 +2023/11/03 08:27:13 - mmengine - INFO - Saving checkpoint at 300000 iterations +2023/11/03 08:35:50 - mmengine - INFO - Evaluating bbox... +2023/11/03 08:36:46 - mmengine - INFO - bbox_mAP_copypaste: 0.416 0.587 0.450 0.246 0.465 0.563 +2023/11/03 08:36:46 - mmengine - INFO - Evaluating segm... +2023/11/03 08:37:59 - mmengine - INFO - segm_mAP_copypaste: 0.272 0.493 0.266 0.126 0.310 0.428 +2023/11/03 08:43:07 - mmengine - INFO - per class results: +2023/11/03 08:43:07 - mmengine - INFO - ++---------------------+-------+-------+ +| Class | IoU | Acc | ++---------------------+-------+-------+ +| wall | 74.13 | 87.26 | +| building | 80.4 | 90.81 | +| sky | 92.24 | 96.7 | +| floor | 78.77 | 87.28 | +| tree | 72.4 | 85.73 | +| ceiling | 81.63 | 92.75 | +| road | 80.76 | 86.46 | +| bed | 86.21 | 94.13 | +| windowpane | 58.47 | 72.89 | +| grass | 69.72 | 88.33 | +| cabinet | 55.4 | 65.27 | +| sidewalk | 63.83 | 78.79 | +| person | 76.9 | 91.59 | +| earth | 31.63 | 43.18 | +| door | 49.76 | 70.83 | +| table | 57.31 | 74.55 | +| mountain | 50.53 | 57.32 | +| plant | 51.88 | 63.77 | +| curtain | 70.43 | 78.7 | +| chair | 54.02 | 69.94 | +| car | 80.33 | 89.35 | +| water | 37.09 | 42.08 | +| painting | 68.49 | 83.26 | +| sofa | 55.16 | 64.91 | +| shelf | 37.4 | 51.51 | +| house | 38.33 | 53.63 | +| sea | 49.43 | 80.56 | +| mirror | 61.65 | 68.45 | +| rug | 62.37 | 74.03 | +| field | 37.8 | 45.81 | +| armchair | 39.19 | 68.26 | +| seat | 59.65 | 78.71 | +| fence | 39.25 | 56.86 | +| desk | 43.08 | 55.67 | +| rock | 39.89 | 69.98 | +| wardrobe | 45.72 | 58.19 | +| lamp | 55.65 | 75.4 | +| bathtub | 72.21 | 89.44 | +| railing | 26.28 | 38.69 | +| cushion | 49.77 | 61.6 | +| base | 25.51 | 42.06 | +| box | 19.23 | 23.55 | +| column | 40.66 | 48.68 | +| signboard | 37.08 | 50.98 | +| chest of drawers | 37.47 | 61.09 | +| counter | 30.53 | 39.74 | +| sand | 29.9 | 75.94 | +| sink | 65.34 | 75.45 | +| skyscraper | 50.23 | 55.66 | +| fireplace | 66.28 | 88.05 | +| refrigerator | 65.8 | 83.88 | +| grandstand | 34.15 | 61.3 | +| path | 22.47 | 29.4 | +| stairs | 27.01 | 35.61 | +| runway | 64.7 | 81.25 | +| case | 35.53 | 60.42 | +| pool table | 87.27 | 97.07 | +| pillow | 53.35 | 74.93 | +| screen door | 52.52 | 66.24 | +| stairway | 30.95 | 43.15 | +| river | 26.17 | 68.16 | +| bridge | 43.28 | 88.24 | +| bookcase | 31.61 | 52.79 | +| blind | 26.03 | 32.43 | +| coffee table | 56.93 | 86.42 | +| toilet | 80.96 | 88.3 | +| flower | 29.34 | 41.22 | +| book | 44.92 | 64.08 | +| hill | 9.15 | 15.56 | +| bench | 43.39 | 51.36 | +| countertop | 48.91 | 64.14 | +| stove | 60.47 | 83.77 | +| palm | 35.28 | 42.11 | +| kitchen island | 39.31 | 81.47 | +| computer | 61.36 | 69.39 | +| swivel chair | 38.29 | 54.54 | +| boat | 67.49 | 86.31 | +| bar | 47.09 | 66.39 | +| arcade machine | 42.1 | 60.43 | +| hovel | 15.05 | 18.75 | +| bus | 80.21 | 96.47 | +| towel | 59.14 | 66.18 | +| light | 45.68 | 55.14 | +| truck | 26.09 | 35.51 | +| tower | 37.12 | 60.18 | +| chandelier | 60.83 | 78.29 | +| awning | 34.49 | 56.33 | +| streetlight | 25.76 | 33.28 | +| booth | 54.93 | 58.85 | +| television receiver | 68.29 | 81.73 | +| airplane | 47.97 | 66.44 | +| dirt track | 0.0 | 0.0 | +| apparel | 36.85 | 46.53 | +| pole | 22.92 | 32.32 | +| land | 2.49 | 4.81 | +| bannister | 13.35 | 17.6 | +| escalator | 9.2 | 9.84 | +| ottoman | 45.16 | 66.13 | +| bottle | 25.51 | 30.64 | +| buffet | 44.22 | 51.45 | +| poster | 19.4 | 24.52 | +| stage | 14.52 | 27.59 | +| van | 28.81 | 42.92 | +| ship | 33.4 | 38.21 | +| fountain | 13.39 | 14.81 | +| conveyer belt | 53.96 | 88.9 | +| canopy | 33.97 | 48.84 | +| washer | 72.83 | 81.96 | +| plaything | 20.47 | 26.16 | +| swimming pool | 57.76 | 74.97 | +| stool | 36.5 | 46.57 | +| barrel | 37.17 | 80.79 | +| basket | 24.41 | 38.54 | +| waterfall | 61.78 | 79.38 | +| tent | 69.11 | 98.36 | +| bag | 4.08 | 4.16 | +| minibike | 68.18 | 80.07 | +| cradle | 71.15 | 96.42 | +| oven | 20.6 | 29.77 | +| ball | 34.25 | 45.3 | +| food | 47.62 | 50.91 | +| step | 11.92 | 14.48 | +| tank | 40.31 | 50.82 | +| trade name | 23.31 | 26.86 | +| microwave | 62.57 | 64.95 | +| pot | 39.08 | 44.4 | +| animal | 65.67 | 69.84 | +| bicycle | 52.88 | 73.23 | +| lake | 25.37 | 68.9 | +| dishwasher | 51.24 | 73.73 | +| screen | 52.14 | 85.82 | +| blanket | 6.77 | 7.83 | +| sculpture | 47.6 | 64.71 | +| hood | 47.23 | 61.68 | +| sconce | 29.24 | 35.26 | +| vase | 35.0 | 43.88 | +| traffic light | 35.05 | 50.45 | +| tray | 10.16 | 17.52 | +| ashcan | 37.46 | 55.02 | +| fan | 50.8 | 63.5 | +| pier | 56.22 | 70.1 | +| crt screen | 7.22 | 18.54 | +| plate | 50.87 | 70.98 | +| monitor | 6.31 | 9.25 | +| bulletin board | 15.22 | 16.76 | +| shower | 7.61 | 16.47 | +| radiator | 48.29 | 52.7 | +| glass | 13.86 | 14.76 | +| clock | 20.17 | 29.43 | +| flag | 31.73 | 39.92 | ++---------------------+-------+-------+ +2023/11/03 08:43:24 - mmengine - INFO - Iter(val) [209/209] coco/bbox_mAP: 0.4160 coco/bbox_mAP_50: 0.5870 coco/bbox_mAP_75: 0.4500 coco/bbox_mAP_s: 0.2460 coco/bbox_mAP_m: 0.4650 coco/bbox_mAP_l: 0.5630 coco/segm_mAP: 0.2720 coco/segm_mAP_50: 0.4930 coco/segm_mAP_75: 0.2660 coco/segm_mAP_s: 0.1260 coco/segm_mAP_m: 0.3100 coco/segm_mAP_l: 0.4280 Bleu_1: 0.7219 Bleu_2: 0.5490 Bleu_3: 0.4067 Bleu_4: 0.2986 METEOR: 0.2505 ROUGE_L: 0.5286 CIDEr: 0.9505 SPICE: 0.1829 aAcc: 80.7000 mIoU: 44.0200 mAcc: 57.8100 visual-grounding/miou: 0.7490 visual-grounding/acc: 0.8280 data_time: 0.0108 time: 0.5323 +2023/11/03 08:52:44 - mmengine - INFO - Iter(train) [300500/640000] base_lr: 1.1046e-04 lr: 1.1860e-05 eta: 4 days, 10:06:06 time: 1.1250 data_time: 0.0320 memory: 21521 grad_norm: 2.9312 loss: 1.3251 caption_loss_cls: 2.2587 grounding_loss_reg: 2.8236 detection_loss_cls: 0.0376 detection_loss_reg: 0.3471 semantic_segmentation_loss_cls: 0.0097 instance_segmentation_loss_cls: 0.0382 instance_segmentation_loss_reg: 0.3484 instance_segmentation_loss_poly: 0.9115 +2023/11/03 09:00:50 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231103_070902 +2023/11/03 09:00:50 - mmengine - INFO - Iter(train) [301000/640000] base_lr: 1.1022e-04 lr: 1.1838e-05 eta: 4 days, 8:29:26 time: 1.1087 data_time: 0.0318 memory: 21521 grad_norm: 2.9829 loss: 1.3416 caption_loss_cls: 2.2580 grounding_loss_reg: 2.8195 detection_loss_cls: 0.0375 detection_loss_reg: 0.3469 semantic_segmentation_loss_cls: 0.0097 instance_segmentation_loss_cls: 0.0381 instance_segmentation_loss_reg: 0.3487 instance_segmentation_loss_poly: 0.9129 +2023/11/03 09:00:50 - mmengine - INFO - Saving checkpoint at 301000 iterations +2023/11/03 09:10:26 - mmengine - INFO - Iter(train) [301500/640000] base_lr: 1.0998e-04 lr: 1.1816e-05 eta: 4 days, 8:41:21 time: 1.1109 data_time: 0.0318 memory: 21521 grad_norm: 2.9983 loss: 1.3439 caption_loss_cls: 2.2573 grounding_loss_reg: 2.8176 detection_loss_cls: 0.0374 detection_loss_reg: 0.3464 semantic_segmentation_loss_cls: 0.0097 instance_segmentation_loss_cls: 0.0380 instance_segmentation_loss_reg: 0.3479 instance_segmentation_loss_poly: 0.9114 +2023/11/03 09:20:01 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231103_070902 +2023/11/03 09:20:01 - mmengine - INFO - Iter(train) [302000/640000] base_lr: 1.0974e-04 lr: 1.1794e-05 eta: 4 days, 8:49:01 time: 1.1228 data_time: 0.0320 memory: 21521 grad_norm: 2.9572 loss: 1.3257 caption_loss_cls: 2.2567 grounding_loss_reg: 2.8171 detection_loss_cls: 0.0373 detection_loss_reg: 0.3458 semantic_segmentation_loss_cls: 0.0097 instance_segmentation_loss_cls: 0.0380 instance_segmentation_loss_reg: 0.3477 instance_segmentation_loss_poly: 0.9106 +2023/11/03 09:20:01 - mmengine - INFO - Saving checkpoint at 302000 iterations +2023/11/03 09:29:39 - mmengine - INFO - Iter(train) [302500/640000] base_lr: 1.0949e-04 lr: 1.1772e-05 eta: 4 days, 8:56:59 time: 1.1243 data_time: 0.0324 memory: 21521 grad_norm: 3.0090 loss: 1.3431 caption_loss_cls: 2.2578 grounding_loss_reg: 2.8134 detection_loss_cls: 0.0373 detection_loss_reg: 0.3463 semantic_segmentation_loss_cls: 0.0097 instance_segmentation_loss_cls: 0.0380 instance_segmentation_loss_reg: 0.3490 instance_segmentation_loss_poly: 0.9130 +2023/11/03 09:38:45 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231103_070902 +2023/11/03 09:38:45 - mmengine - INFO - Iter(train) [303000/640000] base_lr: 1.0925e-04 lr: 1.1750e-05 eta: 4 days, 8:36:04 time: 1.1192 data_time: 0.0325 memory: 21521 grad_norm: 3.0137 loss: 1.3451 caption_loss_cls: 2.2578 grounding_loss_reg: 2.8120 detection_loss_cls: 0.0373 detection_loss_reg: 0.3467 semantic_segmentation_loss_cls: 0.0097 instance_segmentation_loss_cls: 0.0380 instance_segmentation_loss_reg: 0.3491 instance_segmentation_loss_poly: 0.9138 +2023/11/03 09:38:45 - mmengine - INFO - Saving checkpoint at 303000 iterations +2023/11/03 09:47:21 - mmengine - INFO - Iter(train) [303500/640000] base_lr: 1.0901e-04 lr: 1.1728e-05 eta: 4 days, 7:54:48 time: 1.1012 data_time: 0.0321 memory: 21521 grad_norm: 3.0927 loss: 1.3625 caption_loss_cls: 2.2538 grounding_loss_reg: 2.8128 detection_loss_cls: 0.0373 detection_loss_reg: 0.3468 semantic_segmentation_loss_cls: 0.0097 instance_segmentation_loss_cls: 0.0379 instance_segmentation_loss_reg: 0.3488 instance_segmentation_loss_poly: 0.9132 +2023/11/03 09:56:02 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231103_070902 +2023/11/03 09:56:02 - mmengine - INFO - Iter(train) [304000/640000] base_lr: 1.0877e-04 lr: 1.1706e-05 eta: 4 days, 7:21:01 time: 1.0895 data_time: 0.0310 memory: 21521 grad_norm: 3.1250 loss: 1.3717 caption_loss_cls: 2.2497 grounding_loss_reg: 2.8107 detection_loss_cls: 0.0376 detection_loss_reg: 0.3481 semantic_segmentation_loss_cls: 0.0096 instance_segmentation_loss_cls: 0.0378 instance_segmentation_loss_reg: 0.3488 instance_segmentation_loss_poly: 0.9139 +2023/11/03 09:56:02 - mmengine - INFO - Saving checkpoint at 304000 iterations +2023/11/03 10:04:55 - mmengine - INFO - Iter(train) [304500/640000] base_lr: 1.0853e-04 lr: 1.1684e-05 eta: 4 days, 6:57:59 time: 1.0821 data_time: 0.0337 memory: 21521 grad_norm: 3.1541 loss: 1.3795 caption_loss_cls: 2.2460 grounding_loss_reg: 2.8100 detection_loss_cls: 0.0376 detection_loss_reg: 0.3485 semantic_segmentation_loss_cls: 0.0097 instance_segmentation_loss_cls: 0.0378 instance_segmentation_loss_reg: 0.3495 instance_segmentation_loss_poly: 0.9154 +2023/11/03 10:14:08 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231103_070902 +2023/11/03 10:14:08 - mmengine - INFO - Iter(train) [305000/640000] base_lr: 1.0828e-04 lr: 1.1662e-05 eta: 4 days, 6:48:45 time: 1.0989 data_time: 0.0343 memory: 21521 grad_norm: 3.0921 loss: 1.3635 caption_loss_cls: 2.2453 grounding_loss_reg: 2.8105 detection_loss_cls: 0.0375 detection_loss_reg: 0.3482 semantic_segmentation_loss_cls: 0.0097 instance_segmentation_loss_cls: 0.0377 instance_segmentation_loss_reg: 0.3495 instance_segmentation_loss_poly: 0.9164 +2023/11/03 10:14:08 - mmengine - INFO - Saving checkpoint at 305000 iterations +2023/11/03 10:23:19 - mmengine - INFO - Iter(train) [305500/640000] base_lr: 1.0804e-04 lr: 1.1640e-05 eta: 4 days, 6:38:51 time: 1.0928 data_time: 0.0343 memory: 21521 grad_norm: 3.1010 loss: 1.3704 caption_loss_cls: 2.2442 grounding_loss_reg: 2.8088 detection_loss_cls: 0.0376 detection_loss_reg: 0.3488 semantic_segmentation_loss_cls: 0.0097 instance_segmentation_loss_cls: 0.0377 instance_segmentation_loss_reg: 0.3499 instance_segmentation_loss_poly: 0.9178 +2023/11/03 10:32:16 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231103_070902 +2023/11/03 10:32:16 - mmengine - INFO - Iter(train) [306000/640000] base_lr: 1.0780e-04 lr: 1.1618e-05 eta: 4 days, 6:20:59 time: 1.0833 data_time: 0.0343 memory: 21521 grad_norm: 3.1893 loss: 1.3971 caption_loss_cls: 2.2391 grounding_loss_reg: 2.8075 detection_loss_cls: 0.0377 detection_loss_reg: 0.3493 semantic_segmentation_loss_cls: 0.0096 instance_segmentation_loss_cls: 0.0377 instance_segmentation_loss_reg: 0.3497 instance_segmentation_loss_poly: 0.9180 +2023/11/03 10:32:16 - mmengine - INFO - Saving checkpoint at 306000 iterations +2023/11/03 10:41:46 - mmengine - INFO - Iter(train) [306500/640000] base_lr: 1.0756e-04 lr: 1.1596e-05 eta: 4 days, 6:21:14 time: 1.0812 data_time: 0.0342 memory: 21521 grad_norm: 3.2014 loss: 1.3945 caption_loss_cls: 2.2341 grounding_loss_reg: 2.8071 detection_loss_cls: 0.0376 detection_loss_reg: 0.3493 semantic_segmentation_loss_cls: 0.0096 instance_segmentation_loss_cls: 0.0376 instance_segmentation_loss_reg: 0.3489 instance_segmentation_loss_poly: 0.9163 +2023/11/03 10:50:28 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231103_070902 +2023/11/03 10:50:28 - mmengine - INFO - Iter(train) [307000/640000] base_lr: 1.0731e-04 lr: 1.1574e-05 eta: 4 days, 5:56:50 time: 1.0754 data_time: 0.0340 memory: 21521 grad_norm: 3.2117 loss: 1.3969 caption_loss_cls: 2.2345 grounding_loss_reg: 2.8061 detection_loss_cls: 0.0375 detection_loss_reg: 0.3486 semantic_segmentation_loss_cls: 0.0096 instance_segmentation_loss_cls: 0.0375 instance_segmentation_loss_reg: 0.3483 instance_segmentation_loss_poly: 0.9153 +2023/11/03 10:50:28 - mmengine - INFO - Saving checkpoint at 307000 iterations +2023/11/03 10:59:46 - mmengine - INFO - Iter(train) [307500/640000] base_lr: 1.0707e-04 lr: 1.1552e-05 eta: 4 days, 5:50:31 time: 1.0857 data_time: 0.0345 memory: 21521 grad_norm: 3.1977 loss: 1.4004 caption_loss_cls: 2.2332 grounding_loss_reg: 2.8075 detection_loss_cls: 0.0375 detection_loss_reg: 0.3487 semantic_segmentation_loss_cls: 0.0096 instance_segmentation_loss_cls: 0.0374 instance_segmentation_loss_reg: 0.3478 instance_segmentation_loss_poly: 0.9142 +2023/11/03 11:08:53 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231103_070902 +2023/11/03 11:08:53 - mmengine - INFO - Iter(train) [308000/640000] base_lr: 1.0683e-04 lr: 1.1530e-05 eta: 4 days, 5:39:23 time: 1.0922 data_time: 0.0346 memory: 21521 grad_norm: 3.1526 loss: 1.3798 caption_loss_cls: 2.2300 grounding_loss_reg: 2.8074 detection_loss_cls: 0.0374 detection_loss_reg: 0.3479 semantic_segmentation_loss_cls: 0.0096 instance_segmentation_loss_cls: 0.0373 instance_segmentation_loss_reg: 0.3475 instance_segmentation_loss_poly: 0.9145 +2023/11/03 11:08:53 - mmengine - INFO - Saving checkpoint at 308000 iterations +2023/11/03 11:18:30 - mmengine - INFO - Iter(train) [308500/640000] base_lr: 1.0659e-04 lr: 1.1508e-05 eta: 4 days, 5:41:37 time: 1.1033 data_time: 0.0347 memory: 21521 grad_norm: 3.1258 loss: 1.3579 caption_loss_cls: 2.2235 grounding_loss_reg: 2.8082 detection_loss_cls: 0.0373 detection_loss_reg: 0.3463 semantic_segmentation_loss_cls: 0.0096 instance_segmentation_loss_cls: 0.0372 instance_segmentation_loss_reg: 0.3456 instance_segmentation_loss_poly: 0.9114 +2023/11/03 11:27:43 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231103_070902 +2023/11/03 11:27:43 - mmengine - INFO - Iter(train) [309000/640000] base_lr: 1.0634e-04 lr: 1.1486e-05 eta: 4 days, 5:32:19 time: 1.1032 data_time: 0.0347 memory: 21521 grad_norm: 3.1254 loss: 1.3589 caption_loss_cls: 2.2227 grounding_loss_reg: 2.8041 detection_loss_cls: 0.0373 detection_loss_reg: 0.3455 semantic_segmentation_loss_cls: 0.0096 instance_segmentation_loss_cls: 0.0372 instance_segmentation_loss_reg: 0.3461 instance_segmentation_loss_poly: 0.9119 +2023/11/03 11:27:43 - mmengine - INFO - Saving checkpoint at 309000 iterations +2023/11/03 11:37:21 - mmengine - INFO - Iter(train) [309500/640000] base_lr: 1.0610e-04 lr: 1.1464e-05 eta: 4 days, 5:33:48 time: 1.1100 data_time: 0.0350 memory: 21521 grad_norm: 3.1004 loss: 1.3523 caption_loss_cls: 2.2222 grounding_loss_reg: 2.8034 detection_loss_cls: 0.0371 detection_loss_reg: 0.3444 semantic_segmentation_loss_cls: 0.0096 instance_segmentation_loss_cls: 0.0371 instance_segmentation_loss_reg: 0.3455 instance_segmentation_loss_poly: 0.9103 +2023/11/03 11:46:28 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231103_070902 +2023/11/03 11:46:28 - mmengine - INFO - Iter(train) [310000/640000] base_lr: 1.0586e-04 lr: 1.1442e-05 eta: 4 days, 5:21:58 time: 1.1124 data_time: 0.0350 memory: 21521 grad_norm: 3.0678 loss: 1.3412 caption_loss_cls: 2.2192 grounding_loss_reg: 2.8017 detection_loss_cls: 0.0370 detection_loss_reg: 0.3440 semantic_segmentation_loss_cls: 0.0096 instance_segmentation_loss_cls: 0.0369 instance_segmentation_loss_reg: 0.3450 instance_segmentation_loss_poly: 0.9091 +2023/11/03 11:46:28 - mmengine - INFO - Saving checkpoint at 310000 iterations +2023/11/03 11:56:03 - mmengine - INFO - Iter(train) [310500/640000] base_lr: 1.0562e-04 lr: 1.1420e-05 eta: 4 days, 5:20:50 time: 1.1136 data_time: 0.0349 memory: 21521 grad_norm: 3.0124 loss: 1.3274 caption_loss_cls: 2.2202 grounding_loss_reg: 2.7990 detection_loss_cls: 0.0370 detection_loss_reg: 0.3443 semantic_segmentation_loss_cls: 0.0096 instance_segmentation_loss_cls: 0.0370 instance_segmentation_loss_reg: 0.3460 instance_segmentation_loss_poly: 0.9108 +2023/11/03 12:05:04 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231103_070902 +2023/11/03 12:05:04 - mmengine - INFO - Iter(train) [311000/640000] base_lr: 1.0537e-04 lr: 1.1398e-05 eta: 4 days, 5:07:04 time: 1.1184 data_time: 0.0352 memory: 21521 grad_norm: 3.0209 loss: 1.3319 caption_loss_cls: 2.2173 grounding_loss_reg: 2.7968 detection_loss_cls: 0.0369 detection_loss_reg: 0.3444 semantic_segmentation_loss_cls: 0.0096 instance_segmentation_loss_cls: 0.0370 instance_segmentation_loss_reg: 0.3463 instance_segmentation_loss_poly: 0.9105 +2023/11/03 12:05:04 - mmengine - INFO - Saving checkpoint at 311000 iterations +2023/11/03 12:14:34 - mmengine - INFO - Iter(train) [311500/640000] base_lr: 1.0513e-04 lr: 1.1375e-05 eta: 4 days, 5:03:37 time: 1.1215 data_time: 0.0353 memory: 21521 grad_norm: 3.0337 loss: 1.3315 caption_loss_cls: 2.2167 grounding_loss_reg: 2.7961 detection_loss_cls: 0.0369 detection_loss_reg: 0.3440 semantic_segmentation_loss_cls: 0.0096 instance_segmentation_loss_cls: 0.0371 instance_segmentation_loss_reg: 0.3470 instance_segmentation_loss_poly: 0.9118 +2023/11/03 12:23:55 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231103_070902 +2023/11/03 12:23:55 - mmengine - INFO - Iter(train) [312000/640000] base_lr: 1.0489e-04 lr: 1.1353e-05 eta: 4 days, 4:56:49 time: 1.1249 data_time: 0.0354 memory: 21521 grad_norm: 3.0490 loss: 1.3333 caption_loss_cls: 2.2131 grounding_loss_reg: 2.7947 detection_loss_cls: 0.0368 detection_loss_reg: 0.3435 semantic_segmentation_loss_cls: 0.0096 instance_segmentation_loss_cls: 0.0370 instance_segmentation_loss_reg: 0.3458 instance_segmentation_loss_poly: 0.9091 +2023/11/03 12:23:55 - mmengine - INFO - Saving checkpoint at 312000 iterations +2023/11/03 12:32:57 - mmengine - INFO - Iter(train) [312500/640000] base_lr: 1.0464e-04 lr: 1.1331e-05 eta: 4 days, 4:43:23 time: 1.1160 data_time: 0.0352 memory: 21521 grad_norm: 3.0848 loss: 1.3527 caption_loss_cls: 2.2146 grounding_loss_reg: 2.7917 detection_loss_cls: 0.0370 detection_loss_reg: 0.3449 semantic_segmentation_loss_cls: 0.0096 instance_segmentation_loss_cls: 0.0369 instance_segmentation_loss_reg: 0.3452 instance_segmentation_loss_poly: 0.9083 +2023/11/03 12:41:46 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231103_070902 +2023/11/03 12:41:46 - mmengine - INFO - Iter(train) [313000/640000] base_lr: 1.0440e-04 lr: 1.1309e-05 eta: 4 days, 4:26:17 time: 1.1103 data_time: 0.0348 memory: 21521 grad_norm: 3.0886 loss: 1.3419 caption_loss_cls: 2.2114 grounding_loss_reg: 2.7942 detection_loss_cls: 0.0369 detection_loss_reg: 0.3444 semantic_segmentation_loss_cls: 0.0095 instance_segmentation_loss_cls: 0.0369 instance_segmentation_loss_reg: 0.3451 instance_segmentation_loss_poly: 0.9075 +2023/11/03 12:41:46 - mmengine - INFO - Saving checkpoint at 313000 iterations +2023/11/03 12:51:07 - mmengine - INFO - Iter(train) [313500/640000] base_lr: 1.0416e-04 lr: 1.1287e-05 eta: 4 days, 4:19:23 time: 1.1057 data_time: 0.0346 memory: 21521 grad_norm: 3.0779 loss: 1.3362 caption_loss_cls: 2.2107 grounding_loss_reg: 2.7927 detection_loss_cls: 0.0367 detection_loss_reg: 0.3436 semantic_segmentation_loss_cls: 0.0095 instance_segmentation_loss_cls: 0.0369 instance_segmentation_loss_reg: 0.3455 instance_segmentation_loss_poly: 0.9082 +2023/11/03 13:00:05 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231103_070902 +2023/11/03 13:00:05 - mmengine - INFO - Iter(train) [314000/640000] base_lr: 1.0392e-04 lr: 1.1265e-05 eta: 4 days, 4:05:43 time: 1.1037 data_time: 0.0346 memory: 21521 grad_norm: 3.0927 loss: 1.3419 caption_loss_cls: 2.2087 grounding_loss_reg: 2.7921 detection_loss_cls: 0.0366 detection_loss_reg: 0.3436 semantic_segmentation_loss_cls: 0.0095 instance_segmentation_loss_cls: 0.0369 instance_segmentation_loss_reg: 0.3454 instance_segmentation_loss_poly: 0.9068 +2023/11/03 13:00:05 - mmengine - INFO - Saving checkpoint at 314000 iterations +2023/11/03 13:09:37 - mmengine - INFO - Iter(train) [314500/640000] base_lr: 1.0367e-04 lr: 1.1243e-05 eta: 4 days, 4:01:53 time: 1.1029 data_time: 0.0345 memory: 21521 grad_norm: 3.1206 loss: 1.3463 caption_loss_cls: 2.2111 grounding_loss_reg: 2.7904 detection_loss_cls: 0.0367 detection_loss_reg: 0.3444 semantic_segmentation_loss_cls: 0.0095 instance_segmentation_loss_cls: 0.0369 instance_segmentation_loss_reg: 0.3451 instance_segmentation_loss_poly: 0.9066 +2023/11/03 13:18:52 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231103_070902 +2023/11/03 13:18:52 - mmengine - INFO - Iter(train) [315000/640000] base_lr: 1.0343e-04 lr: 1.1221e-05 eta: 4 days, 3:53:10 time: 1.1063 data_time: 0.0345 memory: 21521 grad_norm: 3.1134 loss: 1.3405 caption_loss_cls: 2.2142 grounding_loss_reg: 2.7899 detection_loss_cls: 0.0366 detection_loss_reg: 0.3435 semantic_segmentation_loss_cls: 0.0095 instance_segmentation_loss_cls: 0.0368 instance_segmentation_loss_reg: 0.3445 instance_segmentation_loss_poly: 0.9059 +2023/11/03 13:18:52 - mmengine - INFO - Saving checkpoint at 315000 iterations +2023/11/03 13:27:58 - mmengine - INFO - Iter(train) [315500/640000] base_lr: 1.0319e-04 lr: 1.1199e-05 eta: 4 days, 3:42:03 time: 1.1005 data_time: 0.0342 memory: 21521 grad_norm: 3.0944 loss: 1.3283 caption_loss_cls: 2.2132 grounding_loss_reg: 2.7911 detection_loss_cls: 0.0365 detection_loss_reg: 0.3430 semantic_segmentation_loss_cls: 0.0095 instance_segmentation_loss_cls: 0.0367 instance_segmentation_loss_reg: 0.3444 instance_segmentation_loss_poly: 0.9045 +2023/11/03 13:37:09 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231103_070902 +2023/11/03 13:37:09 - mmengine - INFO - Iter(train) [316000/640000] base_lr: 1.0294e-04 lr: 1.1177e-05 eta: 4 days, 3:32:12 time: 1.0980 data_time: 0.0341 memory: 21521 grad_norm: 3.0842 loss: 1.3292 caption_loss_cls: 2.2106 grounding_loss_reg: 2.7908 detection_loss_cls: 0.0365 detection_loss_reg: 0.3430 semantic_segmentation_loss_cls: 0.0095 instance_segmentation_loss_cls: 0.0367 instance_segmentation_loss_reg: 0.3444 instance_segmentation_loss_poly: 0.9029 +2023/11/03 13:37:09 - mmengine - INFO - Saving checkpoint at 316000 iterations +2023/11/03 13:46:56 - mmengine - INFO - Iter(train) [316500/640000] base_lr: 1.0270e-04 lr: 1.1155e-05 eta: 4 days, 3:31:37 time: 1.1091 data_time: 0.0343 memory: 21521 grad_norm: 3.0758 loss: 1.3213 caption_loss_cls: 2.2166 grounding_loss_reg: 2.7869 detection_loss_cls: 0.0364 detection_loss_reg: 0.3425 semantic_segmentation_loss_cls: 0.0095 instance_segmentation_loss_cls: 0.0367 instance_segmentation_loss_reg: 0.3444 instance_segmentation_loss_poly: 0.9023 +2023/11/03 13:56:10 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231103_070902 +2023/11/03 13:56:10 - mmengine - INFO - Iter(train) [317000/640000] base_lr: 1.0246e-04 lr: 1.1133e-05 eta: 4 days, 3:22:32 time: 1.1155 data_time: 0.0346 memory: 21521 grad_norm: 3.0572 loss: 1.3233 caption_loss_cls: 2.2184 grounding_loss_reg: 2.7864 detection_loss_cls: 0.0364 detection_loss_reg: 0.3419 semantic_segmentation_loss_cls: 0.0095 instance_segmentation_loss_cls: 0.0367 instance_segmentation_loss_reg: 0.3437 instance_segmentation_loss_poly: 0.9010 +2023/11/03 13:56:10 - mmengine - INFO - Saving checkpoint at 317000 iterations +2023/11/03 14:05:07 - mmengine - INFO - Iter(train) [317500/640000] base_lr: 1.0222e-04 lr: 1.1110e-05 eta: 4 days, 3:09:03 time: 1.1096 data_time: 0.0345 memory: 21521 grad_norm: 3.1205 loss: 1.3375 caption_loss_cls: 2.2182 grounding_loss_reg: 2.7854 detection_loss_cls: 0.0366 detection_loss_reg: 0.3418 semantic_segmentation_loss_cls: 0.0095 instance_segmentation_loss_cls: 0.0368 instance_segmentation_loss_reg: 0.3437 instance_segmentation_loss_poly: 0.9009 +2023/11/03 14:14:31 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231103_070902 +2023/11/03 14:14:31 - mmengine - INFO - Iter(train) [318000/640000] base_lr: 1.0197e-04 lr: 1.1088e-05 eta: 4 days, 3:02:22 time: 1.1160 data_time: 0.0348 memory: 21521 grad_norm: 3.0887 loss: 1.3382 caption_loss_cls: 2.2231 grounding_loss_reg: 2.7838 detection_loss_cls: 0.0366 detection_loss_reg: 0.3416 semantic_segmentation_loss_cls: 0.0095 instance_segmentation_loss_cls: 0.0368 instance_segmentation_loss_reg: 0.3435 instance_segmentation_loss_poly: 0.8998 +2023/11/03 14:14:31 - mmengine - INFO - Saving checkpoint at 318000 iterations +2023/11/03 14:24:00 - mmengine - INFO - Iter(train) [318500/640000] base_lr: 1.0173e-04 lr: 1.1066e-05 eta: 4 days, 2:56:37 time: 1.1153 data_time: 0.0349 memory: 21521 grad_norm: 3.1170 loss: 1.3459 caption_loss_cls: 2.2239 grounding_loss_reg: 2.7809 detection_loss_cls: 0.0366 detection_loss_reg: 0.3426 semantic_segmentation_loss_cls: 0.0095 instance_segmentation_loss_cls: 0.0370 instance_segmentation_loss_reg: 0.3441 instance_segmentation_loss_poly: 0.9012 +2023/11/03 14:33:28 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231103_070902 +2023/11/03 14:33:28 - mmengine - INFO - Iter(train) [319000/640000] base_lr: 1.0149e-04 lr: 1.1044e-05 eta: 4 days, 2:50:39 time: 1.1185 data_time: 0.0348 memory: 21521 grad_norm: 3.0890 loss: 1.3335 caption_loss_cls: 2.2196 grounding_loss_reg: 2.7815 detection_loss_cls: 0.0366 detection_loss_reg: 0.3423 semantic_segmentation_loss_cls: 0.0094 instance_segmentation_loss_cls: 0.0371 instance_segmentation_loss_reg: 0.3442 instance_segmentation_loss_poly: 0.8997 +2023/11/03 14:33:28 - mmengine - INFO - Saving checkpoint at 319000 iterations +2023/11/03 14:43:10 - mmengine - INFO - Iter(train) [319500/640000] base_lr: 1.0124e-04 lr: 1.1022e-05 eta: 4 days, 2:47:40 time: 1.1274 data_time: 0.0353 memory: 21521 grad_norm: 3.0793 loss: 1.3464 caption_loss_cls: 2.2215 grounding_loss_reg: 2.7833 detection_loss_cls: 0.0366 detection_loss_reg: 0.3432 semantic_segmentation_loss_cls: 0.0094 instance_segmentation_loss_cls: 0.0374 instance_segmentation_loss_reg: 0.3455 instance_segmentation_loss_poly: 0.9011 +2023/11/03 14:52:10 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231103_070902 +2023/11/03 14:52:10 - mmengine - INFO - Iter(train) [320000/640000] base_lr: 1.0100e-04 lr: 1.1000e-05 eta: 4 days, 2:35:01 time: 1.1246 data_time: 0.0355 memory: 21521 grad_norm: 3.1096 loss: 1.3605 caption_loss_cls: 2.2237 grounding_loss_reg: 2.7794 detection_loss_cls: 0.0367 detection_loss_reg: 0.3438 semantic_segmentation_loss_cls: 0.0094 instance_segmentation_loss_cls: 0.0375 instance_segmentation_loss_reg: 0.3459 instance_segmentation_loss_poly: 0.9014 +2023/11/03 14:52:10 - mmengine - INFO - Saving checkpoint at 320000 iterations +2023/11/03 15:01:18 - mmengine - INFO - Evaluating bbox... +2023/11/03 15:02:14 - mmengine - INFO - bbox_mAP_copypaste: 0.431 0.602 0.466 0.273 0.474 0.574 +2023/11/03 15:02:14 - mmengine - INFO - Evaluating segm... +2023/11/03 15:03:26 - mmengine - INFO - segm_mAP_copypaste: 0.285 0.520 0.277 0.147 0.323 0.444 +2023/11/03 15:08:08 - mmengine - INFO - per class results: +2023/11/03 15:08:08 - mmengine - INFO - ++---------------------+-------+-------+ +| Class | IoU | Acc | ++---------------------+-------+-------+ +| wall | 75.18 | 88.31 | +| building | 79.84 | 88.92 | +| sky | 92.74 | 97.56 | +| floor | 79.17 | 88.49 | +| tree | 72.78 | 86.06 | +| ceiling | 82.57 | 92.51 | +| road | 81.09 | 88.23 | +| bed | 85.11 | 95.34 | +| windowpane | 59.26 | 77.32 | +| grass | 66.9 | 81.13 | +| cabinet | 58.56 | 70.74 | +| sidewalk | 64.71 | 76.02 | +| person | 78.33 | 88.04 | +| earth | 33.24 | 43.97 | +| door | 48.41 | 63.9 | +| table | 58.75 | 73.25 | +| mountain | 55.81 | 78.61 | +| plant | 51.14 | 66.3 | +| curtain | 68.95 | 84.8 | +| chair | 53.89 | 69.74 | +| car | 80.23 | 90.48 | +| water | 45.67 | 57.57 | +| painting | 70.15 | 82.14 | +| sofa | 57.22 | 86.42 | +| shelf | 39.09 | 58.4 | +| house | 43.72 | 78.73 | +| sea | 46.47 | 75.33 | +| mirror | 63.95 | 71.02 | +| rug | 56.39 | 59.35 | +| field | 34.27 | 51.93 | +| armchair | 30.49 | 37.64 | +| seat | 56.13 | 86.67 | +| fence | 35.63 | 47.67 | +| desk | 43.72 | 61.28 | +| rock | 30.4 | 49.51 | +| wardrobe | 45.08 | 69.45 | +| lamp | 57.16 | 66.89 | +| bathtub | 72.89 | 86.02 | +| railing | 27.3 | 54.69 | +| cushion | 48.73 | 55.6 | +| base | 26.89 | 45.02 | +| box | 22.56 | 30.2 | +| column | 46.1 | 58.24 | +| signboard | 29.25 | 33.34 | +| chest of drawers | 40.11 | 66.22 | +| counter | 33.22 | 40.91 | +| sand | 36.15 | 43.39 | +| sink | 67.13 | 72.59 | +| skyscraper | 49.67 | 62.3 | +| fireplace | 72.87 | 84.2 | +| refrigerator | 69.24 | 75.02 | +| grandstand | 41.05 | 66.89 | +| path | 19.38 | 29.36 | +| stairs | 25.07 | 37.36 | +| runway | 69.96 | 88.13 | +| case | 31.71 | 60.07 | +| pool table | 86.45 | 95.94 | +| pillow | 51.89 | 69.88 | +| screen door | 64.86 | 68.36 | +| stairway | 33.91 | 44.28 | +| river | 21.82 | 31.25 | +| bridge | 27.4 | 32.14 | +| bookcase | 36.93 | 53.73 | +| blind | 20.14 | 20.61 | +| coffee table | 58.49 | 69.81 | +| toilet | 82.85 | 89.24 | +| flower | 31.31 | 37.67 | +| book | 45.13 | 61.61 | +| hill | 10.73 | 16.72 | +| bench | 41.8 | 50.03 | +| countertop | 54.87 | 69.13 | +| stove | 70.94 | 83.18 | +| palm | 43.39 | 57.23 | +| kitchen island | 35.99 | 81.27 | +| computer | 62.33 | 73.25 | +| swivel chair | 45.86 | 60.72 | +| boat | 43.56 | 49.48 | +| bar | 29.99 | 37.84 | +| arcade machine | 62.84 | 66.88 | +| hovel | 9.1 | 12.04 | +| bus | 89.46 | 92.2 | +| towel | 53.71 | 62.82 | +| light | 35.3 | 37.97 | +| truck | 31.8 | 44.54 | +| tower | 35.65 | 58.68 | +| chandelier | 59.33 | 70.97 | +| awning | 19.21 | 20.95 | +| streetlight | 24.05 | 29.04 | +| booth | 68.42 | 72.03 | +| television receiver | 67.85 | 82.84 | +| airplane | 51.86 | 63.95 | +| dirt track | 0.0 | 0.0 | +| apparel | 28.65 | 45.92 | +| pole | 29.25 | 38.22 | +| land | 3.1 | 5.4 | +| bannister | 13.88 | 17.44 | +| escalator | 38.38 | 54.43 | +| ottoman | 45.27 | 63.0 | +| bottle | 15.06 | 17.08 | +| buffet | 30.27 | 30.43 | +| poster | 14.14 | 15.43 | +| stage | 15.16 | 27.75 | +| van | 30.27 | 39.5 | +| ship | 52.27 | 94.53 | +| fountain | 11.44 | 11.7 | +| conveyer belt | 78.77 | 88.59 | +| canopy | 20.38 | 27.93 | +| washer | 66.28 | 67.07 | +| plaything | 23.55 | 31.1 | +| swimming pool | 43.15 | 70.41 | +| stool | 38.77 | 48.49 | +| barrel | 11.69 | 21.88 | +| basket | 18.96 | 24.42 | +| waterfall | 48.5 | 55.91 | +| tent | 93.82 | 96.97 | +| bag | 7.33 | 7.69 | +| minibike | 65.13 | 74.16 | +| cradle | 71.04 | 85.89 | +| oven | 19.27 | 31.07 | +| ball | 10.18 | 10.75 | +| food | 47.28 | 54.52 | +| step | 15.61 | 17.14 | +| tank | 44.97 | 54.64 | +| trade name | 10.07 | 10.49 | +| microwave | 67.31 | 73.23 | +| pot | 44.81 | 50.83 | +| animal | 53.2 | 55.77 | +| bicycle | 55.36 | 75.78 | +| lake | 63.89 | 67.08 | +| dishwasher | 49.77 | 76.68 | +| screen | 69.37 | 82.09 | +| blanket | 10.25 | 13.53 | +| sculpture | 52.73 | 59.57 | +| hood | 50.88 | 56.12 | +| sconce | 34.92 | 41.81 | +| vase | 39.68 | 59.83 | +| traffic light | 32.23 | 51.74 | +| tray | 4.04 | 5.74 | +| ashcan | 34.73 | 39.98 | +| fan | 50.29 | 64.85 | +| pier | 25.34 | 26.23 | +| crt screen | 7.41 | 16.87 | +| plate | 56.78 | 69.55 | +| monitor | 24.97 | 36.22 | +| bulletin board | 17.39 | 20.55 | +| shower | 3.66 | 6.9 | +| radiator | 42.68 | 44.37 | +| glass | 9.95 | 10.24 | +| clock | 20.36 | 23.27 | +| flag | 30.58 | 34.96 | ++---------------------+-------+-------+ +2023/11/03 15:08:23 - mmengine - INFO - Iter(val) [209/209] coco/bbox_mAP: 0.4310 coco/bbox_mAP_50: 0.6020 coco/bbox_mAP_75: 0.4660 coco/bbox_mAP_s: 0.2730 coco/bbox_mAP_m: 0.4740 coco/bbox_mAP_l: 0.5740 coco/segm_mAP: 0.2850 coco/segm_mAP_50: 0.5200 coco/segm_mAP_75: 0.2770 coco/segm_mAP_s: 0.1470 coco/segm_mAP_m: 0.3230 coco/segm_mAP_l: 0.4440 Bleu_1: 0.7218 Bleu_2: 0.5510 Bleu_3: 0.4103 Bleu_4: 0.3023 METEOR: 0.2542 ROUGE_L: 0.5301 CIDEr: 0.9622 SPICE: 0.1849 aAcc: 81.0700 mIoU: 44.2300 mAcc: 55.2800 visual-grounding/miou: 0.7464 visual-grounding/acc: 0.8229 data_time: 0.0046 time: 0.5264 +2023/11/03 15:18:03 - mmengine - INFO - Iter(train) [320500/640000] base_lr: 1.0076e-04 lr: 1.0978e-05 eta: 4 days, 2:31:29 time: 1.1233 data_time: 0.0326 memory: 21521 grad_norm: 3.0421 loss: 1.3508 caption_loss_cls: 2.2287 grounding_loss_reg: 2.7786 detection_loss_cls: 0.0366 detection_loss_reg: 0.3438 semantic_segmentation_loss_cls: 0.0094 instance_segmentation_loss_cls: 0.0374 instance_segmentation_loss_reg: 0.3450 instance_segmentation_loss_poly: 0.8982 +2023/11/03 15:27:56 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231103_070902 +2023/11/03 15:27:56 - mmengine - INFO - Iter(train) [321000/640000] base_lr: 1.0051e-04 lr: 1.0956e-05 eta: 4 days, 2:30:12 time: 1.1329 data_time: 0.0330 memory: 21521 grad_norm: 3.0304 loss: 1.3397 caption_loss_cls: 2.2269 grounding_loss_reg: 2.7764 detection_loss_cls: 0.0365 detection_loss_reg: 0.3426 semantic_segmentation_loss_cls: 0.0094 instance_segmentation_loss_cls: 0.0373 instance_segmentation_loss_reg: 0.3447 instance_segmentation_loss_poly: 0.8973 +2023/11/03 15:27:56 - mmengine - INFO - Saving checkpoint at 321000 iterations +2023/11/03 15:37:30 - mmengine - INFO - Iter(train) [321500/640000] base_lr: 1.0027e-04 lr: 1.0934e-05 eta: 4 days, 2:24:44 time: 1.1422 data_time: 0.0333 memory: 21521 grad_norm: 3.0036 loss: 1.3341 caption_loss_cls: 2.2284 grounding_loss_reg: 2.7781 detection_loss_cls: 0.0365 detection_loss_reg: 0.3427 semantic_segmentation_loss_cls: 0.0094 instance_segmentation_loss_cls: 0.0373 instance_segmentation_loss_reg: 0.3445 instance_segmentation_loss_poly: 0.8968 +2023/11/03 15:47:15 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231103_070902 +2023/11/03 15:47:15 - mmengine - INFO - Iter(train) [322000/640000] base_lr: 1.0003e-04 lr: 1.0912e-05 eta: 4 days, 2:21:17 time: 1.1474 data_time: 0.0332 memory: 21521 grad_norm: 2.9786 loss: 1.3151 caption_loss_cls: 2.2266 grounding_loss_reg: 2.7779 detection_loss_cls: 0.0366 detection_loss_reg: 0.3424 semantic_segmentation_loss_cls: 0.0094 instance_segmentation_loss_cls: 0.0372 instance_segmentation_loss_reg: 0.3435 instance_segmentation_loss_poly: 0.8941 +2023/11/03 15:47:15 - mmengine - INFO - Saving checkpoint at 322000 iterations +2023/11/03 15:56:34 - mmengine - INFO - Iter(train) [322500/640000] base_lr: 9.9786e-05 lr: 1.0890e-05 eta: 4 days, 2:12:23 time: 1.1450 data_time: 0.0331 memory: 21521 grad_norm: 2.9271 loss: 1.3021 caption_loss_cls: 2.2249 grounding_loss_reg: 2.7815 detection_loss_cls: 0.0365 detection_loss_reg: 0.3421 semantic_segmentation_loss_cls: 0.0094 instance_segmentation_loss_cls: 0.0371 instance_segmentation_loss_reg: 0.3423 instance_segmentation_loss_poly: 0.8916 +2023/11/03 16:05:48 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231103_070902 +2023/11/03 16:05:48 - mmengine - INFO - Iter(train) [323000/640000] base_lr: 9.9543e-05 lr: 1.0868e-05 eta: 4 days, 2:02:30 time: 1.1414 data_time: 0.0330 memory: 21521 grad_norm: 2.9707 loss: 1.3094 caption_loss_cls: 2.2236 grounding_loss_reg: 2.7805 detection_loss_cls: 0.0364 detection_loss_reg: 0.3406 semantic_segmentation_loss_cls: 0.0094 instance_segmentation_loss_cls: 0.0370 instance_segmentation_loss_reg: 0.3410 instance_segmentation_loss_poly: 0.8891 +2023/11/03 16:05:48 - mmengine - INFO - Saving checkpoint at 323000 iterations +2023/11/03 16:15:14 - mmengine - INFO - Iter(train) [323500/640000] base_lr: 9.9300e-05 lr: 1.0845e-05 eta: 4 days, 1:55:01 time: 1.1375 data_time: 0.0328 memory: 21521 grad_norm: 2.9686 loss: 1.2957 caption_loss_cls: 2.2231 grounding_loss_reg: 2.7789 detection_loss_cls: 0.0363 detection_loss_reg: 0.3401 semantic_segmentation_loss_cls: 0.0094 instance_segmentation_loss_cls: 0.0371 instance_segmentation_loss_reg: 0.3418 instance_segmentation_loss_poly: 0.8911 +2023/11/03 16:24:37 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231103_070902 +2023/11/03 16:24:37 - mmengine - INFO - Iter(train) [324000/640000] base_lr: 9.9057e-05 lr: 1.0823e-05 eta: 4 days, 1:46:42 time: 1.1431 data_time: 0.0328 memory: 21521 grad_norm: 2.9405 loss: 1.2821 caption_loss_cls: 2.2214 grounding_loss_reg: 2.7763 detection_loss_cls: 0.0362 detection_loss_reg: 0.3398 semantic_segmentation_loss_cls: 0.0094 instance_segmentation_loss_cls: 0.0370 instance_segmentation_loss_reg: 0.3414 instance_segmentation_loss_poly: 0.8898 +2023/11/03 16:24:37 - mmengine - INFO - Saving checkpoint at 324000 iterations +2023/11/03 16:33:57 - mmengine - INFO - Iter(train) [324500/640000] base_lr: 9.8814e-05 lr: 1.0801e-05 eta: 4 days, 1:38:02 time: 1.1380 data_time: 0.0356 memory: 21521 grad_norm: 2.9921 loss: 1.2890 caption_loss_cls: 2.2210 grounding_loss_reg: 2.7746 detection_loss_cls: 0.0360 detection_loss_reg: 0.3394 semantic_segmentation_loss_cls: 0.0094 instance_segmentation_loss_cls: 0.0370 instance_segmentation_loss_reg: 0.3404 instance_segmentation_loss_poly: 0.8873 +2023/11/03 16:42:35 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231103_070902 +2023/11/03 16:42:35 - mmengine - INFO - Iter(train) [325000/640000] base_lr: 9.8571e-05 lr: 1.0779e-05 eta: 4 days, 1:21:40 time: 1.1193 data_time: 0.0351 memory: 21521 grad_norm: 3.0625 loss: 1.3156 caption_loss_cls: 2.2216 grounding_loss_reg: 2.7789 detection_loss_cls: 0.0359 detection_loss_reg: 0.3387 semantic_segmentation_loss_cls: 0.0094 instance_segmentation_loss_cls: 0.0370 instance_segmentation_loss_reg: 0.3404 instance_segmentation_loss_poly: 0.8879 +2023/11/03 16:42:35 - mmengine - INFO - Saving checkpoint at 325000 iterations +2023/11/03 16:52:01 - mmengine - INFO - Iter(train) [325500/640000] base_lr: 9.8328e-05 lr: 1.0757e-05 eta: 4 days, 1:14:05 time: 1.1173 data_time: 0.0353 memory: 21521 grad_norm: 3.0924 loss: 1.3190 caption_loss_cls: 2.2192 grounding_loss_reg: 2.7780 detection_loss_cls: 0.0359 detection_loss_reg: 0.3379 semantic_segmentation_loss_cls: 0.0093 instance_segmentation_loss_cls: 0.0371 instance_segmentation_loss_reg: 0.3406 instance_segmentation_loss_poly: 0.8870 +2023/11/03 17:01:05 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231103_070902 +2023/11/03 17:01:05 - mmengine - INFO - Iter(train) [326000/640000] base_lr: 9.8085e-05 lr: 1.0735e-05 eta: 4 days, 1:02:23 time: 1.1068 data_time: 0.0353 memory: 21521 grad_norm: 3.1481 loss: 1.3406 caption_loss_cls: 2.2198 grounding_loss_reg: 2.7780 detection_loss_cls: 0.0358 detection_loss_reg: 0.3379 semantic_segmentation_loss_cls: 0.0093 instance_segmentation_loss_cls: 0.0370 instance_segmentation_loss_reg: 0.3403 instance_segmentation_loss_poly: 0.8868 +2023/11/03 17:01:05 - mmengine - INFO - Saving checkpoint at 326000 iterations +2023/11/03 17:10:36 - mmengine - INFO - Iter(train) [326500/640000] base_lr: 9.7842e-05 lr: 1.0713e-05 eta: 4 days, 0:55:39 time: 1.1099 data_time: 0.0355 memory: 21521 grad_norm: 3.1657 loss: 1.3483 caption_loss_cls: 2.2236 grounding_loss_reg: 2.7774 detection_loss_cls: 0.0358 detection_loss_reg: 0.3380 semantic_segmentation_loss_cls: 0.0093 instance_segmentation_loss_cls: 0.0371 instance_segmentation_loss_reg: 0.3408 instance_segmentation_loss_poly: 0.8875 +2023/11/03 17:20:08 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231103_070902 +2023/11/03 17:20:08 - mmengine - INFO - Iter(train) [327000/640000] base_lr: 9.7599e-05 lr: 1.0691e-05 eta: 4 days, 0:48:55 time: 1.1144 data_time: 0.0360 memory: 21521 grad_norm: 3.1463 loss: 1.3516 caption_loss_cls: 2.2238 grounding_loss_reg: 2.7719 detection_loss_cls: 0.0359 detection_loss_reg: 0.3383 semantic_segmentation_loss_cls: 0.0093 instance_segmentation_loss_cls: 0.0371 instance_segmentation_loss_reg: 0.3406 instance_segmentation_loss_poly: 0.8865 +2023/11/03 17:20:08 - mmengine - INFO - Saving checkpoint at 327000 iterations +2023/11/03 17:29:29 - mmengine - INFO - Iter(train) [327500/640000] base_lr: 9.7357e-05 lr: 1.0669e-05 eta: 4 days, 0:40:18 time: 1.1131 data_time: 0.0357 memory: 21521 grad_norm: 3.1190 loss: 1.3412 caption_loss_cls: 2.2224 grounding_loss_reg: 2.7719 detection_loss_cls: 0.0358 detection_loss_reg: 0.3379 semantic_segmentation_loss_cls: 0.0093 instance_segmentation_loss_cls: 0.0371 instance_segmentation_loss_reg: 0.3410 instance_segmentation_loss_poly: 0.8875 +2023/11/03 17:38:50 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231103_070902 +2023/11/03 17:38:50 - mmengine - INFO - Iter(train) [328000/640000] base_lr: 9.7114e-05 lr: 1.0647e-05 eta: 4 days, 0:31:39 time: 1.1127 data_time: 0.0357 memory: 21521 grad_norm: 3.1376 loss: 1.3458 caption_loss_cls: 2.2236 grounding_loss_reg: 2.7722 detection_loss_cls: 0.0358 detection_loss_reg: 0.3381 semantic_segmentation_loss_cls: 0.0093 instance_segmentation_loss_cls: 0.0372 instance_segmentation_loss_reg: 0.3411 instance_segmentation_loss_poly: 0.8870 +2023/11/03 17:38:50 - mmengine - INFO - Saving checkpoint at 328000 iterations +2023/11/03 17:48:36 - mmengine - INFO - Iter(train) [328500/640000] base_lr: 9.6871e-05 lr: 1.0625e-05 eta: 4 days, 0:26:59 time: 1.1191 data_time: 0.0360 memory: 21521 grad_norm: 3.1149 loss: 1.3457 caption_loss_cls: 2.2263 grounding_loss_reg: 2.7733 detection_loss_cls: 0.0358 detection_loss_reg: 0.3390 semantic_segmentation_loss_cls: 0.0093 instance_segmentation_loss_cls: 0.0372 instance_segmentation_loss_reg: 0.3418 instance_segmentation_loss_poly: 0.8875 +2023/11/03 17:57:46 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231103_070902 +2023/11/03 17:57:46 - mmengine - INFO - Iter(train) [329000/640000] base_lr: 9.6628e-05 lr: 1.0603e-05 eta: 4 days, 0:16:32 time: 1.1271 data_time: 0.0363 memory: 21521 grad_norm: 3.0869 loss: 1.3351 caption_loss_cls: 2.2292 grounding_loss_reg: 2.7750 detection_loss_cls: 0.0359 detection_loss_reg: 0.3395 semantic_segmentation_loss_cls: 0.0093 instance_segmentation_loss_cls: 0.0372 instance_segmentation_loss_reg: 0.3428 instance_segmentation_loss_poly: 0.8898 +2023/11/03 17:57:46 - mmengine - INFO - Saving checkpoint at 329000 iterations +2023/11/03 18:06:55 - mmengine - INFO - Iter(train) [329500/640000] base_lr: 9.6385e-05 lr: 1.0580e-05 eta: 4 days, 0:05:50 time: 1.1227 data_time: 0.0361 memory: 21521 grad_norm: 3.0811 loss: 1.3421 caption_loss_cls: 2.2285 grounding_loss_reg: 2.7718 detection_loss_cls: 0.0360 detection_loss_reg: 0.3403 semantic_segmentation_loss_cls: 0.0093 instance_segmentation_loss_cls: 0.0372 instance_segmentation_loss_reg: 0.3432 instance_segmentation_loss_poly: 0.8915 +2023/11/03 18:16:18 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231103_070902 +2023/11/03 18:16:18 - mmengine - INFO - Iter(train) [330000/640000] base_lr: 9.6143e-05 lr: 1.0558e-05 eta: 3 days, 23:57:25 time: 1.1277 data_time: 0.0363 memory: 21521 grad_norm: 3.0688 loss: 1.3396 caption_loss_cls: 2.2321 grounding_loss_reg: 2.7735 detection_loss_cls: 0.0360 detection_loss_reg: 0.3404 semantic_segmentation_loss_cls: 0.0093 instance_segmentation_loss_cls: 0.0371 instance_segmentation_loss_reg: 0.3435 instance_segmentation_loss_poly: 0.8924 +2023/11/03 18:16:18 - mmengine - INFO - Saving checkpoint at 330000 iterations +2023/11/03 18:25:56 - mmengine - INFO - Iter(train) [330500/640000] base_lr: 9.5900e-05 lr: 1.0536e-05 eta: 3 days, 23:51:12 time: 1.1293 data_time: 0.0366 memory: 21521 grad_norm: 3.0650 loss: 1.3440 caption_loss_cls: 2.2294 grounding_loss_reg: 2.7716 detection_loss_cls: 0.0358 detection_loss_reg: 0.3396 semantic_segmentation_loss_cls: 0.0093 instance_segmentation_loss_cls: 0.0371 instance_segmentation_loss_reg: 0.3431 instance_segmentation_loss_poly: 0.8913 +2023/11/03 18:35:08 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231103_070902 +2023/11/03 18:35:08 - mmengine - INFO - Iter(train) [331000/640000] base_lr: 9.5657e-05 lr: 1.0514e-05 eta: 3 days, 23:41:03 time: 1.1243 data_time: 0.0363 memory: 21521 grad_norm: 3.0651 loss: 1.3446 caption_loss_cls: 2.2267 grounding_loss_reg: 2.7724 detection_loss_cls: 0.0359 detection_loss_reg: 0.3400 semantic_segmentation_loss_cls: 0.0093 instance_segmentation_loss_cls: 0.0370 instance_segmentation_loss_reg: 0.3424 instance_segmentation_loss_poly: 0.8904 +2023/11/03 18:35:08 - mmengine - INFO - Saving checkpoint at 331000 iterations +2023/11/03 18:44:25 - mmengine - INFO - Iter(train) [331500/640000] base_lr: 9.5415e-05 lr: 1.0492e-05 eta: 3 days, 23:31:45 time: 1.1235 data_time: 0.0364 memory: 21521 grad_norm: 3.0904 loss: 1.3546 caption_loss_cls: 2.2265 grounding_loss_reg: 2.7707 detection_loss_cls: 0.0358 detection_loss_reg: 0.3403 semantic_segmentation_loss_cls: 0.0093 instance_segmentation_loss_cls: 0.0370 instance_segmentation_loss_reg: 0.3438 instance_segmentation_loss_poly: 0.8922 +2023/11/03 18:53:38 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231103_070902 +2023/11/03 18:53:38 - mmengine - INFO - Iter(train) [332000/640000] base_lr: 9.5172e-05 lr: 1.0470e-05 eta: 3 days, 23:21:41 time: 1.1213 data_time: 0.0365 memory: 21521 grad_norm: 3.0691 loss: 1.3493 caption_loss_cls: 2.2282 grounding_loss_reg: 2.7697 detection_loss_cls: 0.0359 detection_loss_reg: 0.3411 semantic_segmentation_loss_cls: 0.0092 instance_segmentation_loss_cls: 0.0369 instance_segmentation_loss_reg: 0.3441 instance_segmentation_loss_poly: 0.8933 +2023/11/03 18:53:38 - mmengine - INFO - Saving checkpoint at 332000 iterations +2023/11/03 19:03:23 - mmengine - INFO - Iter(train) [332500/640000] base_lr: 9.4930e-05 lr: 1.0448e-05 eta: 3 days, 23:16:16 time: 1.1211 data_time: 0.0366 memory: 21521 grad_norm: 3.0970 loss: 1.3545 caption_loss_cls: 2.2277 grounding_loss_reg: 2.7676 detection_loss_cls: 0.0358 detection_loss_reg: 0.3411 semantic_segmentation_loss_cls: 0.0093 instance_segmentation_loss_cls: 0.0370 instance_segmentation_loss_reg: 0.3439 instance_segmentation_loss_poly: 0.8926 +2023/11/03 19:13:01 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231103_070902 +2023/11/03 19:13:01 - mmengine - INFO - Iter(train) [333000/640000] base_lr: 9.4687e-05 lr: 1.0426e-05 eta: 3 days, 23:09:43 time: 1.1280 data_time: 0.0368 memory: 21521 grad_norm: 3.0992 loss: 1.3506 caption_loss_cls: 2.2236 grounding_loss_reg: 2.7676 detection_loss_cls: 0.0358 detection_loss_reg: 0.3410 semantic_segmentation_loss_cls: 0.0093 instance_segmentation_loss_cls: 0.0369 instance_segmentation_loss_reg: 0.3434 instance_segmentation_loss_poly: 0.8927 +2023/11/03 19:13:01 - mmengine - INFO - Saving checkpoint at 333000 iterations +2023/11/03 19:21:49 - mmengine - INFO - Iter(train) [333500/640000] base_lr: 9.4445e-05 lr: 1.0404e-05 eta: 3 days, 22:56:21 time: 1.1230 data_time: 0.0366 memory: 21521 grad_norm: 3.1311 loss: 1.3543 caption_loss_cls: 2.2276 grounding_loss_reg: 2.7671 detection_loss_cls: 0.0359 detection_loss_reg: 0.3411 semantic_segmentation_loss_cls: 0.0093 instance_segmentation_loss_cls: 0.0369 instance_segmentation_loss_reg: 0.3432 instance_segmentation_loss_poly: 0.8928 +2023/11/03 19:31:27 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231103_070902 +2023/11/03 19:31:27 - mmengine - INFO - Iter(train) [334000/640000] base_lr: 9.4202e-05 lr: 1.0382e-05 eta: 3 days, 22:49:47 time: 1.1267 data_time: 0.0368 memory: 21521 grad_norm: 3.1096 loss: 1.3525 caption_loss_cls: 2.2310 grounding_loss_reg: 2.7688 detection_loss_cls: 0.0358 detection_loss_reg: 0.3408 semantic_segmentation_loss_cls: 0.0093 instance_segmentation_loss_cls: 0.0369 instance_segmentation_loss_reg: 0.3437 instance_segmentation_loss_poly: 0.8925 +2023/11/03 19:31:27 - mmengine - INFO - Saving checkpoint at 334000 iterations +2023/11/03 19:41:25 - mmengine - INFO - Iter(train) [334500/640000] base_lr: 9.3960e-05 lr: 1.0360e-05 eta: 3 days, 22:45:41 time: 1.1316 data_time: 0.0368 memory: 21521 grad_norm: 3.0994 loss: 1.3437 caption_loss_cls: 2.2331 grounding_loss_reg: 2.7672 detection_loss_cls: 0.0359 detection_loss_reg: 0.3410 semantic_segmentation_loss_cls: 0.0093 instance_segmentation_loss_cls: 0.0368 instance_segmentation_loss_reg: 0.3435 instance_segmentation_loss_poly: 0.8926 +2023/11/03 19:50:32 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231103_070902 +2023/11/03 19:50:32 - mmengine - INFO - Iter(train) [335000/640000] base_lr: 9.3718e-05 lr: 1.0338e-05 eta: 3 days, 22:34:56 time: 1.1305 data_time: 0.0368 memory: 21521 grad_norm: 3.1082 loss: 1.3414 caption_loss_cls: 2.2268 grounding_loss_reg: 2.7675 detection_loss_cls: 0.0360 detection_loss_reg: 0.3419 semantic_segmentation_loss_cls: 0.0093 instance_segmentation_loss_cls: 0.0369 instance_segmentation_loss_reg: 0.3433 instance_segmentation_loss_poly: 0.8932 +2023/11/03 19:50:32 - mmengine - INFO - Saving checkpoint at 335000 iterations +2023/11/03 19:59:54 - mmengine - INFO - Iter(train) [335500/640000] base_lr: 9.3475e-05 lr: 1.0316e-05 eta: 3 days, 22:26:01 time: 1.1314 data_time: 0.0370 memory: 21521 grad_norm: 3.1179 loss: 1.3471 caption_loss_cls: 2.2271 grounding_loss_reg: 2.7664 detection_loss_cls: 0.0359 detection_loss_reg: 0.3415 semantic_segmentation_loss_cls: 0.0093 instance_segmentation_loss_cls: 0.0370 instance_segmentation_loss_reg: 0.3441 instance_segmentation_loss_poly: 0.8962 +2023/11/03 20:09:02 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231103_070902 +2023/11/03 20:09:02 - mmengine - INFO - Iter(train) [336000/640000] base_lr: 9.3233e-05 lr: 1.0294e-05 eta: 3 days, 22:15:24 time: 1.1304 data_time: 0.0368 memory: 21521 grad_norm: 3.1394 loss: 1.3530 caption_loss_cls: 2.2309 grounding_loss_reg: 2.7682 detection_loss_cls: 0.0360 detection_loss_reg: 0.3412 semantic_segmentation_loss_cls: 0.0093 instance_segmentation_loss_cls: 0.0370 instance_segmentation_loss_reg: 0.3446 instance_segmentation_loss_poly: 0.8971 +2023/11/03 20:09:02 - mmengine - INFO - Saving checkpoint at 336000 iterations +2023/11/03 20:17:53 - mmengine - INFO - Iter(train) [336500/640000] base_lr: 9.2991e-05 lr: 1.0272e-05 eta: 3 days, 22:02:43 time: 1.1170 data_time: 0.0362 memory: 21521 grad_norm: 3.1411 loss: 1.3453 caption_loss_cls: 2.2273 grounding_loss_reg: 2.7660 detection_loss_cls: 0.0360 detection_loss_reg: 0.3416 semantic_segmentation_loss_cls: 0.0093 instance_segmentation_loss_cls: 0.0369 instance_segmentation_loss_reg: 0.3440 instance_segmentation_loss_poly: 0.8953 +2023/11/03 20:27:03 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231103_070902 +2023/11/03 20:27:03 - mmengine - INFO - Iter(train) [337000/640000] base_lr: 9.2749e-05 lr: 1.0250e-05 eta: 3 days, 21:52:21 time: 1.1099 data_time: 0.0358 memory: 21521 grad_norm: 3.1134 loss: 1.3492 caption_loss_cls: 2.2270 grounding_loss_reg: 2.7670 detection_loss_cls: 0.0360 detection_loss_reg: 0.3413 semantic_segmentation_loss_cls: 0.0092 instance_segmentation_loss_cls: 0.0368 instance_segmentation_loss_reg: 0.3437 instance_segmentation_loss_poly: 0.8939 +2023/11/03 20:27:03 - mmengine - INFO - Saving checkpoint at 337000 iterations +2023/11/03 20:36:09 - mmengine - INFO - Iter(train) [337500/640000] base_lr: 9.2507e-05 lr: 1.0228e-05 eta: 3 days, 21:41:40 time: 1.1144 data_time: 0.0358 memory: 21521 grad_norm: 3.0818 loss: 1.3343 caption_loss_cls: 2.2279 grounding_loss_reg: 2.7659 detection_loss_cls: 0.0361 detection_loss_reg: 0.3419 semantic_segmentation_loss_cls: 0.0092 instance_segmentation_loss_cls: 0.0368 instance_segmentation_loss_reg: 0.3436 instance_segmentation_loss_poly: 0.8934 +2023/11/03 20:45:08 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231103_070902 +2023/11/03 20:45:08 - mmengine - INFO - Iter(train) [338000/640000] base_lr: 9.2264e-05 lr: 1.0206e-05 eta: 3 days, 21:30:09 time: 1.1047 data_time: 0.0353 memory: 21521 grad_norm: 3.1174 loss: 1.3345 caption_loss_cls: 2.2261 grounding_loss_reg: 2.7664 detection_loss_cls: 0.0360 detection_loss_reg: 0.3411 semantic_segmentation_loss_cls: 0.0092 instance_segmentation_loss_cls: 0.0366 instance_segmentation_loss_reg: 0.3428 instance_segmentation_loss_poly: 0.8918 +2023/11/03 20:45:08 - mmengine - INFO - Saving checkpoint at 338000 iterations +2023/11/03 20:54:23 - mmengine - INFO - Iter(train) [338500/640000] base_lr: 9.2022e-05 lr: 1.0184e-05 eta: 3 days, 21:20:28 time: 1.0939 data_time: 0.0350 memory: 21521 grad_norm: 3.1716 loss: 1.3461 caption_loss_cls: 2.2286 grounding_loss_reg: 2.7637 detection_loss_cls: 0.0359 detection_loss_reg: 0.3402 semantic_segmentation_loss_cls: 0.0092 instance_segmentation_loss_cls: 0.0365 instance_segmentation_loss_reg: 0.3429 instance_segmentation_loss_poly: 0.8921 +2023/11/03 21:03:59 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231103_070902 +2023/11/03 21:03:59 - mmengine - INFO - Iter(train) [339000/640000] base_lr: 9.1781e-05 lr: 1.0162e-05 eta: 3 days, 21:13:25 time: 1.1012 data_time: 0.0351 memory: 21521 grad_norm: 3.1513 loss: 1.3382 caption_loss_cls: 2.2319 grounding_loss_reg: 2.7617 detection_loss_cls: 0.0357 detection_loss_reg: 0.3398 semantic_segmentation_loss_cls: 0.0092 instance_segmentation_loss_cls: 0.0365 instance_segmentation_loss_reg: 0.3423 instance_segmentation_loss_poly: 0.8908 +2023/11/03 21:03:59 - mmengine - INFO - Saving checkpoint at 339000 iterations +2023/11/03 21:13:28 - mmengine - INFO - Iter(train) [339500/640000] base_lr: 9.1539e-05 lr: 1.0140e-05 eta: 3 days, 21:05:25 time: 1.1031 data_time: 0.0350 memory: 21521 grad_norm: 3.1696 loss: 1.3385 caption_loss_cls: 2.2272 grounding_loss_reg: 2.7602 detection_loss_cls: 0.0357 detection_loss_reg: 0.3393 semantic_segmentation_loss_cls: 0.0092 instance_segmentation_loss_cls: 0.0364 instance_segmentation_loss_reg: 0.3414 instance_segmentation_loss_poly: 0.8895 +2023/11/03 21:22:41 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231103_070902 +2023/11/03 21:22:41 - mmengine - INFO - Iter(train) [340000/640000] base_lr: 9.1297e-05 lr: 1.0118e-05 eta: 3 days, 20:55:29 time: 1.1041 data_time: 0.0352 memory: 21521 grad_norm: 3.1763 loss: 1.3342 caption_loss_cls: 2.2222 grounding_loss_reg: 2.7609 detection_loss_cls: 0.0356 detection_loss_reg: 0.3389 semantic_segmentation_loss_cls: 0.0092 instance_segmentation_loss_cls: 0.0364 instance_segmentation_loss_reg: 0.3412 instance_segmentation_loss_poly: 0.8896 +2023/11/03 21:22:41 - mmengine - INFO - Saving checkpoint at 340000 iterations +2023/11/03 21:31:24 - mmengine - INFO - Evaluating bbox... +2023/11/03 21:32:20 - mmengine - INFO - bbox_mAP_copypaste: 0.429 0.600 0.469 0.257 0.478 0.582 +2023/11/03 21:32:20 - mmengine - INFO - Evaluating segm... +2023/11/03 21:33:32 - mmengine - INFO - segm_mAP_copypaste: 0.294 0.529 0.287 0.147 0.336 0.460 +2023/11/03 21:38:21 - mmengine - INFO - per class results: +2023/11/03 21:38:21 - mmengine - INFO - ++---------------------+-------+-------+ +| Class | IoU | Acc | ++---------------------+-------+-------+ +| wall | 75.27 | 86.2 | +| building | 81.29 | 90.91 | +| sky | 92.62 | 97.31 | +| floor | 79.8 | 89.68 | +| tree | 71.3 | 86.97 | +| ceiling | 82.03 | 93.93 | +| road | 79.49 | 84.15 | +| bed | 86.61 | 95.07 | +| windowpane | 58.59 | 77.58 | +| grass | 65.17 | 77.58 | +| cabinet | 57.72 | 70.47 | +| sidewalk | 62.38 | 82.42 | +| person | 78.66 | 91.35 | +| earth | 36.96 | 55.4 | +| door | 49.51 | 66.95 | +| table | 56.71 | 72.36 | +| mountain | 52.44 | 64.36 | +| plant | 49.99 | 61.33 | +| curtain | 69.04 | 81.3 | +| chair | 55.74 | 70.64 | +| car | 79.51 | 86.25 | +| water | 42.5 | 53.55 | +| painting | 70.72 | 84.49 | +| sofa | 67.45 | 87.07 | +| shelf | 38.21 | 60.69 | +| house | 45.93 | 70.72 | +| sea | 47.84 | 78.56 | +| mirror | 62.38 | 70.38 | +| rug | 63.87 | 69.38 | +| field | 35.76 | 50.88 | +| armchair | 42.52 | 52.45 | +| seat | 61.31 | 84.83 | +| fence | 37.88 | 56.49 | +| desk | 42.47 | 64.31 | +| rock | 39.09 | 57.12 | +| wardrobe | 44.86 | 62.17 | +| lamp | 56.17 | 71.24 | +| bathtub | 71.23 | 85.25 | +| railing | 27.78 | 40.16 | +| cushion | 54.22 | 68.57 | +| base | 20.37 | 30.65 | +| box | 22.07 | 29.02 | +| column | 47.47 | 59.6 | +| signboard | 34.22 | 44.43 | +| chest of drawers | 31.34 | 43.95 | +| counter | 35.36 | 59.96 | +| sand | 29.6 | 44.15 | +| sink | 69.19 | 76.69 | +| skyscraper | 69.54 | 91.05 | +| fireplace | 70.95 | 85.07 | +| refrigerator | 69.26 | 75.64 | +| grandstand | 37.51 | 54.75 | +| path | 26.28 | 36.92 | +| stairs | 25.53 | 34.91 | +| runway | 75.35 | 84.72 | +| case | 42.66 | 55.29 | +| pool table | 90.08 | 94.77 | +| pillow | 51.4 | 62.71 | +| screen door | 50.42 | 56.13 | +| stairway | 27.92 | 49.6 | +| river | 16.13 | 33.19 | +| bridge | 46.97 | 56.02 | +| bookcase | 32.78 | 67.84 | +| blind | 24.16 | 26.54 | +| coffee table | 62.73 | 80.72 | +| toilet | 83.49 | 88.3 | +| flower | 29.62 | 40.77 | +| book | 42.69 | 58.33 | +| hill | 7.64 | 16.84 | +| bench | 47.75 | 55.47 | +| countertop | 47.05 | 69.76 | +| stove | 65.26 | 84.51 | +| palm | 44.75 | 58.93 | +| kitchen island | 38.83 | 74.31 | +| computer | 67.54 | 76.06 | +| swivel chair | 47.6 | 65.02 | +| boat | 63.39 | 82.46 | +| bar | 57.79 | 66.16 | +| arcade machine | 28.19 | 28.7 | +| hovel | 9.21 | 11.15 | +| bus | 80.28 | 94.93 | +| towel | 57.85 | 67.92 | +| light | 42.69 | 47.94 | +| truck | 40.3 | 52.44 | +| tower | 49.37 | 68.78 | +| chandelier | 62.73 | 79.89 | +| awning | 19.13 | 26.29 | +| streetlight | 25.07 | 32.84 | +| booth | 58.76 | 68.96 | +| television receiver | 68.28 | 79.99 | +| airplane | 57.06 | 62.68 | +| dirt track | 10.4 | 15.86 | +| apparel | 25.28 | 39.22 | +| pole | 28.85 | 39.88 | +| land | 3.13 | 5.57 | +| bannister | 13.72 | 19.89 | +| escalator | 36.86 | 41.78 | +| ottoman | 52.53 | 61.47 | +| bottle | 20.31 | 23.31 | +| buffet | 44.9 | 51.34 | +| poster | 30.27 | 38.49 | +| stage | 13.57 | 29.7 | +| van | 40.33 | 60.6 | +| ship | 58.84 | 61.65 | +| fountain | 19.75 | 20.77 | +| conveyer belt | 75.3 | 87.78 | +| canopy | 18.76 | 21.75 | +| washer | 54.18 | 54.42 | +| plaything | 16.23 | 19.61 | +| swimming pool | 52.88 | 85.05 | +| stool | 38.82 | 51.4 | +| barrel | 5.74 | 48.54 | +| basket | 26.63 | 35.36 | +| waterfall | 45.17 | 58.63 | +| tent | 80.01 | 96.93 | +| bag | 9.31 | 10.22 | +| minibike | 62.1 | 76.13 | +| cradle | 71.84 | 94.52 | +| oven | 14.63 | 17.43 | +| ball | 42.41 | 48.77 | +| food | 53.82 | 60.86 | +| step | 12.8 | 13.77 | +| tank | 26.33 | 35.02 | +| trade name | 25.21 | 32.76 | +| microwave | 69.41 | 77.04 | +| pot | 46.08 | 51.79 | +| animal | 64.05 | 67.95 | +| bicycle | 54.02 | 69.14 | +| lake | 45.64 | 68.13 | +| dishwasher | 51.04 | 73.93 | +| screen | 75.74 | 84.39 | +| blanket | 8.58 | 9.96 | +| sculpture | 43.83 | 71.46 | +| hood | 48.94 | 54.28 | +| sconce | 35.6 | 65.74 | +| vase | 39.3 | 49.48 | +| traffic light | 30.62 | 46.29 | +| tray | 9.26 | 12.32 | +| ashcan | 34.26 | 40.42 | +| fan | 52.03 | 66.74 | +| pier | 34.94 | 49.84 | +| crt screen | 13.01 | 22.84 | +| plate | 52.41 | 61.85 | +| monitor | 40.49 | 48.0 | +| bulletin board | 35.68 | 49.97 | +| shower | 4.49 | 15.63 | +| radiator | 49.93 | 54.15 | +| glass | 13.52 | 14.19 | +| clock | 18.19 | 19.39 | +| flag | 32.12 | 37.0 | ++---------------------+-------+-------+ +2023/11/03 21:38:37 - mmengine - INFO - Iter(val) [209/209] coco/bbox_mAP: 0.4290 coco/bbox_mAP_50: 0.6000 coco/bbox_mAP_75: 0.4690 coco/bbox_mAP_s: 0.2570 coco/bbox_mAP_m: 0.4780 coco/bbox_mAP_l: 0.5820 coco/segm_mAP: 0.2940 coco/segm_mAP_50: 0.5290 coco/segm_mAP_75: 0.2870 coco/segm_mAP_s: 0.1470 coco/segm_mAP_m: 0.3360 coco/segm_mAP_l: 0.4600 Bleu_1: 0.7212 Bleu_2: 0.5495 Bleu_3: 0.4089 Bleu_4: 0.3019 METEOR: 0.2516 ROUGE_L: 0.5297 CIDEr: 0.9694 SPICE: 0.1843 aAcc: 81.3100 mIoU: 45.7200 mAcc: 57.9000 visual-grounding/miou: 0.7589 visual-grounding/acc: 0.8356 data_time: 0.0048 time: 0.5598 +2023/11/03 21:47:59 - mmengine - INFO - Iter(train) [340500/640000] base_lr: 9.1055e-05 lr: 1.0096e-05 eta: 3 days, 20:46:51 time: 1.1122 data_time: 0.0325 memory: 21521 grad_norm: 3.1698 loss: 1.3366 caption_loss_cls: 2.2187 grounding_loss_reg: 2.7593 detection_loss_cls: 0.0355 detection_loss_reg: 0.3388 semantic_segmentation_loss_cls: 0.0092 instance_segmentation_loss_cls: 0.0363 instance_segmentation_loss_reg: 0.3413 instance_segmentation_loss_poly: 0.8897 +2023/11/03 21:57:10 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231103_070902 +2023/11/03 21:57:10 - mmengine - INFO - Iter(train) [341000/640000] base_lr: 9.0813e-05 lr: 1.0074e-05 eta: 3 days, 20:36:48 time: 1.1126 data_time: 0.0326 memory: 21521 grad_norm: 3.2019 loss: 1.3358 caption_loss_cls: 2.2185 grounding_loss_reg: 2.7564 detection_loss_cls: 0.0355 detection_loss_reg: 0.3390 semantic_segmentation_loss_cls: 0.0092 instance_segmentation_loss_cls: 0.0364 instance_segmentation_loss_reg: 0.3421 instance_segmentation_loss_poly: 0.8904 +2023/11/03 21:57:10 - mmengine - INFO - Saving checkpoint at 341000 iterations +2023/11/03 22:06:44 - mmengine - INFO - Iter(train) [341500/640000] base_lr: 9.0572e-05 lr: 1.0052e-05 eta: 3 days, 20:29:21 time: 1.1197 data_time: 0.0330 memory: 21521 grad_norm: 3.1640 loss: 1.3294 caption_loss_cls: 2.2160 grounding_loss_reg: 2.7530 detection_loss_cls: 0.0356 detection_loss_reg: 0.3390 semantic_segmentation_loss_cls: 0.0092 instance_segmentation_loss_cls: 0.0364 instance_segmentation_loss_reg: 0.3423 instance_segmentation_loss_poly: 0.8909 +2023/11/03 22:16:37 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231103_070902 +2023/11/03 22:16:37 - mmengine - INFO - Iter(train) [342000/640000] base_lr: 9.0330e-05 lr: 1.0030e-05 eta: 3 days, 20:23:45 time: 1.1329 data_time: 0.0334 memory: 21521 grad_norm: 3.1234 loss: 1.3202 caption_loss_cls: 2.2184 grounding_loss_reg: 2.7522 detection_loss_cls: 0.0356 detection_loss_reg: 0.3399 semantic_segmentation_loss_cls: 0.0092 instance_segmentation_loss_cls: 0.0365 instance_segmentation_loss_reg: 0.3432 instance_segmentation_loss_poly: 0.8926 +2023/11/03 22:16:37 - mmengine - INFO - Saving checkpoint at 342000 iterations +2023/11/03 22:26:09 - mmengine - INFO - Iter(train) [342500/640000] base_lr: 9.0088e-05 lr: 1.0008e-05 eta: 3 days, 20:15:55 time: 1.1374 data_time: 0.0333 memory: 21521 grad_norm: 3.1020 loss: 1.3103 caption_loss_cls: 2.2203 grounding_loss_reg: 2.7506 detection_loss_cls: 0.0356 detection_loss_reg: 0.3396 semantic_segmentation_loss_cls: 0.0092 instance_segmentation_loss_cls: 0.0366 instance_segmentation_loss_reg: 0.3437 instance_segmentation_loss_poly: 0.8936 +2023/11/03 22:35:54 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231103_070902 +2023/11/03 22:35:54 - mmengine - INFO - Iter(train) [343000/640000] base_lr: 8.9847e-05 lr: 9.9861e-06 eta: 3 days, 20:09:25 time: 1.1395 data_time: 0.0334 memory: 21521 grad_norm: 3.0500 loss: 1.3020 caption_loss_cls: 2.2199 grounding_loss_reg: 2.7514 detection_loss_cls: 0.0357 detection_loss_reg: 0.3399 semantic_segmentation_loss_cls: 0.0092 instance_segmentation_loss_cls: 0.0365 instance_segmentation_loss_reg: 0.3436 instance_segmentation_loss_poly: 0.8927 +2023/11/03 22:35:54 - mmengine - INFO - Saving checkpoint at 343000 iterations +2023/11/03 22:45:22 - mmengine - INFO - Iter(train) [343500/640000] base_lr: 8.9606e-05 lr: 9.9641e-06 eta: 3 days, 20:01:04 time: 1.1392 data_time: 0.0336 memory: 21521 grad_norm: 3.0454 loss: 1.3093 caption_loss_cls: 2.2226 grounding_loss_reg: 2.7520 detection_loss_cls: 0.0356 detection_loss_reg: 0.3393 semantic_segmentation_loss_cls: 0.0092 instance_segmentation_loss_cls: 0.0366 instance_segmentation_loss_reg: 0.3434 instance_segmentation_loss_poly: 0.8922 +2023/11/03 22:54:52 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231103_070902 +2023/11/03 22:54:52 - mmengine - INFO - Iter(train) [344000/640000] base_lr: 8.9364e-05 lr: 9.9422e-06 eta: 3 days, 19:52:50 time: 1.1435 data_time: 0.0338 memory: 21521 grad_norm: 3.0162 loss: 1.3099 caption_loss_cls: 2.2270 grounding_loss_reg: 2.7542 detection_loss_cls: 0.0356 detection_loss_reg: 0.3401 semantic_segmentation_loss_cls: 0.0091 instance_segmentation_loss_cls: 0.0368 instance_segmentation_loss_reg: 0.3441 instance_segmentation_loss_poly: 0.8928 +2023/11/03 22:54:52 - mmengine - INFO - Saving checkpoint at 344000 iterations +2023/11/03 23:04:23 - mmengine - INFO - Iter(train) [344500/640000] base_lr: 8.9123e-05 lr: 9.9203e-06 eta: 3 days, 19:44:47 time: 1.1455 data_time: 0.0370 memory: 21521 grad_norm: 3.0165 loss: 1.3140 caption_loss_cls: 2.2249 grounding_loss_reg: 2.7501 detection_loss_cls: 0.0356 detection_loss_reg: 0.3397 semantic_segmentation_loss_cls: 0.0091 instance_segmentation_loss_cls: 0.0368 instance_segmentation_loss_reg: 0.3455 instance_segmentation_loss_poly: 0.8948 +2023/11/03 23:13:52 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231103_070902 +2023/11/03 23:13:52 - mmengine - INFO - Iter(train) [345000/640000] base_lr: 8.8882e-05 lr: 9.8983e-06 eta: 3 days, 19:36:29 time: 1.1500 data_time: 0.0369 memory: 21521 grad_norm: 2.9729 loss: 1.2995 caption_loss_cls: 2.2273 grounding_loss_reg: 2.7435 detection_loss_cls: 0.0358 detection_loss_reg: 0.3407 semantic_segmentation_loss_cls: 0.0091 instance_segmentation_loss_cls: 0.0367 instance_segmentation_loss_reg: 0.3448 instance_segmentation_loss_poly: 0.8940 +2023/11/03 23:13:52 - mmengine - INFO - Saving checkpoint at 345000 iterations +2023/11/03 23:23:20 - mmengine - INFO - Iter(train) [345500/640000] base_lr: 8.8641e-05 lr: 9.8764e-06 eta: 3 days, 19:28:01 time: 1.1483 data_time: 0.0368 memory: 21521 grad_norm: 2.9889 loss: 1.3048 caption_loss_cls: 2.2277 grounding_loss_reg: 2.7427 detection_loss_cls: 0.0357 detection_loss_reg: 0.3417 semantic_segmentation_loss_cls: 0.0091 instance_segmentation_loss_cls: 0.0368 instance_segmentation_loss_reg: 0.3455 instance_segmentation_loss_poly: 0.8955 +2023/11/03 23:32:50 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231103_070902 +2023/11/03 23:32:50 - mmengine - INFO - Iter(train) [346000/640000] base_lr: 8.8400e-05 lr: 9.8545e-06 eta: 3 days, 19:19:43 time: 1.1427 data_time: 0.0366 memory: 21521 grad_norm: 3.0219 loss: 1.3129 caption_loss_cls: 2.2273 grounding_loss_reg: 2.7404 detection_loss_cls: 0.0356 detection_loss_reg: 0.3412 semantic_segmentation_loss_cls: 0.0091 instance_segmentation_loss_cls: 0.0366 instance_segmentation_loss_reg: 0.3447 instance_segmentation_loss_poly: 0.8946 +2023/11/03 23:32:50 - mmengine - INFO - Saving checkpoint at 346000 iterations +2023/11/03 23:42:14 - mmengine - INFO - Iter(train) [346500/640000] base_lr: 8.8159e-05 lr: 9.8326e-06 eta: 3 days, 19:10:48 time: 1.1405 data_time: 0.0367 memory: 21521 grad_norm: 3.0053 loss: 1.3181 caption_loss_cls: 2.2287 grounding_loss_reg: 2.7417 detection_loss_cls: 0.0357 detection_loss_reg: 0.3418 semantic_segmentation_loss_cls: 0.0091 instance_segmentation_loss_cls: 0.0366 instance_segmentation_loss_reg: 0.3453 instance_segmentation_loss_poly: 0.8958 +2023/11/03 23:51:16 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231103_070902 +2023/11/03 23:51:16 - mmengine - INFO - Iter(train) [347000/640000] base_lr: 8.7918e-05 lr: 9.8107e-06 eta: 3 days, 18:59:53 time: 1.1299 data_time: 0.0364 memory: 21521 grad_norm: 3.0831 loss: 1.3296 caption_loss_cls: 2.2306 grounding_loss_reg: 2.7400 detection_loss_cls: 0.0356 detection_loss_reg: 0.3414 semantic_segmentation_loss_cls: 0.0091 instance_segmentation_loss_cls: 0.0365 instance_segmentation_loss_reg: 0.3446 instance_segmentation_loss_poly: 0.8942 +2023/11/03 23:51:16 - mmengine - INFO - Saving checkpoint at 347000 iterations +2023/11/04 00:00:47 - mmengine - INFO - Iter(train) [347500/640000] base_lr: 8.7677e-05 lr: 9.7888e-06 eta: 3 days, 18:51:37 time: 1.1306 data_time: 0.0360 memory: 21521 grad_norm: 3.0686 loss: 1.3080 caption_loss_cls: 2.2304 grounding_loss_reg: 2.7370 detection_loss_cls: 0.0355 detection_loss_reg: 0.3415 semantic_segmentation_loss_cls: 0.0091 instance_segmentation_loss_cls: 0.0363 instance_segmentation_loss_reg: 0.3445 instance_segmentation_loss_poly: 0.8940 +2023/11/04 00:10:42 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231103_070902 +2023/11/04 00:10:42 - mmengine - INFO - Iter(train) [348000/640000] base_lr: 8.7436e-05 lr: 9.7669e-06 eta: 3 days, 18:45:38 time: 1.1370 data_time: 0.0365 memory: 21521 grad_norm: 3.1022 loss: 1.3113 caption_loss_cls: 2.2302 grounding_loss_reg: 2.7363 detection_loss_cls: 0.0354 detection_loss_reg: 0.3413 semantic_segmentation_loss_cls: 0.0091 instance_segmentation_loss_cls: 0.0363 instance_segmentation_loss_reg: 0.3443 instance_segmentation_loss_poly: 0.8935 +2023/11/04 00:10:42 - mmengine - INFO - Saving checkpoint at 348000 iterations +2023/11/04 00:19:32 - mmengine - INFO - Iter(train) [348500/640000] base_lr: 8.7196e-05 lr: 9.7451e-06 eta: 3 days, 18:33:33 time: 1.1266 data_time: 0.0362 memory: 21521 grad_norm: 3.1385 loss: 1.3191 caption_loss_cls: 2.2318 grounding_loss_reg: 2.7328 detection_loss_cls: 0.0353 detection_loss_reg: 0.3413 semantic_segmentation_loss_cls: 0.0091 instance_segmentation_loss_cls: 0.0362 instance_segmentation_loss_reg: 0.3438 instance_segmentation_loss_poly: 0.8927 +2023/11/04 00:29:26 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231103_070902 +2023/11/04 00:29:26 - mmengine - INFO - Iter(train) [349000/640000] base_lr: 8.6955e-05 lr: 9.7232e-06 eta: 3 days, 18:27:23 time: 1.1327 data_time: 0.0365 memory: 21521 grad_norm: 3.1402 loss: 1.3258 caption_loss_cls: 2.2329 grounding_loss_reg: 2.7305 detection_loss_cls: 0.0352 detection_loss_reg: 0.3402 semantic_segmentation_loss_cls: 0.0091 instance_segmentation_loss_cls: 0.0361 instance_segmentation_loss_reg: 0.3432 instance_segmentation_loss_poly: 0.8904 +2023/11/04 00:29:26 - mmengine - INFO - Saving checkpoint at 349000 iterations +2023/11/04 00:38:50 - mmengine - INFO - Iter(train) [349500/640000] base_lr: 8.6715e-05 lr: 9.7013e-06 eta: 3 days, 18:18:26 time: 1.1318 data_time: 0.0365 memory: 21521 grad_norm: 3.1508 loss: 1.3320 caption_loss_cls: 2.2302 grounding_loss_reg: 2.7311 detection_loss_cls: 0.0352 detection_loss_reg: 0.3405 semantic_segmentation_loss_cls: 0.0091 instance_segmentation_loss_cls: 0.0361 instance_segmentation_loss_reg: 0.3425 instance_segmentation_loss_poly: 0.8883 +2023/11/04 00:48:12 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231103_070902 +2023/11/04 00:48:12 - mmengine - INFO - Iter(train) [350000/640000] base_lr: 8.6474e-05 lr: 9.6795e-06 eta: 3 days, 18:09:18 time: 1.1299 data_time: 0.0366 memory: 21521 grad_norm: 3.1458 loss: 1.3275 caption_loss_cls: 2.2322 grounding_loss_reg: 2.7299 detection_loss_cls: 0.0351 detection_loss_reg: 0.3400 semantic_segmentation_loss_cls: 0.0091 instance_segmentation_loss_cls: 0.0360 instance_segmentation_loss_reg: 0.3410 instance_segmentation_loss_poly: 0.8860 +2023/11/04 00:48:12 - mmengine - INFO - Saving checkpoint at 350000 iterations +2023/11/04 00:57:19 - mmengine - INFO - Iter(train) [350500/640000] base_lr: 8.6234e-05 lr: 9.6576e-06 eta: 3 days, 17:58:51 time: 1.1258 data_time: 0.0364 memory: 21521 grad_norm: 3.1622 loss: 1.3151 caption_loss_cls: 2.2318 grounding_loss_reg: 2.7295 detection_loss_cls: 0.0351 detection_loss_reg: 0.3399 semantic_segmentation_loss_cls: 0.0091 instance_segmentation_loss_cls: 0.0358 instance_segmentation_loss_reg: 0.3398 instance_segmentation_loss_poly: 0.8831 +2023/11/04 01:06:38 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231103_070902 +2023/11/04 01:06:38 - mmengine - INFO - Iter(train) [351000/640000] base_lr: 8.5994e-05 lr: 9.6358e-06 eta: 3 days, 17:49:26 time: 1.1298 data_time: 0.0366 memory: 21521 grad_norm: 3.1482 loss: 1.3246 caption_loss_cls: 2.2345 grounding_loss_reg: 2.7279 detection_loss_cls: 0.0350 detection_loss_reg: 0.3386 semantic_segmentation_loss_cls: 0.0091 instance_segmentation_loss_cls: 0.0357 instance_segmentation_loss_reg: 0.3392 instance_segmentation_loss_poly: 0.8825 +2023/11/04 01:06:38 - mmengine - INFO - Saving checkpoint at 351000 iterations +2023/11/04 01:15:52 - mmengine - INFO - Iter(train) [351500/640000] base_lr: 8.5754e-05 lr: 9.6140e-06 eta: 3 days, 17:39:39 time: 1.1257 data_time: 0.0366 memory: 21521 grad_norm: 3.1626 loss: 1.3379 caption_loss_cls: 2.2343 grounding_loss_reg: 2.7277 detection_loss_cls: 0.0349 detection_loss_reg: 0.3375 semantic_segmentation_loss_cls: 0.0091 instance_segmentation_loss_cls: 0.0356 instance_segmentation_loss_reg: 0.3391 instance_segmentation_loss_poly: 0.8818 +2023/11/04 01:24:10 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231103_070902 +2023/11/04 01:24:10 - mmengine - INFO - Iter(train) [352000/640000] base_lr: 8.5513e-05 lr: 9.5921e-06 eta: 3 days, 17:24:59 time: 1.1013 data_time: 0.0355 memory: 21521 grad_norm: 3.1916 loss: 1.3429 caption_loss_cls: 2.2352 grounding_loss_reg: 2.7278 detection_loss_cls: 0.0349 detection_loss_reg: 0.3377 semantic_segmentation_loss_cls: 0.0091 instance_segmentation_loss_cls: 0.0356 instance_segmentation_loss_reg: 0.3386 instance_segmentation_loss_poly: 0.8811 +2023/11/04 01:24:10 - mmengine - INFO - Saving checkpoint at 352000 iterations +2023/11/04 01:33:49 - mmengine - INFO - Iter(train) [352500/640000] base_lr: 8.5274e-05 lr: 9.5703e-06 eta: 3 days, 17:17:23 time: 1.1137 data_time: 0.0357 memory: 21521 grad_norm: 3.1439 loss: 1.3280 caption_loss_cls: 2.2401 grounding_loss_reg: 2.7247 detection_loss_cls: 0.0348 detection_loss_reg: 0.3376 semantic_segmentation_loss_cls: 0.0091 instance_segmentation_loss_cls: 0.0356 instance_segmentation_loss_reg: 0.3389 instance_segmentation_loss_poly: 0.8815 +2023/11/04 01:42:59 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231103_070902 +2023/11/04 01:42:59 - mmengine - INFO - Iter(train) [353000/640000] base_lr: 8.5034e-05 lr: 9.5485e-06 eta: 3 days, 17:07:14 time: 1.1025 data_time: 0.0354 memory: 21521 grad_norm: 3.2016 loss: 1.3321 caption_loss_cls: 2.2372 grounding_loss_reg: 2.7208 detection_loss_cls: 0.0347 detection_loss_reg: 0.3358 semantic_segmentation_loss_cls: 0.0090 instance_segmentation_loss_cls: 0.0355 instance_segmentation_loss_reg: 0.3386 instance_segmentation_loss_poly: 0.8804 +2023/11/04 01:42:59 - mmengine - INFO - Saving checkpoint at 353000 iterations +2023/11/04 01:52:11 - mmengine - INFO - Iter(train) [353500/640000] base_lr: 8.4794e-05 lr: 9.5267e-06 eta: 3 days, 16:57:21 time: 1.0997 data_time: 0.0351 memory: 21521 grad_norm: 3.1888 loss: 1.3195 caption_loss_cls: 2.2340 grounding_loss_reg: 2.7187 detection_loss_cls: 0.0346 detection_loss_reg: 0.3358 semantic_segmentation_loss_cls: 0.0090 instance_segmentation_loss_cls: 0.0354 instance_segmentation_loss_reg: 0.3376 instance_segmentation_loss_poly: 0.8790 +2023/11/04 02:01:07 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231103_070902 +2023/11/04 02:01:07 - mmengine - INFO - Iter(train) [354000/640000] base_lr: 8.4554e-05 lr: 9.5049e-06 eta: 3 days, 16:46:05 time: 1.0930 data_time: 0.0346 memory: 21521 grad_norm: 3.2187 loss: 1.3174 caption_loss_cls: 2.2329 grounding_loss_reg: 2.7161 detection_loss_cls: 0.0345 detection_loss_reg: 0.3358 semantic_segmentation_loss_cls: 0.0090 instance_segmentation_loss_cls: 0.0353 instance_segmentation_loss_reg: 0.3362 instance_segmentation_loss_poly: 0.8761 +2023/11/04 02:01:07 - mmengine - INFO - Saving checkpoint at 354000 iterations +2023/11/04 02:11:11 - mmengine - INFO - Iter(train) [354500/640000] base_lr: 8.4315e-05 lr: 9.4832e-06 eta: 3 days, 16:40:27 time: 1.1073 data_time: 0.0353 memory: 21521 grad_norm: 3.1791 loss: 1.3213 caption_loss_cls: 2.2326 grounding_loss_reg: 2.7169 detection_loss_cls: 0.0345 detection_loss_reg: 0.3356 semantic_segmentation_loss_cls: 0.0090 instance_segmentation_loss_cls: 0.0354 instance_segmentation_loss_reg: 0.3366 instance_segmentation_loss_poly: 0.8764 +2023/11/04 02:20:32 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231103_070902 +2023/11/04 02:20:32 - mmengine - INFO - Iter(train) [355000/640000] base_lr: 8.4075e-05 lr: 9.4614e-06 eta: 3 days, 16:31:16 time: 1.1078 data_time: 0.0353 memory: 21521 grad_norm: 3.1677 loss: 1.3116 caption_loss_cls: 2.2319 grounding_loss_reg: 2.7137 detection_loss_cls: 0.0344 detection_loss_reg: 0.3349 semantic_segmentation_loss_cls: 0.0090 instance_segmentation_loss_cls: 0.0353 instance_segmentation_loss_reg: 0.3361 instance_segmentation_loss_poly: 0.8743 +2023/11/04 02:20:32 - mmengine - INFO - Saving checkpoint at 355000 iterations +2023/11/04 02:30:09 - mmengine - INFO - Iter(train) [355500/640000] base_lr: 8.3836e-05 lr: 9.4396e-06 eta: 3 days, 16:23:24 time: 1.1136 data_time: 0.0355 memory: 21521 grad_norm: 3.1574 loss: 1.3079 caption_loss_cls: 2.2283 grounding_loss_reg: 2.7122 detection_loss_cls: 0.0344 detection_loss_reg: 0.3351 semantic_segmentation_loss_cls: 0.0090 instance_segmentation_loss_cls: 0.0353 instance_segmentation_loss_reg: 0.3359 instance_segmentation_loss_poly: 0.8731 +2023/11/04 02:39:38 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231103_070902 +2023/11/04 02:39:38 - mmengine - INFO - Iter(train) [356000/640000] base_lr: 8.3597e-05 lr: 9.4179e-06 eta: 3 days, 16:14:46 time: 1.1313 data_time: 0.0369 memory: 21521 grad_norm: 3.1182 loss: 1.2994 caption_loss_cls: 2.2308 grounding_loss_reg: 2.7110 detection_loss_cls: 0.0342 detection_loss_reg: 0.3345 semantic_segmentation_loss_cls: 0.0090 instance_segmentation_loss_cls: 0.0353 instance_segmentation_loss_reg: 0.3364 instance_segmentation_loss_poly: 0.8743 +2023/11/04 02:39:38 - mmengine - INFO - Saving checkpoint at 356000 iterations +2023/11/04 02:49:20 - mmengine - INFO - Iter(train) [356500/640000] base_lr: 8.3358e-05 lr: 9.3961e-06 eta: 3 days, 16:07:11 time: 1.1319 data_time: 0.0371 memory: 21521 grad_norm: 3.1466 loss: 1.3070 caption_loss_cls: 2.2288 grounding_loss_reg: 2.7097 detection_loss_cls: 0.0342 detection_loss_reg: 0.3345 semantic_segmentation_loss_cls: 0.0090 instance_segmentation_loss_cls: 0.0354 instance_segmentation_loss_reg: 0.3374 instance_segmentation_loss_poly: 0.8761 +2023/11/04 02:58:56 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231103_070902 +2023/11/04 02:58:56 - mmengine - INFO - Iter(train) [357000/640000] base_lr: 8.3118e-05 lr: 9.3744e-06 eta: 3 days, 15:59:10 time: 1.1388 data_time: 0.0374 memory: 21521 grad_norm: 3.1132 loss: 1.3006 caption_loss_cls: 2.2244 grounding_loss_reg: 2.7083 detection_loss_cls: 0.0342 detection_loss_reg: 0.3348 semantic_segmentation_loss_cls: 0.0090 instance_segmentation_loss_cls: 0.0354 instance_segmentation_loss_reg: 0.3377 instance_segmentation_loss_poly: 0.8767 +2023/11/04 02:58:56 - mmengine - INFO - Saving checkpoint at 357000 iterations +2023/11/04 03:08:44 - mmengine - INFO - Iter(train) [357500/640000] base_lr: 8.2880e-05 lr: 9.3527e-06 eta: 3 days, 15:51:58 time: 1.1476 data_time: 0.0381 memory: 21521 grad_norm: 3.1022 loss: 1.3117 caption_loss_cls: 2.2237 grounding_loss_reg: 2.7073 detection_loss_cls: 0.0343 detection_loss_reg: 0.3356 semantic_segmentation_loss_cls: 0.0090 instance_segmentation_loss_cls: 0.0357 instance_segmentation_loss_reg: 0.3399 instance_segmentation_loss_poly: 0.8810 +2023/11/04 03:17:34 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231103_070902 +2023/11/04 03:17:34 - mmengine - INFO - Iter(train) [358000/640000] base_lr: 8.2641e-05 lr: 9.3310e-06 eta: 3 days, 15:40:19 time: 1.1461 data_time: 0.0380 memory: 21521 grad_norm: 3.0641 loss: 1.3064 caption_loss_cls: 2.2217 grounding_loss_reg: 2.7041 detection_loss_cls: 0.0344 detection_loss_reg: 0.3358 semantic_segmentation_loss_cls: 0.0090 instance_segmentation_loss_cls: 0.0356 instance_segmentation_loss_reg: 0.3389 instance_segmentation_loss_poly: 0.8785 +2023/11/04 03:17:34 - mmengine - INFO - Saving checkpoint at 358000 iterations +2023/11/04 03:27:01 - mmengine - INFO - Iter(train) [358500/640000] base_lr: 8.2402e-05 lr: 9.3093e-06 eta: 3 days, 15:31:33 time: 1.1369 data_time: 0.0375 memory: 21521 grad_norm: 3.0778 loss: 1.3085 caption_loss_cls: 2.2186 grounding_loss_reg: 2.7040 detection_loss_cls: 0.0346 detection_loss_reg: 0.3379 semantic_segmentation_loss_cls: 0.0090 instance_segmentation_loss_cls: 0.0356 instance_segmentation_loss_reg: 0.3395 instance_segmentation_loss_poly: 0.8787 +2023/11/04 03:36:03 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231103_070902 +2023/11/04 03:36:03 - mmengine - INFO - Iter(train) [359000/640000] base_lr: 8.2163e-05 lr: 9.2876e-06 eta: 3 days, 15:20:52 time: 1.1321 data_time: 0.0374 memory: 21521 grad_norm: 3.0910 loss: 1.3130 caption_loss_cls: 2.2205 grounding_loss_reg: 2.7019 detection_loss_cls: 0.0347 detection_loss_reg: 0.3381 semantic_segmentation_loss_cls: 0.0090 instance_segmentation_loss_cls: 0.0357 instance_segmentation_loss_reg: 0.3400 instance_segmentation_loss_poly: 0.8800 +2023/11/04 03:36:03 - mmengine - INFO - Saving checkpoint at 359000 iterations +2023/11/04 03:45:41 - mmengine - INFO - Iter(train) [359500/640000] base_lr: 8.1925e-05 lr: 9.2659e-06 eta: 3 days, 15:12:54 time: 1.1323 data_time: 0.0380 memory: 21521 grad_norm: 3.1093 loss: 1.3131 caption_loss_cls: 2.2216 grounding_loss_reg: 2.6975 detection_loss_cls: 0.0347 detection_loss_reg: 0.3379 semantic_segmentation_loss_cls: 0.0089 instance_segmentation_loss_cls: 0.0356 instance_segmentation_loss_reg: 0.3392 instance_segmentation_loss_poly: 0.8772 +2023/11/04 03:55:20 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231103_070902 +2023/11/04 03:55:20 - mmengine - INFO - Iter(train) [360000/640000] base_lr: 8.1687e-05 lr: 9.2442e-06 eta: 3 days, 15:04:55 time: 1.1348 data_time: 0.0373 memory: 21521 grad_norm: 3.1139 loss: 1.3112 caption_loss_cls: 2.2196 grounding_loss_reg: 2.6977 detection_loss_cls: 0.0347 detection_loss_reg: 0.3385 semantic_segmentation_loss_cls: 0.0089 instance_segmentation_loss_cls: 0.0356 instance_segmentation_loss_reg: 0.3398 instance_segmentation_loss_poly: 0.8784 +2023/11/04 03:55:20 - mmengine - INFO - Saving checkpoint at 360000 iterations +2023/11/04 04:04:01 - mmengine - INFO - Evaluating bbox... +2023/11/04 04:04:57 - mmengine - INFO - bbox_mAP_copypaste: 0.437 0.610 0.473 0.264 0.487 0.579 +2023/11/04 04:04:57 - mmengine - INFO - Evaluating segm... +2023/11/04 04:06:10 - mmengine - INFO - segm_mAP_copypaste: 0.291 0.527 0.282 0.142 0.335 0.461 +2023/11/04 04:10:30 - mmengine - INFO - per class results: +2023/11/04 04:10:30 - mmengine - INFO - ++---------------------+-------+-------+ +| Class | IoU | Acc | ++---------------------+-------+-------+ +| wall | 75.59 | 85.94 | +| building | 80.76 | 89.33 | +| sky | 92.28 | 97.85 | +| floor | 79.69 | 88.97 | +| tree | 72.31 | 85.85 | +| ceiling | 81.78 | 93.92 | +| road | 81.54 | 87.57 | +| bed | 85.64 | 94.93 | +| windowpane | 59.49 | 81.07 | +| grass | 64.58 | 81.15 | +| cabinet | 57.61 | 72.34 | +| sidewalk | 65.15 | 78.92 | +| person | 78.25 | 92.44 | +| earth | 33.02 | 39.42 | +| door | 50.79 | 65.72 | +| table | 57.62 | 77.12 | +| mountain | 51.26 | 74.11 | +| plant | 50.56 | 61.89 | +| curtain | 72.67 | 83.65 | +| chair | 54.8 | 75.12 | +| car | 80.23 | 88.99 | +| water | 48.4 | 64.06 | +| painting | 67.3 | 85.48 | +| sofa | 64.14 | 76.54 | +| shelf | 39.95 | 56.4 | +| house | 44.27 | 67.19 | +| sea | 50.77 | 80.64 | +| mirror | 62.52 | 70.6 | +| rug | 65.81 | 72.06 | +| field | 33.3 | 56.63 | +| armchair | 40.2 | 55.77 | +| seat | 57.6 | 69.95 | +| fence | 41.43 | 68.33 | +| desk | 43.81 | 62.11 | +| rock | 23.36 | 30.41 | +| wardrobe | 43.13 | 60.5 | +| lamp | 57.47 | 76.0 | +| bathtub | 74.11 | 81.31 | +| railing | 31.28 | 47.4 | +| cushion | 53.66 | 63.82 | +| base | 26.68 | 53.19 | +| box | 20.41 | 25.61 | +| column | 47.11 | 57.8 | +| signboard | 36.38 | 50.25 | +| chest of drawers | 40.52 | 57.46 | +| counter | 35.16 | 43.95 | +| sand | 39.77 | 66.73 | +| sink | 68.3 | 77.39 | +| skyscraper | 65.77 | 86.15 | +| fireplace | 70.89 | 87.95 | +| refrigerator | 69.77 | 85.22 | +| grandstand | 28.8 | 68.61 | +| path | 30.29 | 42.9 | +| stairs | 22.32 | 28.59 | +| runway | 68.17 | 95.32 | +| case | 41.34 | 60.29 | +| pool table | 91.0 | 95.41 | +| pillow | 54.55 | 74.45 | +| screen door | 67.53 | 77.28 | +| stairway | 28.9 | 33.25 | +| river | 18.37 | 29.89 | +| bridge | 51.57 | 61.43 | +| bookcase | 32.37 | 56.81 | +| blind | 29.92 | 33.7 | +| coffee table | 58.44 | 79.72 | +| toilet | 84.61 | 88.93 | +| flower | 31.52 | 49.97 | +| book | 45.66 | 69.78 | +| hill | 3.75 | 5.78 | +| bench | 47.6 | 56.2 | +| countertop | 51.05 | 59.98 | +| stove | 74.58 | 79.95 | +| palm | 47.29 | 67.68 | +| kitchen island | 35.55 | 69.77 | +| computer | 63.69 | 77.14 | +| swivel chair | 44.17 | 60.65 | +| boat | 57.63 | 81.08 | +| bar | 28.14 | 30.95 | +| arcade machine | 44.04 | 45.84 | +| hovel | 7.94 | 10.29 | +| bus | 84.79 | 95.7 | +| towel | 62.01 | 70.87 | +| light | 43.36 | 49.87 | +| truck | 39.97 | 54.31 | +| tower | 48.62 | 69.12 | +| chandelier | 61.23 | 76.89 | +| awning | 17.14 | 19.81 | +| streetlight | 24.55 | 31.76 | +| booth | 63.82 | 67.76 | +| television receiver | 70.26 | 82.26 | +| airplane | 55.09 | 65.47 | +| dirt track | 0.94 | 2.48 | +| apparel | 28.8 | 45.91 | +| pole | 30.08 | 43.39 | +| land | 4.0 | 5.47 | +| bannister | 13.84 | 21.68 | +| escalator | 38.55 | 52.83 | +| ottoman | 47.81 | 66.38 | +| bottle | 23.75 | 31.25 | +| buffet | 39.04 | 46.29 | +| poster | 25.78 | 42.41 | +| stage | 21.34 | 30.22 | +| van | 33.05 | 47.06 | +| ship | 14.53 | 14.86 | +| fountain | 5.24 | 5.35 | +| conveyer belt | 63.62 | 86.21 | +| canopy | 32.48 | 43.51 | +| washer | 69.49 | 70.12 | +| plaything | 28.03 | 43.86 | +| swimming pool | 53.28 | 73.41 | +| stool | 35.0 | 48.54 | +| barrel | 13.66 | 14.27 | +| basket | 26.53 | 36.8 | +| waterfall | 55.76 | 71.47 | +| tent | 77.49 | 98.67 | +| bag | 12.85 | 15.43 | +| minibike | 71.88 | 83.21 | +| cradle | 70.75 | 91.0 | +| oven | 34.3 | 40.49 | +| ball | 36.02 | 42.58 | +| food | 47.6 | 53.4 | +| step | 14.27 | 16.46 | +| tank | 44.81 | 48.21 | +| trade name | 25.97 | 34.46 | +| microwave | 81.44 | 88.2 | +| pot | 44.0 | 50.12 | +| animal | 62.65 | 68.52 | +| bicycle | 55.04 | 72.2 | +| lake | 42.77 | 44.09 | +| dishwasher | 54.26 | 72.25 | +| screen | 45.67 | 58.09 | +| blanket | 7.2 | 8.46 | +| sculpture | 50.46 | 67.11 | +| hood | 51.47 | 57.78 | +| sconce | 33.17 | 42.8 | +| vase | 37.9 | 55.17 | +| traffic light | 34.93 | 52.04 | +| tray | 9.62 | 15.32 | +| ashcan | 31.22 | 50.58 | +| fan | 48.2 | 59.04 | +| pier | 54.35 | 67.97 | +| crt screen | 8.15 | 33.75 | +| plate | 53.88 | 73.27 | +| monitor | 10.35 | 14.42 | +| bulletin board | 21.46 | 36.84 | +| shower | 4.11 | 4.32 | +| radiator | 49.02 | 59.78 | +| glass | 15.36 | 16.72 | +| clock | 24.61 | 32.2 | +| flag | 31.54 | 36.45 | ++---------------------+-------+-------+ +2023/11/04 04:10:45 - mmengine - INFO - Iter(val) [209/209] coco/bbox_mAP: 0.4370 coco/bbox_mAP_50: 0.6100 coco/bbox_mAP_75: 0.4730 coco/bbox_mAP_s: 0.2640 coco/bbox_mAP_m: 0.4870 coco/bbox_mAP_l: 0.5790 coco/segm_mAP: 0.2910 coco/segm_mAP_50: 0.5270 coco/segm_mAP_75: 0.2820 coco/segm_mAP_s: 0.1420 coco/segm_mAP_m: 0.3350 coco/segm_mAP_l: 0.4610 Bleu_1: 0.7361 Bleu_2: 0.5703 Bleu_3: 0.4285 Bleu_4: 0.3206 METEOR: 0.2567 ROUGE_L: 0.5400 CIDEr: 1.0016 SPICE: 0.1881 aAcc: 81.4100 mIoU: 45.6900 mAcc: 58.0900 visual-grounding/miou: 0.7587 visual-grounding/acc: 0.8306 data_time: 0.0049 time: 0.5271 +2023/11/04 04:20:04 - mmengine - INFO - Iter(train) [360500/640000] base_lr: 8.1448e-05 lr: 9.2226e-06 eta: 3 days, 14:55:36 time: 1.1294 data_time: 0.0337 memory: 21521 grad_norm: 3.0851 loss: 1.2928 caption_loss_cls: 2.2190 grounding_loss_reg: 2.6970 detection_loss_cls: 0.0346 detection_loss_reg: 0.3381 semantic_segmentation_loss_cls: 0.0089 instance_segmentation_loss_cls: 0.0356 instance_segmentation_loss_reg: 0.3399 instance_segmentation_loss_poly: 0.8792 +2023/11/04 04:29:28 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231103_070902 +2023/11/04 04:29:28 - mmengine - INFO - Iter(train) [361000/640000] base_lr: 8.1210e-05 lr: 9.2009e-06 eta: 3 days, 14:46:31 time: 1.1261 data_time: 0.0336 memory: 21521 grad_norm: 3.1150 loss: 1.3007 caption_loss_cls: 2.2216 grounding_loss_reg: 2.6951 detection_loss_cls: 0.0347 detection_loss_reg: 0.3387 semantic_segmentation_loss_cls: 0.0089 instance_segmentation_loss_cls: 0.0356 instance_segmentation_loss_reg: 0.3391 instance_segmentation_loss_poly: 0.8772 +2023/11/04 04:29:28 - mmengine - INFO - Saving checkpoint at 361000 iterations +2023/11/04 04:39:02 - mmengine - INFO - Iter(train) [361500/640000] base_lr: 8.0972e-05 lr: 9.1793e-06 eta: 3 days, 14:38:13 time: 1.1229 data_time: 0.0332 memory: 21521 grad_norm: 3.1132 loss: 1.2911 caption_loss_cls: 2.2208 grounding_loss_reg: 2.6934 detection_loss_cls: 0.0347 detection_loss_reg: 0.3388 semantic_segmentation_loss_cls: 0.0089 instance_segmentation_loss_cls: 0.0356 instance_segmentation_loss_reg: 0.3392 instance_segmentation_loss_poly: 0.8771 +2023/11/04 04:48:10 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231103_070902 +2023/11/04 04:48:10 - mmengine - INFO - Iter(train) [362000/640000] base_lr: 8.0734e-05 lr: 9.1577e-06 eta: 3 days, 14:28:01 time: 1.1275 data_time: 0.0335 memory: 21521 grad_norm: 3.1059 loss: 1.2934 caption_loss_cls: 2.2212 grounding_loss_reg: 2.6938 detection_loss_cls: 0.0346 detection_loss_reg: 0.3380 semantic_segmentation_loss_cls: 0.0089 instance_segmentation_loss_cls: 0.0358 instance_segmentation_loss_reg: 0.3409 instance_segmentation_loss_poly: 0.8806 +2023/11/04 04:48:10 - mmengine - INFO - Saving checkpoint at 362000 iterations +2023/11/04 04:57:25 - mmengine - INFO - Iter(train) [362500/640000] base_lr: 8.0496e-05 lr: 9.1360e-06 eta: 3 days, 14:18:18 time: 1.1242 data_time: 0.0334 memory: 21521 grad_norm: 3.1230 loss: 1.2931 caption_loss_cls: 2.2217 grounding_loss_reg: 2.6960 detection_loss_cls: 0.0346 detection_loss_reg: 0.3380 semantic_segmentation_loss_cls: 0.0089 instance_segmentation_loss_cls: 0.0357 instance_segmentation_loss_reg: 0.3405 instance_segmentation_loss_poly: 0.8796 +2023/11/04 05:06:43 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231103_070902 +2023/11/04 05:06:43 - mmengine - INFO - Iter(train) [363000/640000] base_lr: 8.0259e-05 lr: 9.1144e-06 eta: 3 days, 14:08:50 time: 1.1284 data_time: 0.0334 memory: 21521 grad_norm: 3.1043 loss: 1.2888 caption_loss_cls: 2.2169 grounding_loss_reg: 2.6944 detection_loss_cls: 0.0347 detection_loss_reg: 0.3390 semantic_segmentation_loss_cls: 0.0089 instance_segmentation_loss_cls: 0.0358 instance_segmentation_loss_reg: 0.3415 instance_segmentation_loss_poly: 0.8815 +2023/11/04 05:06:43 - mmengine - INFO - Saving checkpoint at 363000 iterations +2023/11/04 05:16:08 - mmengine - INFO - Iter(train) [363500/640000] base_lr: 8.0021e-05 lr: 9.0928e-06 eta: 3 days, 13:59:50 time: 1.1251 data_time: 0.0328 memory: 21521 grad_norm: 3.1113 loss: 1.2894 caption_loss_cls: 2.2138 grounding_loss_reg: 2.6911 detection_loss_cls: 0.0347 detection_loss_reg: 0.3387 semantic_segmentation_loss_cls: 0.0089 instance_segmentation_loss_cls: 0.0357 instance_segmentation_loss_reg: 0.3410 instance_segmentation_loss_poly: 0.8804 +2023/11/04 05:25:39 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231103_070902 +2023/11/04 05:25:39 - mmengine - INFO - Iter(train) [364000/640000] base_lr: 7.9784e-05 lr: 9.0713e-06 eta: 3 days, 13:51:13 time: 1.1231 data_time: 0.0327 memory: 21521 grad_norm: 3.0884 loss: 1.2842 caption_loss_cls: 2.2157 grounding_loss_reg: 2.6889 detection_loss_cls: 0.0347 detection_loss_reg: 0.3392 semantic_segmentation_loss_cls: 0.0089 instance_segmentation_loss_cls: 0.0355 instance_segmentation_loss_reg: 0.3404 instance_segmentation_loss_poly: 0.8791 +2023/11/04 05:25:39 - mmengine - INFO - Saving checkpoint at 364000 iterations +2023/11/04 05:35:13 - mmengine - INFO - Iter(train) [364500/640000] base_lr: 7.9547e-05 lr: 9.0497e-06 eta: 3 days, 13:42:48 time: 1.1265 data_time: 0.0361 memory: 21521 grad_norm: 3.1276 loss: 1.2991 caption_loss_cls: 2.2122 grounding_loss_reg: 2.6878 detection_loss_cls: 0.0346 detection_loss_reg: 0.3387 semantic_segmentation_loss_cls: 0.0089 instance_segmentation_loss_cls: 0.0354 instance_segmentation_loss_reg: 0.3394 instance_segmentation_loss_poly: 0.8765 +2023/11/04 05:44:42 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231103_070902 +2023/11/04 05:44:42 - mmengine - INFO - Iter(train) [365000/640000] base_lr: 7.9309e-05 lr: 9.0281e-06 eta: 3 days, 13:34:04 time: 1.1280 data_time: 0.0364 memory: 21521 grad_norm: 3.0888 loss: 1.2997 caption_loss_cls: 2.2156 grounding_loss_reg: 2.6889 detection_loss_cls: 0.0346 detection_loss_reg: 0.3385 semantic_segmentation_loss_cls: 0.0089 instance_segmentation_loss_cls: 0.0354 instance_segmentation_loss_reg: 0.3398 instance_segmentation_loss_poly: 0.8768 +2023/11/04 05:44:42 - mmengine - INFO - Saving checkpoint at 365000 iterations +2023/11/04 05:54:11 - mmengine - INFO - Iter(train) [365500/640000] base_lr: 7.9072e-05 lr: 9.0066e-06 eta: 3 days, 13:25:20 time: 1.1266 data_time: 0.0364 memory: 21521 grad_norm: 3.1120 loss: 1.3000 caption_loss_cls: 2.2161 grounding_loss_reg: 2.6905 detection_loss_cls: 0.0345 detection_loss_reg: 0.3380 semantic_segmentation_loss_cls: 0.0089 instance_segmentation_loss_cls: 0.0354 instance_segmentation_loss_reg: 0.3395 instance_segmentation_loss_poly: 0.8749 +2023/11/04 06:03:48 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231103_070902 +2023/11/04 06:03:48 - mmengine - INFO - Iter(train) [366000/640000] base_lr: 7.8836e-05 lr: 8.9851e-06 eta: 3 days, 13:17:04 time: 1.1339 data_time: 0.0368 memory: 21521 grad_norm: 3.1157 loss: 1.3061 caption_loss_cls: 2.2104 grounding_loss_reg: 2.6892 detection_loss_cls: 0.0347 detection_loss_reg: 0.3389 semantic_segmentation_loss_cls: 0.0089 instance_segmentation_loss_cls: 0.0355 instance_segmentation_loss_reg: 0.3398 instance_segmentation_loss_poly: 0.8761 +2023/11/04 06:03:48 - mmengine - INFO - Saving checkpoint at 366000 iterations +2023/11/04 06:12:51 - mmengine - INFO - Iter(train) [366500/640000] base_lr: 7.8599e-05 lr: 8.9635e-06 eta: 3 days, 13:06:33 time: 1.1308 data_time: 0.0368 memory: 21521 grad_norm: 3.1296 loss: 1.3102 caption_loss_cls: 2.2102 grounding_loss_reg: 2.6888 detection_loss_cls: 0.0346 detection_loss_reg: 0.3381 semantic_segmentation_loss_cls: 0.0089 instance_segmentation_loss_cls: 0.0356 instance_segmentation_loss_reg: 0.3405 instance_segmentation_loss_poly: 0.8773 +2023/11/04 06:22:20 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231103_070902 +2023/11/04 06:22:20 - mmengine - INFO - Iter(train) [367000/640000] base_lr: 7.8362e-05 lr: 8.9420e-06 eta: 3 days, 12:57:45 time: 1.1335 data_time: 0.0369 memory: 21521 grad_norm: 3.1581 loss: 1.3104 caption_loss_cls: 2.2098 grounding_loss_reg: 2.6872 detection_loss_cls: 0.0346 detection_loss_reg: 0.3382 semantic_segmentation_loss_cls: 0.0089 instance_segmentation_loss_cls: 0.0357 instance_segmentation_loss_reg: 0.3407 instance_segmentation_loss_poly: 0.8785 +2023/11/04 06:22:20 - mmengine - INFO - Saving checkpoint at 367000 iterations +2023/11/04 06:31:36 - mmengine - INFO - Iter(train) [367500/640000] base_lr: 7.8126e-05 lr: 8.9205e-06 eta: 3 days, 12:48:07 time: 1.1312 data_time: 0.0369 memory: 21521 grad_norm: 3.1412 loss: 1.3054 caption_loss_cls: 2.2074 grounding_loss_reg: 2.6874 detection_loss_cls: 0.0347 detection_loss_reg: 0.3389 semantic_segmentation_loss_cls: 0.0089 instance_segmentation_loss_cls: 0.0357 instance_segmentation_loss_reg: 0.3408 instance_segmentation_loss_poly: 0.8786 +2023/11/04 06:40:38 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231103_070902 +2023/11/04 06:40:38 - mmengine - INFO - Iter(train) [368000/640000] base_lr: 7.7889e-05 lr: 8.8990e-06 eta: 3 days, 12:37:38 time: 1.1241 data_time: 0.0367 memory: 21521 grad_norm: 3.1597 loss: 1.3077 caption_loss_cls: 2.2035 grounding_loss_reg: 2.6890 detection_loss_cls: 0.0348 detection_loss_reg: 0.3396 semantic_segmentation_loss_cls: 0.0089 instance_segmentation_loss_cls: 0.0357 instance_segmentation_loss_reg: 0.3405 instance_segmentation_loss_poly: 0.8777 +2023/11/04 06:40:38 - mmengine - INFO - Saving checkpoint at 368000 iterations +2023/11/04 06:50:12 - mmengine - INFO - Iter(train) [368500/640000] base_lr: 7.7653e-05 lr: 8.8776e-06 eta: 3 days, 12:29:08 time: 1.1241 data_time: 0.0369 memory: 21521 grad_norm: 3.1576 loss: 1.3148 caption_loss_cls: 2.2048 grounding_loss_reg: 2.6901 detection_loss_cls: 0.0348 detection_loss_reg: 0.3390 semantic_segmentation_loss_cls: 0.0089 instance_segmentation_loss_cls: 0.0359 instance_segmentation_loss_reg: 0.3414 instance_segmentation_loss_poly: 0.8790 +2023/11/04 06:59:37 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231103_070902 +2023/11/04 06:59:37 - mmengine - INFO - Iter(train) [369000/640000] base_lr: 7.7417e-05 lr: 8.8561e-06 eta: 3 days, 12:20:07 time: 1.1231 data_time: 0.0366 memory: 21521 grad_norm: 3.1733 loss: 1.3075 caption_loss_cls: 2.2044 grounding_loss_reg: 2.6878 detection_loss_cls: 0.0348 detection_loss_reg: 0.3395 semantic_segmentation_loss_cls: 0.0089 instance_segmentation_loss_cls: 0.0358 instance_segmentation_loss_reg: 0.3412 instance_segmentation_loss_poly: 0.8784 +2023/11/04 06:59:37 - mmengine - INFO - Saving checkpoint at 369000 iterations +2023/11/04 14:04:36 - mmengine - INFO - Iter(train) [369500/640000] base_lr: 7.7181e-05 lr: 8.8347e-06 eta: 3 days, 12:02:51 time: 1.1206 data_time: 0.0331 memory: 21521 grad_norm: 3.1677 loss: 1.3073 caption_loss_cls: 2.2050 grounding_loss_reg: 2.6857 detection_loss_cls: 0.0347 detection_loss_reg: 0.3389 semantic_segmentation_loss_cls: 0.0089 instance_segmentation_loss_cls: 0.0360 instance_segmentation_loss_reg: 0.3425 instance_segmentation_loss_poly: 0.8816 +2023/11/04 14:13:30 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231104_135211 +2023/11/04 14:13:30 - mmengine - INFO - Iter(train) [370000/640000] base_lr: 7.6945e-05 lr: 8.8132e-06 eta: 3 days, 9:57:10 time: 1.1098 data_time: 0.0326 memory: 21519 grad_norm: 3.1957 loss: 1.2946 caption_loss_cls: 2.2006 grounding_loss_reg: 2.6814 detection_loss_cls: 0.0348 detection_loss_reg: 0.3394 semantic_segmentation_loss_cls: 0.0089 instance_segmentation_loss_cls: 0.0361 instance_segmentation_loss_reg: 0.3429 instance_segmentation_loss_poly: 0.8822 +2023/11/04 14:13:30 - mmengine - INFO - Saving checkpoint at 370000 iterations +2023/11/04 14:22:39 - mmengine - INFO - Iter(train) [370500/640000] base_lr: 7.6710e-05 lr: 8.7918e-06 eta: 3 days, 9:56:11 time: 1.1116 data_time: 0.0324 memory: 21519 grad_norm: 3.1807 loss: 1.2816 caption_loss_cls: 2.1964 grounding_loss_reg: 2.6802 detection_loss_cls: 0.0348 detection_loss_reg: 0.3401 semantic_segmentation_loss_cls: 0.0089 instance_segmentation_loss_cls: 0.0360 instance_segmentation_loss_reg: 0.3427 instance_segmentation_loss_poly: 0.8819 +2023/11/04 14:31:13 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231104_135211 +2023/11/04 14:31:13 - mmengine - INFO - Iter(train) [371000/640000] base_lr: 7.6474e-05 lr: 8.7704e-06 eta: 3 days, 8:30:25 time: 1.0977 data_time: 0.0320 memory: 21519 grad_norm: 3.1828 loss: 1.2829 caption_loss_cls: 2.1976 grounding_loss_reg: 2.6773 detection_loss_cls: 0.0349 detection_loss_reg: 0.3397 semantic_segmentation_loss_cls: 0.0089 instance_segmentation_loss_cls: 0.0359 instance_segmentation_loss_reg: 0.3425 instance_segmentation_loss_poly: 0.8817 +2023/11/04 14:31:13 - mmengine - INFO - Saving checkpoint at 371000 iterations +2023/11/04 14:40:27 - mmengine - INFO - Iter(train) [371500/640000] base_lr: 7.6239e-05 lr: 8.7490e-06 eta: 3 days, 8:47:53 time: 1.0972 data_time: 0.0317 memory: 21519 grad_norm: 3.1566 loss: 1.2744 caption_loss_cls: 2.1926 grounding_loss_reg: 2.6750 detection_loss_cls: 0.0349 detection_loss_reg: 0.3398 semantic_segmentation_loss_cls: 0.0088 instance_segmentation_loss_cls: 0.0358 instance_segmentation_loss_reg: 0.3415 instance_segmentation_loss_poly: 0.8800 +2023/11/04 14:49:40 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231104_135211 +2023/11/04 14:49:40 - mmengine - INFO - Iter(train) [372000/640000] base_lr: 7.6004e-05 lr: 8.7276e-06 eta: 3 days, 8:55:50 time: 1.1000 data_time: 0.0318 memory: 21519 grad_norm: 3.1630 loss: 1.2695 caption_loss_cls: 2.1860 grounding_loss_reg: 2.6717 detection_loss_cls: 0.0349 detection_loss_reg: 0.3399 semantic_segmentation_loss_cls: 0.0088 instance_segmentation_loss_cls: 0.0358 instance_segmentation_loss_reg: 0.3427 instance_segmentation_loss_poly: 0.8829 +2023/11/04 14:49:40 - mmengine - INFO - Saving checkpoint at 372000 iterations +2023/11/04 14:59:11 - mmengine - INFO - Iter(train) [372500/640000] base_lr: 7.5769e-05 lr: 8.7063e-06 eta: 3 days, 9:21:38 time: 1.0994 data_time: 0.0313 memory: 21519 grad_norm: 3.1304 loss: 1.2486 caption_loss_cls: 2.1852 grounding_loss_reg: 2.6693 detection_loss_cls: 0.0349 detection_loss_reg: 0.3397 semantic_segmentation_loss_cls: 0.0088 instance_segmentation_loss_cls: 0.0358 instance_segmentation_loss_reg: 0.3423 instance_segmentation_loss_poly: 0.8829 +2023/11/04 15:08:15 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231104_135211 +2023/11/04 15:08:15 - mmengine - INFO - Iter(train) [373000/640000] base_lr: 7.5534e-05 lr: 8.6849e-06 eta: 3 days, 9:08:05 time: 1.0940 data_time: 0.0313 memory: 21519 grad_norm: 3.1596 loss: 1.2534 caption_loss_cls: 2.1879 grounding_loss_reg: 2.6687 detection_loss_cls: 0.0349 detection_loss_reg: 0.3400 semantic_segmentation_loss_cls: 0.0088 instance_segmentation_loss_cls: 0.0355 instance_segmentation_loss_reg: 0.3412 instance_segmentation_loss_poly: 0.8800 +2023/11/04 15:08:15 - mmengine - INFO - Saving checkpoint at 373000 iterations +2023/11/04 15:17:36 - mmengine - INFO - Iter(train) [373500/640000] base_lr: 7.5299e-05 lr: 8.6636e-06 eta: 3 days, 9:12:55 time: 1.0944 data_time: 0.0348 memory: 21519 grad_norm: 3.1722 loss: 1.2564 caption_loss_cls: 2.1874 grounding_loss_reg: 2.6696 detection_loss_cls: 0.0349 detection_loss_reg: 0.3402 semantic_segmentation_loss_cls: 0.0088 instance_segmentation_loss_cls: 0.0356 instance_segmentation_loss_reg: 0.3423 instance_segmentation_loss_poly: 0.8820 +2023/11/04 15:25:29 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231104_135211 +2023/11/04 15:25:29 - mmengine - INFO - Iter(train) [374000/640000] base_lr: 7.5065e-05 lr: 8.6422e-06 eta: 3 days, 7:56:25 time: 1.0792 data_time: 0.0345 memory: 21519 grad_norm: 3.2353 loss: 1.2806 caption_loss_cls: 2.1859 grounding_loss_reg: 2.6678 detection_loss_cls: 0.0348 detection_loss_reg: 0.3398 semantic_segmentation_loss_cls: 0.0088 instance_segmentation_loss_cls: 0.0356 instance_segmentation_loss_reg: 0.3429 instance_segmentation_loss_poly: 0.8827 +2023/11/04 15:25:29 - mmengine - INFO - Saving checkpoint at 374000 iterations +2023/11/04 15:35:16 - mmengine - INFO - Iter(train) [374500/640000] base_lr: 7.4830e-05 lr: 8.6209e-06 eta: 3 days, 8:23:33 time: 1.0884 data_time: 0.0349 memory: 21519 grad_norm: 3.2547 loss: 1.2846 caption_loss_cls: 2.1863 grounding_loss_reg: 2.6678 detection_loss_cls: 0.0348 detection_loss_reg: 0.3397 semantic_segmentation_loss_cls: 0.0088 instance_segmentation_loss_cls: 0.0355 instance_segmentation_loss_reg: 0.3429 instance_segmentation_loss_poly: 0.8826 +2023/11/04 15:44:40 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231104_135211 +2023/11/04 15:44:40 - mmengine - INFO - Iter(train) [375000/640000] base_lr: 7.4596e-05 lr: 8.5996e-06 eta: 3 days, 8:28:21 time: 1.1011 data_time: 0.0351 memory: 21519 grad_norm: 3.2072 loss: 1.2695 caption_loss_cls: 2.1870 grounding_loss_reg: 2.6654 detection_loss_cls: 0.0348 detection_loss_reg: 0.3409 semantic_segmentation_loss_cls: 0.0087 instance_segmentation_loss_cls: 0.0355 instance_segmentation_loss_reg: 0.3427 instance_segmentation_loss_poly: 0.8830 +2023/11/04 15:44:40 - mmengine - INFO - Saving checkpoint at 375000 iterations +2023/11/04 15:54:07 - mmengine - INFO - Iter(train) [375500/640000] base_lr: 7.4362e-05 lr: 8.5783e-06 eta: 3 days, 8:33:02 time: 1.1045 data_time: 0.0354 memory: 21519 grad_norm: 3.2610 loss: 1.2810 caption_loss_cls: 2.1848 grounding_loss_reg: 2.6650 detection_loss_cls: 0.0347 detection_loss_reg: 0.3403 semantic_segmentation_loss_cls: 0.0087 instance_segmentation_loss_cls: 0.0354 instance_segmentation_loss_reg: 0.3425 instance_segmentation_loss_poly: 0.8823 +2023/11/04 16:03:05 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231104_135211 +2023/11/04 16:03:05 - mmengine - INFO - Iter(train) [376000/640000] base_lr: 7.4128e-05 lr: 8.5571e-06 eta: 3 days, 8:17:17 time: 1.1006 data_time: 0.0352 memory: 21519 grad_norm: 3.2639 loss: 1.2832 caption_loss_cls: 2.1808 grounding_loss_reg: 2.6618 detection_loss_cls: 0.0346 detection_loss_reg: 0.3395 semantic_segmentation_loss_cls: 0.0087 instance_segmentation_loss_cls: 0.0352 instance_segmentation_loss_reg: 0.3414 instance_segmentation_loss_poly: 0.8804 +2023/11/04 16:03:05 - mmengine - INFO - Saving checkpoint at 376000 iterations +2023/11/04 16:11:30 - mmengine - INFO - Iter(train) [376500/640000] base_lr: 7.3894e-05 lr: 8.5358e-06 eta: 3 days, 7:43:07 time: 1.0841 data_time: 0.0349 memory: 21519 grad_norm: 3.3402 loss: 1.2972 caption_loss_cls: 2.1814 grounding_loss_reg: 2.6620 detection_loss_cls: 0.0347 detection_loss_reg: 0.3396 semantic_segmentation_loss_cls: 0.0087 instance_segmentation_loss_cls: 0.0350 instance_segmentation_loss_reg: 0.3406 instance_segmentation_loss_poly: 0.8792 +2023/11/04 16:19:57 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231104_135211 +2023/11/04 16:19:57 - mmengine - INFO - Iter(train) [377000/640000] base_lr: 7.3660e-05 lr: 8.5146e-06 eta: 3 days, 7:13:15 time: 1.0748 data_time: 0.0347 memory: 21519 grad_norm: 3.3723 loss: 1.3024 caption_loss_cls: 2.1767 grounding_loss_reg: 2.6602 detection_loss_cls: 0.0346 detection_loss_reg: 0.3390 semantic_segmentation_loss_cls: 0.0087 instance_segmentation_loss_cls: 0.0349 instance_segmentation_loss_reg: 0.3406 instance_segmentation_loss_poly: 0.8792 +2023/11/04 16:19:57 - mmengine - INFO - Saving checkpoint at 377000 iterations +2023/11/04 16:28:35 - mmengine - INFO - Iter(train) [377500/640000] base_lr: 7.3427e-05 lr: 8.4934e-06 eta: 3 days, 6:51:52 time: 1.0641 data_time: 0.0344 memory: 21519 grad_norm: 3.4040 loss: 1.3101 caption_loss_cls: 2.1759 grounding_loss_reg: 2.6569 detection_loss_cls: 0.0345 detection_loss_reg: 0.3380 semantic_segmentation_loss_cls: 0.0087 instance_segmentation_loss_cls: 0.0348 instance_segmentation_loss_reg: 0.3388 instance_segmentation_loss_poly: 0.8756 +2023/11/04 16:37:35 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231104_135211 +2023/11/04 16:37:35 - mmengine - INFO - Iter(train) [378000/640000] base_lr: 7.3194e-05 lr: 8.4722e-06 eta: 3 days, 6:42:12 time: 1.0808 data_time: 0.0349 memory: 21519 grad_norm: 3.3389 loss: 1.2979 caption_loss_cls: 2.1749 grounding_loss_reg: 2.6550 detection_loss_cls: 0.0345 detection_loss_reg: 0.3390 semantic_segmentation_loss_cls: 0.0087 instance_segmentation_loss_cls: 0.0348 instance_segmentation_loss_reg: 0.3391 instance_segmentation_loss_poly: 0.8771 +2023/11/04 16:37:35 - mmengine - INFO - Saving checkpoint at 378000 iterations +2023/11/04 16:46:31 - mmengine - INFO - Iter(train) [378500/640000] base_lr: 7.2961e-05 lr: 8.4510e-06 eta: 3 days, 6:30:49 time: 1.0682 data_time: 0.0346 memory: 21519 grad_norm: 3.3413 loss: 1.2970 caption_loss_cls: 2.1765 grounding_loss_reg: 2.6540 detection_loss_cls: 0.0343 detection_loss_reg: 0.3371 semantic_segmentation_loss_cls: 0.0087 instance_segmentation_loss_cls: 0.0346 instance_segmentation_loss_reg: 0.3386 instance_segmentation_loss_poly: 0.8768 +2023/11/04 16:55:13 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231104_135211 +2023/11/04 16:55:13 - mmengine - INFO - Iter(train) [379000/640000] base_lr: 7.2728e-05 lr: 8.4298e-06 eta: 3 days, 6:13:43 time: 1.0577 data_time: 0.0346 memory: 21519 grad_norm: 3.4327 loss: 1.3155 caption_loss_cls: 2.1740 grounding_loss_reg: 2.6565 detection_loss_cls: 0.0342 detection_loss_reg: 0.3360 semantic_segmentation_loss_cls: 0.0087 instance_segmentation_loss_cls: 0.0344 instance_segmentation_loss_reg: 0.3373 instance_segmentation_loss_poly: 0.8738 +2023/11/04 16:55:13 - mmengine - INFO - Saving checkpoint at 379000 iterations +2023/11/04 17:04:30 - mmengine - INFO - Iter(train) [379500/640000] base_lr: 7.2495e-05 lr: 8.4086e-06 eta: 3 days, 6:11:46 time: 1.0551 data_time: 0.0344 memory: 21519 grad_norm: 3.4405 loss: 1.3162 caption_loss_cls: 2.1708 grounding_loss_reg: 2.6571 detection_loss_cls: 0.0341 detection_loss_reg: 0.3359 semantic_segmentation_loss_cls: 0.0087 instance_segmentation_loss_cls: 0.0344 instance_segmentation_loss_reg: 0.3380 instance_segmentation_loss_poly: 0.8749 +2023/11/04 17:12:56 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231104_135211 +2023/11/04 17:12:56 - mmengine - INFO - Iter(train) [380000/640000] base_lr: 7.2262e-05 lr: 8.3875e-06 eta: 3 days, 5:49:04 time: 1.0471 data_time: 0.0343 memory: 21519 grad_norm: 3.4693 loss: 1.3231 caption_loss_cls: 2.1731 grounding_loss_reg: 2.6540 detection_loss_cls: 0.0340 detection_loss_reg: 0.3350 semantic_segmentation_loss_cls: 0.0087 instance_segmentation_loss_cls: 0.0344 instance_segmentation_loss_reg: 0.3375 instance_segmentation_loss_poly: 0.8739 +2023/11/04 17:12:56 - mmengine - INFO - Saving checkpoint at 380000 iterations +2023/11/04 17:21:35 - mmengine - INFO - Evaluating bbox... +2023/11/04 17:22:32 - mmengine - INFO - bbox_mAP_copypaste: 0.435 0.606 0.471 0.272 0.482 0.575 +2023/11/04 17:22:32 - mmengine - INFO - Evaluating segm... +2023/11/04 17:23:44 - mmengine - INFO - segm_mAP_copypaste: 0.292 0.526 0.282 0.146 0.334 0.451 +2023/11/04 17:28:03 - mmengine - INFO - per class results: +2023/11/04 17:28:03 - mmengine - INFO - ++---------------------+-------+-------+ +| Class | IoU | Acc | ++---------------------+-------+-------+ +| wall | 75.64 | 88.14 | +| building | 79.37 | 92.06 | +| sky | 93.01 | 97.12 | +| floor | 79.09 | 89.83 | +| tree | 72.41 | 86.69 | +| ceiling | 82.82 | 92.17 | +| road | 83.4 | 87.77 | +| bed | 86.84 | 94.89 | +| windowpane | 58.73 | 71.61 | +| grass | 66.88 | 78.11 | +| cabinet | 58.33 | 70.03 | +| sidewalk | 64.02 | 80.79 | +| person | 79.31 | 90.28 | +| earth | 40.02 | 55.41 | +| door | 47.95 | 63.93 | +| table | 59.17 | 73.94 | +| mountain | 54.93 | 65.12 | +| plant | 48.89 | 59.14 | +| curtain | 72.27 | 81.44 | +| chair | 53.91 | 66.94 | +| car | 80.98 | 89.22 | +| water | 51.41 | 63.83 | +| painting | 69.82 | 83.05 | +| sofa | 64.73 | 85.22 | +| shelf | 40.06 | 60.9 | +| house | 36.5 | 56.29 | +| sea | 53.38 | 80.95 | +| mirror | 61.71 | 72.87 | +| rug | 57.91 | 62.27 | +| field | 33.21 | 55.09 | +| armchair | 40.07 | 56.9 | +| seat | 61.86 | 80.55 | +| fence | 40.77 | 58.26 | +| desk | 46.33 | 65.84 | +| rock | 38.48 | 60.24 | +| wardrobe | 44.01 | 57.27 | +| lamp | 58.88 | 74.65 | +| bathtub | 68.71 | 79.6 | +| railing | 27.48 | 43.65 | +| cushion | 50.94 | 60.56 | +| base | 27.38 | 32.34 | +| box | 23.41 | 31.58 | +| column | 47.82 | 57.99 | +| signboard | 35.17 | 49.27 | +| chest of drawers | 41.73 | 55.54 | +| counter | 33.11 | 47.46 | +| sand | 39.51 | 46.46 | +| sink | 69.02 | 75.16 | +| skyscraper | 63.74 | 77.05 | +| fireplace | 75.12 | 86.71 | +| refrigerator | 73.2 | 85.93 | +| grandstand | 45.44 | 68.73 | +| path | 27.24 | 44.34 | +| stairs | 32.52 | 40.42 | +| runway | 75.28 | 94.25 | +| case | 39.93 | 53.37 | +| pool table | 87.89 | 95.08 | +| pillow | 51.83 | 62.5 | +| screen door | 44.59 | 48.71 | +| stairway | 30.4 | 47.55 | +| river | 21.87 | 37.28 | +| bridge | 37.85 | 49.01 | +| bookcase | 35.84 | 55.47 | +| blind | 29.35 | 34.45 | +| coffee table | 59.96 | 77.79 | +| toilet | 81.57 | 86.28 | +| flower | 34.01 | 51.59 | +| book | 45.72 | 69.56 | +| hill | 12.7 | 18.94 | +| bench | 50.03 | 66.24 | +| countertop | 51.82 | 68.61 | +| stove | 76.82 | 83.22 | +| palm | 45.51 | 57.39 | +| kitchen island | 37.17 | 81.55 | +| computer | 72.08 | 84.61 | +| swivel chair | 46.23 | 68.5 | +| boat | 66.7 | 79.6 | +| bar | 44.9 | 56.91 | +| arcade machine | 40.1 | 43.83 | +| hovel | 6.67 | 8.81 | +| bus | 76.94 | 94.71 | +| towel | 63.92 | 73.12 | +| light | 36.34 | 38.68 | +| truck | 35.94 | 44.26 | +| tower | 16.11 | 19.3 | +| chandelier | 63.76 | 76.76 | +| awning | 10.21 | 10.4 | +| streetlight | 27.28 | 34.86 | +| booth | 36.16 | 69.63 | +| television receiver | 66.56 | 80.22 | +| airplane | 53.87 | 65.59 | +| dirt track | 1.11 | 6.94 | +| apparel | 29.18 | 46.08 | +| pole | 28.96 | 40.3 | +| land | 2.31 | 3.28 | +| bannister | 11.94 | 16.73 | +| escalator | 35.35 | 54.72 | +| ottoman | 47.38 | 68.43 | +| bottle | 25.63 | 32.93 | +| buffet | 35.43 | 42.19 | +| poster | 27.92 | 42.7 | +| stage | 13.08 | 28.86 | +| van | 35.14 | 48.86 | +| ship | 20.66 | 23.55 | +| fountain | 20.15 | 23.52 | +| conveyer belt | 74.95 | 89.7 | +| canopy | 34.6 | 39.05 | +| washer | 58.88 | 62.84 | +| plaything | 26.44 | 34.36 | +| swimming pool | 41.72 | 76.14 | +| stool | 36.92 | 51.85 | +| barrel | 17.09 | 53.45 | +| basket | 23.85 | 32.0 | +| waterfall | 50.39 | 58.15 | +| tent | 87.93 | 98.13 | +| bag | 11.66 | 13.76 | +| minibike | 65.17 | 73.63 | +| cradle | 70.02 | 83.86 | +| oven | 31.66 | 52.41 | +| ball | 44.37 | 52.13 | +| food | 50.27 | 59.74 | +| step | 15.86 | 19.62 | +| tank | 35.09 | 48.61 | +| trade name | 14.82 | 16.09 | +| microwave | 67.13 | 71.18 | +| pot | 46.27 | 52.31 | +| animal | 58.39 | 60.95 | +| bicycle | 54.36 | 70.17 | +| lake | 38.54 | 39.39 | +| dishwasher | 49.94 | 71.74 | +| screen | 64.18 | 74.91 | +| blanket | 9.96 | 11.87 | +| sculpture | 52.47 | 70.41 | +| hood | 52.62 | 56.34 | +| sconce | 33.51 | 41.19 | +| vase | 38.12 | 53.62 | +| traffic light | 33.16 | 50.48 | +| tray | 10.15 | 16.63 | +| ashcan | 40.71 | 53.53 | +| fan | 52.06 | 67.92 | +| pier | 38.57 | 66.78 | +| crt screen | 15.62 | 41.41 | +| plate | 55.25 | 68.45 | +| monitor | 33.17 | 37.67 | +| bulletin board | 25.98 | 28.38 | +| shower | 1.68 | 14.23 | +| radiator | 49.09 | 56.03 | +| glass | 17.02 | 19.36 | +| clock | 27.91 | 34.46 | +| flag | 25.63 | 28.29 | ++---------------------+-------+-------+ +2023/11/04 17:28:19 - mmengine - INFO - Iter(val) [209/209] coco/bbox_mAP: 0.4350 coco/bbox_mAP_50: 0.6060 coco/bbox_mAP_75: 0.4710 coco/bbox_mAP_s: 0.2720 coco/bbox_mAP_m: 0.4820 coco/bbox_mAP_l: 0.5750 coco/segm_mAP: 0.2920 coco/segm_mAP_50: 0.5260 coco/segm_mAP_75: 0.2820 coco/segm_mAP_s: 0.1460 coco/segm_mAP_m: 0.3340 coco/segm_mAP_l: 0.4510 Bleu_1: 0.7337 Bleu_2: 0.5701 Bleu_3: 0.4309 Bleu_4: 0.3238 METEOR: 0.2631 ROUGE_L: 0.5433 CIDEr: 1.0300 SPICE: 0.1931 aAcc: 81.6100 mIoU: 45.6700 mAcc: 57.8200 visual-grounding/miou: 0.7702 visual-grounding/acc: 0.8453 data_time: 0.0098 time: 0.5273 +2023/11/04 17:37:05 - mmengine - INFO - Iter(train) [380500/640000] base_lr: 7.2030e-05 lr: 8.3663e-06 eta: 3 days, 5:35:55 time: 1.0528 data_time: 0.0316 memory: 21521 grad_norm: 3.4642 loss: 1.3217 caption_loss_cls: 2.1671 grounding_loss_reg: 2.6513 detection_loss_cls: 0.0340 detection_loss_reg: 0.3348 semantic_segmentation_loss_cls: 0.0087 instance_segmentation_loss_cls: 0.0344 instance_segmentation_loss_reg: 0.3374 instance_segmentation_loss_poly: 0.8735 +2023/11/04 17:45:00 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231104_135211 +2023/11/04 17:45:59 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231104_135211 +2023/11/04 17:45:59 - mmengine - INFO - Iter(train) [381000/640000] base_lr: 7.1798e-05 lr: 8.3452e-06 eta: 3 days, 5:25:12 time: 1.0596 data_time: 0.0317 memory: 21521 grad_norm: 3.4200 loss: 1.3096 caption_loss_cls: 2.1654 grounding_loss_reg: 2.6477 detection_loss_cls: 0.0341 detection_loss_reg: 0.3360 semantic_segmentation_loss_cls: 0.0087 instance_segmentation_loss_cls: 0.0345 instance_segmentation_loss_reg: 0.3388 instance_segmentation_loss_poly: 0.8764 +2023/11/04 17:45:59 - mmengine - INFO - Saving checkpoint at 381000 iterations +2023/11/04 17:55:27 - mmengine - INFO - Iter(train) [381500/640000] base_lr: 7.1566e-05 lr: 8.3241e-06 eta: 3 days, 5:26:19 time: 1.0718 data_time: 0.0321 memory: 21521 grad_norm: 3.3943 loss: 1.3029 caption_loss_cls: 2.1632 grounding_loss_reg: 2.6472 detection_loss_cls: 0.0342 detection_loss_reg: 0.3374 semantic_segmentation_loss_cls: 0.0087 instance_segmentation_loss_cls: 0.0345 instance_segmentation_loss_reg: 0.3398 instance_segmentation_loss_poly: 0.8789 +2023/11/04 18:04:44 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231104_135211 +2023/11/04 18:04:44 - mmengine - INFO - Iter(train) [382000/640000] base_lr: 7.1334e-05 lr: 8.3031e-06 eta: 3 days, 5:23:15 time: 1.0762 data_time: 0.0320 memory: 21521 grad_norm: 3.4043 loss: 1.3009 caption_loss_cls: 2.1592 grounding_loss_reg: 2.6460 detection_loss_cls: 0.0342 detection_loss_reg: 0.3378 semantic_segmentation_loss_cls: 0.0087 instance_segmentation_loss_cls: 0.0345 instance_segmentation_loss_reg: 0.3395 instance_segmentation_loss_poly: 0.8783 +2023/11/04 18:04:44 - mmengine - INFO - Saving checkpoint at 382000 iterations +2023/11/04 18:14:10 - mmengine - INFO - Iter(train) [382500/640000] base_lr: 7.1102e-05 lr: 8.2820e-06 eta: 3 days, 5:22:31 time: 1.0838 data_time: 0.0322 memory: 21521 grad_norm: 3.3926 loss: 1.3018 caption_loss_cls: 2.1579 grounding_loss_reg: 2.6416 detection_loss_cls: 0.0342 detection_loss_reg: 0.3377 semantic_segmentation_loss_cls: 0.0087 instance_segmentation_loss_cls: 0.0345 instance_segmentation_loss_reg: 0.3394 instance_segmentation_loss_poly: 0.8784 +2023/11/04 18:22:56 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231104_135211 +2023/11/04 18:22:56 - mmengine - INFO - Iter(train) [383000/640000] base_lr: 7.0870e-05 lr: 8.2609e-06 eta: 3 days, 5:08:46 time: 1.0847 data_time: 0.0321 memory: 21521 grad_norm: 3.3516 loss: 1.2888 caption_loss_cls: 2.1578 grounding_loss_reg: 2.6389 detection_loss_cls: 0.0342 detection_loss_reg: 0.3376 semantic_segmentation_loss_cls: 0.0087 instance_segmentation_loss_cls: 0.0344 instance_segmentation_loss_reg: 0.3385 instance_segmentation_loss_poly: 0.8761 +2023/11/04 18:22:56 - mmengine - INFO - Saving checkpoint at 383000 iterations +2023/11/04 18:32:17 - mmengine - INFO - Iter(train) [383500/640000] base_lr: 7.0639e-05 lr: 8.2399e-06 eta: 3 days, 5:05:36 time: 1.0856 data_time: 0.0321 memory: 21521 grad_norm: 3.2934 loss: 1.2720 caption_loss_cls: 2.1535 grounding_loss_reg: 2.6370 detection_loss_cls: 0.0342 detection_loss_reg: 0.3374 semantic_segmentation_loss_cls: 0.0087 instance_segmentation_loss_cls: 0.0344 instance_segmentation_loss_reg: 0.3382 instance_segmentation_loss_poly: 0.8758 +2023/11/04 18:41:02 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231104_135211 +2023/11/04 18:41:02 - mmengine - INFO - Iter(train) [384000/640000] base_lr: 7.0408e-05 lr: 8.2189e-06 eta: 3 days, 4:52:10 time: 1.0906 data_time: 0.0323 memory: 21521 grad_norm: 3.2837 loss: 1.2643 caption_loss_cls: 2.1512 grounding_loss_reg: 2.6334 detection_loss_cls: 0.0341 detection_loss_reg: 0.3368 semantic_segmentation_loss_cls: 0.0087 instance_segmentation_loss_cls: 0.0342 instance_segmentation_loss_reg: 0.3371 instance_segmentation_loss_poly: 0.8730 +2023/11/04 18:41:02 - mmengine - INFO - Saving checkpoint at 384000 iterations +2023/11/04 18:50:15 - mmengine - INFO - Iter(train) [384500/640000] base_lr: 7.0177e-05 lr: 8.1979e-06 eta: 3 days, 4:46:21 time: 1.0967 data_time: 0.0355 memory: 21521 grad_norm: 3.2792 loss: 1.2715 caption_loss_cls: 2.1479 grounding_loss_reg: 2.6346 detection_loss_cls: 0.0340 detection_loss_reg: 0.3362 semantic_segmentation_loss_cls: 0.0086 instance_segmentation_loss_cls: 0.0343 instance_segmentation_loss_reg: 0.3372 instance_segmentation_loss_poly: 0.8734 +2023/11/04 18:59:20 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231104_135211 +2023/11/04 18:59:20 - mmengine - INFO - Iter(train) [385000/640000] base_lr: 6.9946e-05 lr: 8.1769e-06 eta: 3 days, 4:38:21 time: 1.0995 data_time: 0.0355 memory: 21521 grad_norm: 3.2843 loss: 1.2735 caption_loss_cls: 2.1466 grounding_loss_reg: 2.6313 detection_loss_cls: 0.0340 detection_loss_reg: 0.3359 semantic_segmentation_loss_cls: 0.0086 instance_segmentation_loss_cls: 0.0341 instance_segmentation_loss_reg: 0.3363 instance_segmentation_loss_poly: 0.8717 +2023/11/04 18:59:20 - mmengine - INFO - Saving checkpoint at 385000 iterations +2023/11/04 19:08:04 - mmengine - INFO - Iter(train) [385500/640000] base_lr: 6.9715e-05 lr: 8.1559e-06 eta: 3 days, 4:24:58 time: 1.0887 data_time: 0.0353 memory: 21521 grad_norm: 3.3178 loss: 1.2780 caption_loss_cls: 2.1489 grounding_loss_reg: 2.6286 detection_loss_cls: 0.0338 detection_loss_reg: 0.3349 semantic_segmentation_loss_cls: 0.0086 instance_segmentation_loss_cls: 0.0341 instance_segmentation_loss_reg: 0.3367 instance_segmentation_loss_poly: 0.8725 +2023/11/04 19:16:38 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231104_135211 +2023/11/04 19:16:38 - mmengine - INFO - Iter(train) [386000/640000] base_lr: 6.9485e-05 lr: 8.1350e-06 eta: 3 days, 4:09:10 time: 1.0777 data_time: 0.0350 memory: 21521 grad_norm: 3.3097 loss: 1.2748 caption_loss_cls: 2.1461 grounding_loss_reg: 2.6266 detection_loss_cls: 0.0339 detection_loss_reg: 0.3356 semantic_segmentation_loss_cls: 0.0086 instance_segmentation_loss_cls: 0.0342 instance_segmentation_loss_reg: 0.3375 instance_segmentation_loss_poly: 0.8738 +2023/11/04 19:16:38 - mmengine - INFO - Saving checkpoint at 386000 iterations +2023/11/04 19:25:45 - mmengine - INFO - Iter(train) [386500/640000] base_lr: 6.9255e-05 lr: 8.1141e-06 eta: 3 days, 4:01:52 time: 1.0729 data_time: 0.0348 memory: 21521 grad_norm: 3.2975 loss: 1.2682 caption_loss_cls: 2.1435 grounding_loss_reg: 2.6258 detection_loss_cls: 0.0338 detection_loss_reg: 0.3348 semantic_segmentation_loss_cls: 0.0086 instance_segmentation_loss_cls: 0.0340 instance_segmentation_loss_reg: 0.3366 instance_segmentation_loss_poly: 0.8711 +2023/11/04 19:34:35 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231104_135211 +2023/11/04 19:34:35 - mmengine - INFO - Iter(train) [387000/640000] base_lr: 6.9025e-05 lr: 8.0931e-06 eta: 3 days, 3:50:30 time: 1.0740 data_time: 0.0348 memory: 21521 grad_norm: 3.3237 loss: 1.2781 caption_loss_cls: 2.1439 grounding_loss_reg: 2.6263 detection_loss_cls: 0.0337 detection_loss_reg: 0.3347 semantic_segmentation_loss_cls: 0.0086 instance_segmentation_loss_cls: 0.0339 instance_segmentation_loss_reg: 0.3358 instance_segmentation_loss_poly: 0.8689 +2023/11/04 19:34:35 - mmengine - INFO - Saving checkpoint at 387000 iterations +2023/11/04 19:43:54 - mmengine - INFO - Iter(train) [387500/640000] base_lr: 6.8795e-05 lr: 8.0722e-06 eta: 3 days, 3:45:48 time: 1.0736 data_time: 0.0348 memory: 21521 grad_norm: 3.3539 loss: 1.2881 caption_loss_cls: 2.1434 grounding_loss_reg: 2.6244 detection_loss_cls: 0.0337 detection_loss_reg: 0.3348 semantic_segmentation_loss_cls: 0.0086 instance_segmentation_loss_cls: 0.0339 instance_segmentation_loss_reg: 0.3358 instance_segmentation_loss_poly: 0.8689 +2023/11/04 19:52:58 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231104_135211 +2023/11/04 19:52:58 - mmengine - INFO - Iter(train) [388000/640000] base_lr: 6.8565e-05 lr: 8.0514e-06 eta: 3 days, 3:37:34 time: 1.0781 data_time: 0.0350 memory: 21521 grad_norm: 3.3585 loss: 1.2916 caption_loss_cls: 2.1443 grounding_loss_reg: 2.6197 detection_loss_cls: 0.0336 detection_loss_reg: 0.3350 semantic_segmentation_loss_cls: 0.0085 instance_segmentation_loss_cls: 0.0339 instance_segmentation_loss_reg: 0.3357 instance_segmentation_loss_poly: 0.8692 +2023/11/04 19:52:58 - mmengine - INFO - Saving checkpoint at 388000 iterations +2023/11/04 20:01:49 - mmengine - INFO - Iter(train) [388500/640000] base_lr: 6.8336e-05 lr: 8.0305e-06 eta: 3 days, 3:26:39 time: 1.0729 data_time: 0.0345 memory: 21521 grad_norm: 3.3458 loss: 1.2792 caption_loss_cls: 2.1383 grounding_loss_reg: 2.6165 detection_loss_cls: 0.0336 detection_loss_reg: 0.3348 semantic_segmentation_loss_cls: 0.0085 instance_segmentation_loss_cls: 0.0338 instance_segmentation_loss_reg: 0.3356 instance_segmentation_loss_poly: 0.8696 +2023/11/04 20:10:43 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231104_135211 +2023/11/04 20:10:43 - mmengine - INFO - Iter(train) [389000/640000] base_lr: 6.8106e-05 lr: 8.0097e-06 eta: 3 days, 3:16:18 time: 1.0701 data_time: 0.0343 memory: 21521 grad_norm: 3.3495 loss: 1.2765 caption_loss_cls: 2.1372 grounding_loss_reg: 2.6151 detection_loss_cls: 0.0334 detection_loss_reg: 0.3335 semantic_segmentation_loss_cls: 0.0085 instance_segmentation_loss_cls: 0.0337 instance_segmentation_loss_reg: 0.3343 instance_segmentation_loss_poly: 0.8676 +2023/11/04 20:10:43 - mmengine - INFO - Saving checkpoint at 389000 iterations +2023/11/04 20:20:10 - mmengine - INFO - Iter(train) [389500/640000] base_lr: 6.7877e-05 lr: 7.9888e-06 eta: 3 days, 3:12:51 time: 1.0809 data_time: 0.0347 memory: 21521 grad_norm: 3.3502 loss: 1.2729 caption_loss_cls: 2.1350 grounding_loss_reg: 2.6163 detection_loss_cls: 0.0336 detection_loss_reg: 0.3348 semantic_segmentation_loss_cls: 0.0085 instance_segmentation_loss_cls: 0.0337 instance_segmentation_loss_reg: 0.3356 instance_segmentation_loss_poly: 0.8695 +2023/11/04 20:29:10 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231104_135211 +2023/11/04 20:29:10 - mmengine - INFO - Iter(train) [390000/640000] base_lr: 6.7648e-05 lr: 7.9680e-06 eta: 3 days, 3:03:38 time: 1.0874 data_time: 0.0348 memory: 21521 grad_norm: 3.3320 loss: 1.2707 caption_loss_cls: 2.1405 grounding_loss_reg: 2.6156 detection_loss_cls: 0.0336 detection_loss_reg: 0.3347 semantic_segmentation_loss_cls: 0.0085 instance_segmentation_loss_cls: 0.0337 instance_segmentation_loss_reg: 0.3356 instance_segmentation_loss_poly: 0.8692 +2023/11/04 20:29:10 - mmengine - INFO - Saving checkpoint at 390000 iterations +2023/11/04 20:37:50 - mmengine - INFO - Iter(train) [390500/640000] base_lr: 6.7420e-05 lr: 7.9472e-06 eta: 3 days, 2:50:30 time: 1.0805 data_time: 0.0349 memory: 21521 grad_norm: 3.3909 loss: 1.2822 caption_loss_cls: 2.1377 grounding_loss_reg: 2.6148 detection_loss_cls: 0.0336 detection_loss_reg: 0.3347 semantic_segmentation_loss_cls: 0.0085 instance_segmentation_loss_cls: 0.0337 instance_segmentation_loss_reg: 0.3357 instance_segmentation_loss_poly: 0.8702 +2023/11/04 20:46:52 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231104_135211 +2023/11/04 20:46:52 - mmengine - INFO - Iter(train) [391000/640000] base_lr: 6.7191e-05 lr: 7.9265e-06 eta: 3 days, 2:41:53 time: 1.0836 data_time: 0.0352 memory: 21521 grad_norm: 3.3598 loss: 1.2794 caption_loss_cls: 2.1353 grounding_loss_reg: 2.6165 detection_loss_cls: 0.0335 detection_loss_reg: 0.3339 semantic_segmentation_loss_cls: 0.0085 instance_segmentation_loss_cls: 0.0338 instance_segmentation_loss_reg: 0.3354 instance_segmentation_loss_poly: 0.8692 +2023/11/04 20:46:52 - mmengine - INFO - Saving checkpoint at 391000 iterations +2023/11/04 20:56:08 - mmengine - INFO - Iter(train) [391500/640000] base_lr: 6.6963e-05 lr: 7.9057e-06 eta: 3 days, 2:35:51 time: 1.0830 data_time: 0.0352 memory: 21521 grad_norm: 3.3984 loss: 1.2864 caption_loss_cls: 2.1390 grounding_loss_reg: 2.6144 detection_loss_cls: 0.0335 detection_loss_reg: 0.3348 semantic_segmentation_loss_cls: 0.0085 instance_segmentation_loss_cls: 0.0337 instance_segmentation_loss_reg: 0.3353 instance_segmentation_loss_poly: 0.8686 +2023/11/04 21:05:19 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231104_135211 +2023/11/04 21:05:19 - mmengine - INFO - Iter(train) [392000/640000] base_lr: 6.6735e-05 lr: 7.8850e-06 eta: 3 days, 2:28:41 time: 1.0847 data_time: 0.0352 memory: 21521 grad_norm: 3.3727 loss: 1.2832 caption_loss_cls: 2.1427 grounding_loss_reg: 2.6153 detection_loss_cls: 0.0335 detection_loss_reg: 0.3345 semantic_segmentation_loss_cls: 0.0085 instance_segmentation_loss_cls: 0.0338 instance_segmentation_loss_reg: 0.3354 instance_segmentation_loss_poly: 0.8679 +2023/11/04 21:05:19 - mmengine - INFO - Saving checkpoint at 392000 iterations +2023/11/04 21:14:45 - mmengine - INFO - Iter(train) [392500/640000] base_lr: 6.6507e-05 lr: 7.8643e-06 eta: 3 days, 2:24:01 time: 1.0932 data_time: 0.0357 memory: 21521 grad_norm: 3.3680 loss: 1.2891 caption_loss_cls: 2.1400 grounding_loss_reg: 2.6142 detection_loss_cls: 0.0334 detection_loss_reg: 0.3346 semantic_segmentation_loss_cls: 0.0085 instance_segmentation_loss_cls: 0.0339 instance_segmentation_loss_reg: 0.3373 instance_segmentation_loss_poly: 0.8700 +2023/11/04 21:23:31 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231104_135211 +2023/11/04 21:23:31 - mmengine - INFO - Iter(train) [393000/640000] base_lr: 6.6279e-05 lr: 7.8436e-06 eta: 3 days, 2:12:23 time: 1.0913 data_time: 0.0359 memory: 21521 grad_norm: 3.3941 loss: 1.3000 caption_loss_cls: 2.1368 grounding_loss_reg: 2.6133 detection_loss_cls: 0.0335 detection_loss_reg: 0.3355 semantic_segmentation_loss_cls: 0.0085 instance_segmentation_loss_cls: 0.0340 instance_segmentation_loss_reg: 0.3372 instance_segmentation_loss_poly: 0.8700 +2023/11/04 21:23:31 - mmengine - INFO - Saving checkpoint at 393000 iterations +2023/11/04 21:33:12 - mmengine - INFO - Iter(train) [393500/640000] base_lr: 6.6052e-05 lr: 7.8229e-06 eta: 3 days, 2:10:05 time: 1.0948 data_time: 0.0358 memory: 21521 grad_norm: 3.3142 loss: 1.2860 caption_loss_cls: 2.1377 grounding_loss_reg: 2.6147 detection_loss_cls: 0.0336 detection_loss_reg: 0.3363 semantic_segmentation_loss_cls: 0.0085 instance_segmentation_loss_cls: 0.0341 instance_segmentation_loss_reg: 0.3381 instance_segmentation_loss_poly: 0.8713 +2023/11/04 21:42:50 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231104_135211 +2023/11/04 21:42:50 - mmengine - INFO - Iter(train) [394000/640000] base_lr: 6.5825e-05 lr: 7.8022e-06 eta: 3 days, 2:06:56 time: 1.1043 data_time: 0.0362 memory: 21521 grad_norm: 3.2907 loss: 1.2791 caption_loss_cls: 2.1369 grounding_loss_reg: 2.6138 detection_loss_cls: 0.0338 detection_loss_reg: 0.3375 semantic_segmentation_loss_cls: 0.0085 instance_segmentation_loss_cls: 0.0341 instance_segmentation_loss_reg: 0.3379 instance_segmentation_loss_poly: 0.8713 +2023/11/04 21:42:50 - mmengine - INFO - Saving checkpoint at 394000 iterations +2023/11/04 21:52:04 - mmengine - INFO - Iter(train) [394500/640000] base_lr: 6.5598e-05 lr: 7.7816e-06 eta: 3 days, 1:59:45 time: 1.1130 data_time: 0.0364 memory: 21521 grad_norm: 3.2706 loss: 1.2765 caption_loss_cls: 2.1342 grounding_loss_reg: 2.6124 detection_loss_cls: 0.0337 detection_loss_reg: 0.3364 semantic_segmentation_loss_cls: 0.0085 instance_segmentation_loss_cls: 0.0342 instance_segmentation_loss_reg: 0.3383 instance_segmentation_loss_poly: 0.8720 +2023/11/04 22:01:34 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231104_135211 +2023/11/04 22:01:34 - mmengine - INFO - Iter(train) [395000/640000] base_lr: 6.5371e-05 lr: 7.7610e-06 eta: 3 days, 1:54:57 time: 1.1199 data_time: 0.0363 memory: 21521 grad_norm: 3.2430 loss: 1.2637 caption_loss_cls: 2.1301 grounding_loss_reg: 2.6124 detection_loss_cls: 0.0338 detection_loss_reg: 0.3371 semantic_segmentation_loss_cls: 0.0085 instance_segmentation_loss_cls: 0.0341 instance_segmentation_loss_reg: 0.3378 instance_segmentation_loss_poly: 0.8703 +2023/11/04 22:01:34 - mmengine - INFO - Saving checkpoint at 395000 iterations +2023/11/04 22:10:38 - mmengine - INFO - Iter(train) [395500/640000] base_lr: 6.5144e-05 lr: 7.7404e-06 eta: 3 days, 1:45:58 time: 1.1167 data_time: 0.0362 memory: 21521 grad_norm: 3.1711 loss: 1.2490 caption_loss_cls: 2.1305 grounding_loss_reg: 2.6113 detection_loss_cls: 0.0338 detection_loss_reg: 0.3363 semantic_segmentation_loss_cls: 0.0085 instance_segmentation_loss_cls: 0.0340 instance_segmentation_loss_reg: 0.3375 instance_segmentation_loss_poly: 0.8699 +2023/11/04 22:19:37 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231104_135211 +2023/11/04 22:19:37 - mmengine - INFO - Iter(train) [396000/640000] base_lr: 6.4918e-05 lr: 7.7198e-06 eta: 3 days, 1:36:13 time: 1.1137 data_time: 0.0361 memory: 21521 grad_norm: 3.2156 loss: 1.2528 caption_loss_cls: 2.1289 grounding_loss_reg: 2.6092 detection_loss_cls: 0.0338 detection_loss_reg: 0.3371 semantic_segmentation_loss_cls: 0.0084 instance_segmentation_loss_cls: 0.0341 instance_segmentation_loss_reg: 0.3389 instance_segmentation_loss_poly: 0.8734 +2023/11/04 22:19:37 - mmengine - INFO - Saving checkpoint at 396000 iterations +2023/11/04 22:28:48 - mmengine - INFO - Iter(train) [396500/640000] base_lr: 6.4692e-05 lr: 7.6992e-06 eta: 3 days, 1:28:14 time: 1.1099 data_time: 0.0356 memory: 21521 grad_norm: 3.2131 loss: 1.2408 caption_loss_cls: 2.1289 grounding_loss_reg: 2.6084 detection_loss_cls: 0.0338 detection_loss_reg: 0.3368 semantic_segmentation_loss_cls: 0.0084 instance_segmentation_loss_cls: 0.0342 instance_segmentation_loss_reg: 0.3379 instance_segmentation_loss_poly: 0.8716 +2023/11/04 22:37:56 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231104_135211 +2023/11/04 22:37:56 - mmengine - INFO - Iter(train) [397000/640000] base_lr: 6.4466e-05 lr: 7.6787e-06 eta: 3 days, 1:19:50 time: 1.1154 data_time: 0.0358 memory: 21521 grad_norm: 3.1802 loss: 1.2354 caption_loss_cls: 2.1292 grounding_loss_reg: 2.6062 detection_loss_cls: 0.0337 detection_loss_reg: 0.3369 semantic_segmentation_loss_cls: 0.0084 instance_segmentation_loss_cls: 0.0343 instance_segmentation_loss_reg: 0.3391 instance_segmentation_loss_poly: 0.8737 +2023/11/04 22:37:56 - mmengine - INFO - Saving checkpoint at 397000 iterations +2023/11/04 22:47:02 - mmengine - INFO - Iter(train) [397500/640000] base_lr: 6.4240e-05 lr: 7.6582e-06 eta: 3 days, 1:11:14 time: 1.1067 data_time: 0.0354 memory: 21521 grad_norm: 3.2344 loss: 1.2446 caption_loss_cls: 2.1299 grounding_loss_reg: 2.6046 detection_loss_cls: 0.0338 detection_loss_reg: 0.3376 semantic_segmentation_loss_cls: 0.0084 instance_segmentation_loss_cls: 0.0343 instance_segmentation_loss_reg: 0.3398 instance_segmentation_loss_poly: 0.8754 +2023/11/04 22:55:25 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231104_135211 +2023/11/04 22:55:25 - mmengine - INFO - Iter(train) [398000/640000] base_lr: 6.4015e-05 lr: 7.6377e-06 eta: 3 days, 0:56:31 time: 1.0880 data_time: 0.0349 memory: 21521 grad_norm: 3.3167 loss: 1.2656 caption_loss_cls: 2.1309 grounding_loss_reg: 2.6059 detection_loss_cls: 0.0338 detection_loss_reg: 0.3382 semantic_segmentation_loss_cls: 0.0084 instance_segmentation_loss_cls: 0.0344 instance_segmentation_loss_reg: 0.3401 instance_segmentation_loss_poly: 0.8761 +2023/11/04 22:55:25 - mmengine - INFO - Saving checkpoint at 398000 iterations +2023/11/04 23:04:37 - mmengine - INFO - Iter(train) [398500/640000] base_lr: 6.3789e-05 lr: 7.6172e-06 eta: 3 days, 0:48:41 time: 1.0874 data_time: 0.0350 memory: 21521 grad_norm: 3.3334 loss: 1.2755 caption_loss_cls: 2.1341 grounding_loss_reg: 2.6038 detection_loss_cls: 0.0338 detection_loss_reg: 0.3381 semantic_segmentation_loss_cls: 0.0084 instance_segmentation_loss_cls: 0.0344 instance_segmentation_loss_reg: 0.3410 instance_segmentation_loss_poly: 0.8774 +2023/11/04 23:13:24 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231104_135211 +2023/11/04 23:13:24 - mmengine - INFO - Iter(train) [399000/640000] base_lr: 6.3564e-05 lr: 7.5967e-06 eta: 3 days, 0:37:31 time: 1.0767 data_time: 0.0348 memory: 21521 grad_norm: 3.3994 loss: 1.2930 caption_loss_cls: 2.1361 grounding_loss_reg: 2.6018 detection_loss_cls: 0.0338 detection_loss_reg: 0.3393 semantic_segmentation_loss_cls: 0.0084 instance_segmentation_loss_cls: 0.0345 instance_segmentation_loss_reg: 0.3412 instance_segmentation_loss_poly: 0.8779 +2023/11/04 23:13:24 - mmengine - INFO - Saving checkpoint at 399000 iterations +2023/11/04 23:22:40 - mmengine - INFO - Iter(train) [399500/640000] base_lr: 6.3339e-05 lr: 7.5763e-06 eta: 3 days, 0:30:08 time: 1.0796 data_time: 0.0349 memory: 21521 grad_norm: 3.4297 loss: 1.2995 caption_loss_cls: 2.1336 grounding_loss_reg: 2.6021 detection_loss_cls: 0.0338 detection_loss_reg: 0.3397 semantic_segmentation_loss_cls: 0.0084 instance_segmentation_loss_cls: 0.0345 instance_segmentation_loss_reg: 0.3415 instance_segmentation_loss_poly: 0.8782 +2023/11/04 23:31:54 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231104_135211 +2023/11/04 23:31:54 - mmengine - INFO - Iter(train) [400000/640000] base_lr: 6.3115e-05 lr: 7.5559e-06 eta: 3 days, 0:22:38 time: 1.0837 data_time: 0.0352 memory: 21521 grad_norm: 3.3997 loss: 1.3026 caption_loss_cls: 2.1389 grounding_loss_reg: 2.6011 detection_loss_cls: 0.0338 detection_loss_reg: 0.3397 semantic_segmentation_loss_cls: 0.0084 instance_segmentation_loss_cls: 0.0345 instance_segmentation_loss_reg: 0.3415 instance_segmentation_loss_poly: 0.8799 +2023/11/04 23:31:54 - mmengine - INFO - Saving checkpoint at 400000 iterations +2023/11/04 23:40:35 - mmengine - INFO - Evaluating bbox... +2023/11/04 23:41:32 - mmengine - INFO - bbox_mAP_copypaste: 0.448 0.619 0.487 0.274 0.497 0.598 +2023/11/04 23:41:32 - mmengine - INFO - Evaluating segm... +2023/11/04 23:42:44 - mmengine - INFO - segm_mAP_copypaste: 0.300 0.539 0.294 0.145 0.343 0.468 +2023/11/04 23:48:33 - mmengine - INFO - per class results: +2023/11/04 23:48:33 - mmengine - INFO - ++---------------------+-------+-------+ +| Class | IoU | Acc | ++---------------------+-------+-------+ +| wall | 75.55 | 87.46 | +| building | 80.08 | 89.14 | +| sky | 92.87 | 97.87 | +| floor | 79.81 | 89.28 | +| tree | 73.02 | 86.45 | +| ceiling | 82.63 | 93.64 | +| road | 82.13 | 89.78 | +| bed | 85.64 | 93.34 | +| windowpane | 60.09 | 77.89 | +| grass | 66.93 | 86.85 | +| cabinet | 57.37 | 68.01 | +| sidewalk | 64.6 | 77.46 | +| person | 78.14 | 91.15 | +| earth | 38.81 | 52.48 | +| door | 49.21 | 63.49 | +| table | 59.54 | 73.87 | +| mountain | 59.23 | 77.49 | +| plant | 50.64 | 58.19 | +| curtain | 70.22 | 83.19 | +| chair | 54.49 | 65.82 | +| car | 81.69 | 91.29 | +| water | 50.72 | 62.17 | +| painting | 68.42 | 86.49 | +| sofa | 62.41 | 76.4 | +| shelf | 40.76 | 56.41 | +| house | 40.97 | 62.49 | +| sea | 51.48 | 73.65 | +| mirror | 64.36 | 77.75 | +| rug | 63.47 | 72.41 | +| field | 27.41 | 37.6 | +| armchair | 39.51 | 62.14 | +| seat | 61.55 | 80.8 | +| fence | 40.43 | 62.47 | +| desk | 46.31 | 63.54 | +| rock | 34.46 | 55.78 | +| wardrobe | 44.35 | 61.57 | +| lamp | 59.04 | 73.36 | +| bathtub | 77.63 | 85.14 | +| railing | 30.01 | 44.67 | +| cushion | 55.63 | 71.43 | +| base | 21.82 | 29.56 | +| box | 20.79 | 26.41 | +| column | 46.82 | 66.01 | +| signboard | 36.09 | 46.82 | +| chest of drawers | 32.66 | 69.49 | +| counter | 26.03 | 29.97 | +| sand | 37.28 | 46.23 | +| sink | 70.9 | 77.8 | +| skyscraper | 52.33 | 65.18 | +| fireplace | 63.33 | 90.88 | +| refrigerator | 70.89 | 77.92 | +| grandstand | 33.14 | 66.62 | +| path | 29.55 | 41.12 | +| stairs | 25.63 | 32.67 | +| runway | 68.24 | 80.61 | +| case | 44.99 | 58.94 | +| pool table | 88.65 | 95.86 | +| pillow | 55.14 | 77.13 | +| screen door | 61.02 | 62.37 | +| stairway | 28.6 | 39.0 | +| river | 16.25 | 35.62 | +| bridge | 68.92 | 77.75 | +| bookcase | 35.54 | 54.51 | +| blind | 37.28 | 41.8 | +| coffee table | 63.0 | 76.68 | +| toilet | 82.97 | 89.13 | +| flower | 32.26 | 44.72 | +| book | 44.17 | 63.26 | +| hill | 9.81 | 16.81 | +| bench | 50.07 | 58.47 | +| countertop | 53.31 | 64.09 | +| stove | 70.82 | 85.61 | +| palm | 43.19 | 56.6 | +| kitchen island | 33.7 | 60.55 | +| computer | 67.67 | 79.64 | +| swivel chair | 43.58 | 57.53 | +| boat | 63.94 | 81.98 | +| bar | 33.1 | 42.97 | +| arcade machine | 46.85 | 51.36 | +| hovel | 14.98 | 17.53 | +| bus | 77.65 | 94.61 | +| towel | 62.37 | 74.55 | +| light | 44.19 | 50.24 | +| truck | 38.85 | 46.65 | +| tower | 34.84 | 52.34 | +| chandelier | 63.66 | 79.62 | +| awning | 28.67 | 37.61 | +| streetlight | 26.0 | 35.4 | +| booth | 49.99 | 60.94 | +| television receiver | 69.19 | 85.21 | +| airplane | 55.35 | 67.13 | +| dirt track | 5.19 | 15.68 | +| apparel | 31.89 | 51.6 | +| pole | 27.43 | 40.26 | +| land | 0.97 | 1.31 | +| bannister | 14.25 | 19.36 | +| escalator | 27.39 | 29.54 | +| ottoman | 37.54 | 68.64 | +| bottle | 30.02 | 34.8 | +| buffet | 42.55 | 51.77 | +| poster | 26.81 | 36.32 | +| stage | 13.08 | 18.98 | +| van | 37.65 | 53.58 | +| ship | 68.19 | 93.57 | +| fountain | 14.19 | 15.45 | +| conveyer belt | 79.15 | 89.24 | +| canopy | 29.87 | 42.96 | +| washer | 60.37 | 62.68 | +| plaything | 30.43 | 48.22 | +| swimming pool | 44.35 | 60.3 | +| stool | 39.84 | 56.0 | +| barrel | 29.89 | 53.03 | +| basket | 25.66 | 39.27 | +| waterfall | 47.6 | 62.09 | +| tent | 90.24 | 97.77 | +| bag | 12.15 | 13.28 | +| minibike | 71.72 | 81.23 | +| cradle | 78.15 | 95.41 | +| oven | 41.68 | 54.38 | +| ball | 38.41 | 41.37 | +| food | 55.02 | 65.21 | +| step | 14.42 | 18.68 | +| tank | 38.77 | 48.73 | +| trade name | 29.47 | 39.64 | +| microwave | 80.08 | 88.06 | +| pot | 44.25 | 50.61 | +| animal | 64.81 | 69.61 | +| bicycle | 54.15 | 71.58 | +| lake | 37.7 | 69.63 | +| dishwasher | 53.68 | 74.14 | +| screen | 69.33 | 84.84 | +| blanket | 11.97 | 14.74 | +| sculpture | 44.43 | 52.53 | +| hood | 57.59 | 66.26 | +| sconce | 31.36 | 42.26 | +| vase | 40.15 | 54.44 | +| traffic light | 32.74 | 50.38 | +| tray | 7.31 | 9.61 | +| ashcan | 41.31 | 53.25 | +| fan | 49.52 | 59.13 | +| pier | 43.98 | 81.63 | +| crt screen | 7.53 | 20.09 | +| plate | 54.73 | 67.22 | +| monitor | 9.47 | 11.46 | +| bulletin board | 32.83 | 65.97 | +| shower | 1.48 | 3.64 | +| radiator | 45.22 | 49.14 | +| glass | 14.48 | 15.48 | +| clock | 28.64 | 36.54 | +| flag | 31.7 | 36.98 | ++---------------------+-------+-------+ +2023/11/04 23:48:49 - mmengine - INFO - Iter(val) [209/209] coco/bbox_mAP: 0.4480 coco/bbox_mAP_50: 0.6190 coco/bbox_mAP_75: 0.4870 coco/bbox_mAP_s: 0.2740 coco/bbox_mAP_m: 0.4970 coco/bbox_mAP_l: 0.5980 coco/segm_mAP: 0.3000 coco/segm_mAP_50: 0.5390 coco/segm_mAP_75: 0.2940 coco/segm_mAP_s: 0.1450 coco/segm_mAP_m: 0.3430 coco/segm_mAP_l: 0.4680 Bleu_1: 0.7369 Bleu_2: 0.5664 Bleu_3: 0.4228 Bleu_4: 0.3140 METEOR: 0.2557 ROUGE_L: 0.5377 CIDEr: 1.0105 SPICE: 0.1873 aAcc: 81.7500 mIoU: 46.6800 mAcc: 59.2100 visual-grounding/miou: 0.7716 visual-grounding/acc: 0.8457 data_time: 0.0046 time: 0.5218 +2023/11/04 23:57:41 - mmengine - INFO - Iter(train) [400500/640000] base_lr: 6.2890e-05 lr: 7.5355e-06 eta: 3 days, 0:12:25 time: 1.0795 data_time: 0.0322 memory: 21521 grad_norm: 3.3612 loss: 1.2914 caption_loss_cls: 2.1359 grounding_loss_reg: 2.5996 detection_loss_cls: 0.0338 detection_loss_reg: 0.3400 semantic_segmentation_loss_cls: 0.0084 instance_segmentation_loss_cls: 0.0344 instance_segmentation_loss_reg: 0.3405 instance_segmentation_loss_poly: 0.8774 +2023/11/05 00:06:52 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231104_135211 +2023/11/05 00:06:52 - mmengine - INFO - Iter(train) [401000/640000] base_lr: 6.2666e-05 lr: 7.5151e-06 eta: 3 days, 0:04:23 time: 1.0803 data_time: 0.0324 memory: 21521 grad_norm: 3.3885 loss: 1.2887 caption_loss_cls: 2.1356 grounding_loss_reg: 2.5995 detection_loss_cls: 0.0337 detection_loss_reg: 0.3387 semantic_segmentation_loss_cls: 0.0084 instance_segmentation_loss_cls: 0.0343 instance_segmentation_loss_reg: 0.3396 instance_segmentation_loss_poly: 0.8754 +2023/11/05 00:06:52 - mmengine - INFO - Saving checkpoint at 401000 iterations +2023/11/05 00:16:26 - mmengine - INFO - Iter(train) [401500/640000] base_lr: 6.2442e-05 lr: 7.4948e-06 eta: 2 days, 23:59:04 time: 1.0870 data_time: 0.0328 memory: 21521 grad_norm: 3.3644 loss: 1.2847 caption_loss_cls: 2.1364 grounding_loss_reg: 2.6006 detection_loss_cls: 0.0335 detection_loss_reg: 0.3368 semantic_segmentation_loss_cls: 0.0083 instance_segmentation_loss_cls: 0.0342 instance_segmentation_loss_reg: 0.3386 instance_segmentation_loss_poly: 0.8727 +2023/11/05 00:25:18 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231104_135211 +2023/11/05 00:25:18 - mmengine - INFO - Iter(train) [402000/640000] base_lr: 6.2219e-05 lr: 7.4744e-06 eta: 2 days, 23:48:37 time: 1.0943 data_time: 0.0330 memory: 21521 grad_norm: 3.3353 loss: 1.2664 caption_loss_cls: 2.1350 grounding_loss_reg: 2.5992 detection_loss_cls: 0.0334 detection_loss_reg: 0.3366 semantic_segmentation_loss_cls: 0.0084 instance_segmentation_loss_cls: 0.0341 instance_segmentation_loss_reg: 0.3383 instance_segmentation_loss_poly: 0.8721 +2023/11/05 00:25:18 - mmengine - INFO - Saving checkpoint at 402000 iterations +2023/11/05 00:34:09 - mmengine - INFO - Iter(train) [402500/640000] base_lr: 6.1995e-05 lr: 7.4541e-06 eta: 2 days, 23:38:11 time: 1.0893 data_time: 0.0328 memory: 21521 grad_norm: 3.3542 loss: 1.2626 caption_loss_cls: 2.1361 grounding_loss_reg: 2.5992 detection_loss_cls: 0.0335 detection_loss_reg: 0.3368 semantic_segmentation_loss_cls: 0.0084 instance_segmentation_loss_cls: 0.0341 instance_segmentation_loss_reg: 0.3384 instance_segmentation_loss_poly: 0.8726 +2023/11/05 00:43:13 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231104_135211 +2023/11/05 00:43:13 - mmengine - INFO - Iter(train) [403000/640000] base_lr: 6.1772e-05 lr: 7.4338e-06 eta: 2 days, 23:29:13 time: 1.0935 data_time: 0.0331 memory: 21521 grad_norm: 3.3345 loss: 1.2544 caption_loss_cls: 2.1368 grounding_loss_reg: 2.5993 detection_loss_cls: 0.0333 detection_loss_reg: 0.3359 semantic_segmentation_loss_cls: 0.0083 instance_segmentation_loss_cls: 0.0340 instance_segmentation_loss_reg: 0.3378 instance_segmentation_loss_poly: 0.8716 +2023/11/05 00:43:13 - mmengine - INFO - Saving checkpoint at 403000 iterations +2023/11/05 00:52:34 - mmengine - INFO - Iter(train) [403500/640000] base_lr: 6.1549e-05 lr: 7.4135e-06 eta: 2 days, 23:22:09 time: 1.0948 data_time: 0.0335 memory: 21521 grad_norm: 3.3432 loss: 1.2598 caption_loss_cls: 2.1372 grounding_loss_reg: 2.5989 detection_loss_cls: 0.0333 detection_loss_reg: 0.3355 semantic_segmentation_loss_cls: 0.0083 instance_segmentation_loss_cls: 0.0340 instance_segmentation_loss_reg: 0.3385 instance_segmentation_loss_poly: 0.8732 +2023/11/05 01:01:29 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231104_135211 +2023/11/05 01:01:29 - mmengine - INFO - Iter(train) [404000/640000] base_lr: 6.1326e-05 lr: 7.3933e-06 eta: 2 days, 23:12:07 time: 1.0898 data_time: 0.0333 memory: 21521 grad_norm: 3.3405 loss: 1.2543 caption_loss_cls: 2.1393 grounding_loss_reg: 2.5950 detection_loss_cls: 0.0333 detection_loss_reg: 0.3358 semantic_segmentation_loss_cls: 0.0083 instance_segmentation_loss_cls: 0.0340 instance_segmentation_loss_reg: 0.3385 instance_segmentation_loss_poly: 0.8726 +2023/11/05 01:01:29 - mmengine - INFO - Saving checkpoint at 404000 iterations +2023/11/05 01:10:26 - mmengine - INFO - Iter(train) [404500/640000] base_lr: 6.1104e-05 lr: 7.3731e-06 eta: 2 days, 23:02:21 time: 1.0906 data_time: 0.0364 memory: 21521 grad_norm: 3.3867 loss: 1.2638 caption_loss_cls: 2.1412 grounding_loss_reg: 2.5934 detection_loss_cls: 0.0333 detection_loss_reg: 0.3364 semantic_segmentation_loss_cls: 0.0084 instance_segmentation_loss_cls: 0.0339 instance_segmentation_loss_reg: 0.3386 instance_segmentation_loss_poly: 0.8719 +2023/11/05 01:19:23 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231104_135211 +2023/11/05 01:19:23 - mmengine - INFO - Iter(train) [405000/640000] base_lr: 6.0882e-05 lr: 7.3529e-06 eta: 2 days, 22:52:40 time: 1.0871 data_time: 0.0361 memory: 21521 grad_norm: 3.3719 loss: 1.2597 caption_loss_cls: 2.1387 grounding_loss_reg: 2.5941 detection_loss_cls: 0.0333 detection_loss_reg: 0.3364 semantic_segmentation_loss_cls: 0.0083 instance_segmentation_loss_cls: 0.0340 instance_segmentation_loss_reg: 0.3386 instance_segmentation_loss_poly: 0.8719 +2023/11/05 01:19:23 - mmengine - INFO - Saving checkpoint at 405000 iterations +2023/11/05 01:28:51 - mmengine - INFO - Iter(train) [405500/640000] base_lr: 6.0660e-05 lr: 7.3327e-06 eta: 2 days, 22:46:15 time: 1.0857 data_time: 0.0362 memory: 21521 grad_norm: 3.4083 loss: 1.2655 caption_loss_cls: 2.1352 grounding_loss_reg: 2.5918 detection_loss_cls: 0.0333 detection_loss_reg: 0.3361 semantic_segmentation_loss_cls: 0.0083 instance_segmentation_loss_cls: 0.0338 instance_segmentation_loss_reg: 0.3377 instance_segmentation_loss_poly: 0.8697 +2023/11/05 01:38:10 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231104_135211 +2023/11/05 01:38:10 - mmengine - INFO - Iter(train) [406000/640000] base_lr: 6.0438e-05 lr: 7.3125e-06 eta: 2 days, 22:38:50 time: 1.0925 data_time: 0.0365 memory: 21521 grad_norm: 3.4175 loss: 1.2672 caption_loss_cls: 2.1340 grounding_loss_reg: 2.5893 detection_loss_cls: 0.0331 detection_loss_reg: 0.3348 semantic_segmentation_loss_cls: 0.0083 instance_segmentation_loss_cls: 0.0337 instance_segmentation_loss_reg: 0.3366 instance_segmentation_loss_poly: 0.8680 +2023/11/05 01:38:10 - mmengine - INFO - Saving checkpoint at 406000 iterations +2023/11/05 01:46:43 - mmengine - INFO - Iter(train) [406500/640000] base_lr: 6.0216e-05 lr: 7.2924e-06 eta: 2 days, 22:26:29 time: 1.0875 data_time: 0.0363 memory: 21521 grad_norm: 3.4308 loss: 1.2699 caption_loss_cls: 2.1361 grounding_loss_reg: 2.5865 detection_loss_cls: 0.0331 detection_loss_reg: 0.3355 semantic_segmentation_loss_cls: 0.0083 instance_segmentation_loss_cls: 0.0336 instance_segmentation_loss_reg: 0.3364 instance_segmentation_loss_poly: 0.8675 +2023/11/05 01:56:07 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231104_135211 +2023/11/05 01:56:07 - mmengine - INFO - Iter(train) [407000/640000] base_lr: 5.9995e-05 lr: 7.2723e-06 eta: 2 days, 22:19:35 time: 1.0926 data_time: 0.0365 memory: 21521 grad_norm: 3.4064 loss: 1.2671 caption_loss_cls: 2.1312 grounding_loss_reg: 2.5865 detection_loss_cls: 0.0331 detection_loss_reg: 0.3347 semantic_segmentation_loss_cls: 0.0083 instance_segmentation_loss_cls: 0.0335 instance_segmentation_loss_reg: 0.3363 instance_segmentation_loss_poly: 0.8673 +2023/11/05 01:56:07 - mmengine - INFO - Saving checkpoint at 407000 iterations +2023/11/05 02:05:51 - mmengine - INFO - Iter(train) [407500/640000] base_lr: 5.9774e-05 lr: 7.2522e-06 eta: 2 days, 22:14:39 time: 1.0986 data_time: 0.0365 memory: 21521 grad_norm: 3.3812 loss: 1.2602 caption_loss_cls: 2.1305 grounding_loss_reg: 2.5891 detection_loss_cls: 0.0330 detection_loss_reg: 0.3344 semantic_segmentation_loss_cls: 0.0083 instance_segmentation_loss_cls: 0.0334 instance_segmentation_loss_reg: 0.3358 instance_segmentation_loss_poly: 0.8652 +2023/11/05 02:14:38 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231104_135211 +2023/11/05 02:14:38 - mmengine - INFO - Iter(train) [408000/640000] base_lr: 5.9553e-05 lr: 7.2321e-06 eta: 2 days, 22:03:50 time: 1.0965 data_time: 0.0365 memory: 21521 grad_norm: 3.4076 loss: 1.2640 caption_loss_cls: 2.1299 grounding_loss_reg: 2.5918 detection_loss_cls: 0.0330 detection_loss_reg: 0.3345 semantic_segmentation_loss_cls: 0.0083 instance_segmentation_loss_cls: 0.0335 instance_segmentation_loss_reg: 0.3363 instance_segmentation_loss_poly: 0.8659 +2023/11/05 02:14:38 - mmengine - INFO - Saving checkpoint at 408000 iterations +2023/11/05 02:23:42 - mmengine - INFO - Iter(train) [408500/640000] base_lr: 5.9333e-05 lr: 7.2121e-06 eta: 2 days, 21:54:47 time: 1.0983 data_time: 0.0367 memory: 21521 grad_norm: 3.4080 loss: 1.2727 caption_loss_cls: 2.1282 grounding_loss_reg: 2.5926 detection_loss_cls: 0.0330 detection_loss_reg: 0.3355 semantic_segmentation_loss_cls: 0.0083 instance_segmentation_loss_cls: 0.0335 instance_segmentation_loss_reg: 0.3369 instance_segmentation_loss_poly: 0.8670 +2023/11/05 02:32:36 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231104_135211 +2023/11/05 02:32:36 - mmengine - INFO - Iter(train) [409000/640000] base_lr: 5.9112e-05 lr: 7.1920e-06 eta: 2 days, 21:44:44 time: 1.0974 data_time: 0.0367 memory: 21521 grad_norm: 3.4291 loss: 1.2791 caption_loss_cls: 2.1278 grounding_loss_reg: 2.5923 detection_loss_cls: 0.0330 detection_loss_reg: 0.3351 semantic_segmentation_loss_cls: 0.0083 instance_segmentation_loss_cls: 0.0335 instance_segmentation_loss_reg: 0.3355 instance_segmentation_loss_poly: 0.8643 +2023/11/05 02:32:36 - mmengine - INFO - Saving checkpoint at 409000 iterations +2023/11/05 02:41:14 - mmengine - INFO - Iter(train) [409500/640000] base_lr: 5.8892e-05 lr: 7.1720e-06 eta: 2 days, 21:33:12 time: 1.0848 data_time: 0.0363 memory: 21521 grad_norm: 3.4327 loss: 1.2783 caption_loss_cls: 2.1266 grounding_loss_reg: 2.5916 detection_loss_cls: 0.0331 detection_loss_reg: 0.3358 semantic_segmentation_loss_cls: 0.0083 instance_segmentation_loss_cls: 0.0335 instance_segmentation_loss_reg: 0.3361 instance_segmentation_loss_poly: 0.8658 +2023/11/05 02:50:07 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231104_135211 +2023/11/05 02:50:07 - mmengine - INFO - Iter(train) [410000/640000] base_lr: 5.8672e-05 lr: 7.1520e-06 eta: 2 days, 21:23:12 time: 1.0784 data_time: 0.0362 memory: 21521 grad_norm: 3.3993 loss: 1.2848 caption_loss_cls: 2.1248 grounding_loss_reg: 2.5942 detection_loss_cls: 0.0329 detection_loss_reg: 0.3344 semantic_segmentation_loss_cls: 0.0083 instance_segmentation_loss_cls: 0.0335 instance_segmentation_loss_reg: 0.3360 instance_segmentation_loss_poly: 0.8652 +2023/11/05 02:50:07 - mmengine - INFO - Saving checkpoint at 410000 iterations +2023/11/05 02:58:57 - mmengine - INFO - Iter(train) [410500/640000] base_lr: 5.8453e-05 lr: 7.1321e-06 eta: 2 days, 21:12:58 time: 1.0830 data_time: 0.0362 memory: 21521 grad_norm: 3.3719 loss: 1.2725 caption_loss_cls: 2.1262 grounding_loss_reg: 2.5932 detection_loss_cls: 0.0330 detection_loss_reg: 0.3354 semantic_segmentation_loss_cls: 0.0083 instance_segmentation_loss_cls: 0.0336 instance_segmentation_loss_reg: 0.3360 instance_segmentation_loss_poly: 0.8653 +2023/11/05 03:07:41 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231104_135211 +2023/11/05 03:07:41 - mmengine - INFO - Iter(train) [411000/640000] base_lr: 5.8234e-05 lr: 7.1122e-06 eta: 2 days, 21:02:08 time: 1.0728 data_time: 0.0357 memory: 21521 grad_norm: 3.4159 loss: 1.2784 caption_loss_cls: 2.1252 grounding_loss_reg: 2.5917 detection_loss_cls: 0.0330 detection_loss_reg: 0.3359 semantic_segmentation_loss_cls: 0.0084 instance_segmentation_loss_cls: 0.0335 instance_segmentation_loss_reg: 0.3350 instance_segmentation_loss_poly: 0.8630 +2023/11/05 03:07:41 - mmengine - INFO - Saving checkpoint at 411000 iterations +2023/11/05 03:16:40 - mmengine - INFO - Iter(train) [411500/640000] base_lr: 5.8015e-05 lr: 7.0922e-06 eta: 2 days, 20:52:44 time: 1.0614 data_time: 0.0356 memory: 21521 grad_norm: 3.4854 loss: 1.2954 caption_loss_cls: 2.1230 grounding_loss_reg: 2.5925 detection_loss_cls: 0.0330 detection_loss_reg: 0.3354 semantic_segmentation_loss_cls: 0.0083 instance_segmentation_loss_cls: 0.0335 instance_segmentation_loss_reg: 0.3361 instance_segmentation_loss_poly: 0.8653 +2023/11/05 03:26:03 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231104_135211 +2023/11/05 03:26:03 - mmengine - INFO - Iter(train) [412000/640000] base_lr: 5.7796e-05 lr: 7.0724e-06 eta: 2 days, 20:45:25 time: 1.0704 data_time: 0.0358 memory: 21521 grad_norm: 3.4579 loss: 1.2883 caption_loss_cls: 2.1222 grounding_loss_reg: 2.5929 detection_loss_cls: 0.0330 detection_loss_reg: 0.3362 semantic_segmentation_loss_cls: 0.0083 instance_segmentation_loss_cls: 0.0335 instance_segmentation_loss_reg: 0.3360 instance_segmentation_loss_poly: 0.8644 +2023/11/05 03:26:03 - mmengine - INFO - Saving checkpoint at 412000 iterations +2023/11/05 03:35:11 - mmengine - INFO - Iter(train) [412500/640000] base_lr: 5.7577e-05 lr: 7.0525e-06 eta: 2 days, 20:36:48 time: 1.0714 data_time: 0.0360 memory: 21521 grad_norm: 3.4737 loss: 1.2979 caption_loss_cls: 2.1234 grounding_loss_reg: 2.5937 detection_loss_cls: 0.0331 detection_loss_reg: 0.3369 semantic_segmentation_loss_cls: 0.0083 instance_segmentation_loss_cls: 0.0337 instance_segmentation_loss_reg: 0.3370 instance_segmentation_loss_poly: 0.8665 +2023/11/05 03:44:07 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231104_135211 +2023/11/05 03:44:07 - mmengine - INFO - Iter(train) [413000/640000] base_lr: 5.7359e-05 lr: 7.0327e-06 eta: 2 days, 20:27:08 time: 1.0720 data_time: 0.0361 memory: 21521 grad_norm: 3.4615 loss: 1.2967 caption_loss_cls: 2.1240 grounding_loss_reg: 2.5881 detection_loss_cls: 0.0331 detection_loss_reg: 0.3367 semantic_segmentation_loss_cls: 0.0083 instance_segmentation_loss_cls: 0.0337 instance_segmentation_loss_reg: 0.3374 instance_segmentation_loss_poly: 0.8665 +2023/11/05 03:44:07 - mmengine - INFO - Saving checkpoint at 413000 iterations +2023/11/05 03:53:27 - mmengine - INFO - Iter(train) [413500/640000] base_lr: 5.7141e-05 lr: 7.0128e-06 eta: 2 days, 20:19:30 time: 1.0825 data_time: 0.0363 memory: 21521 grad_norm: 3.4545 loss: 1.2941 caption_loss_cls: 2.1222 grounding_loss_reg: 2.5891 detection_loss_cls: 0.0332 detection_loss_reg: 0.3379 semantic_segmentation_loss_cls: 0.0083 instance_segmentation_loss_cls: 0.0337 instance_segmentation_loss_reg: 0.3376 instance_segmentation_loss_poly: 0.8656 +2023/11/05 04:02:24 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231104_135211 +2023/11/05 04:02:24 - mmengine - INFO - Iter(train) [414000/640000] base_lr: 5.6924e-05 lr: 6.9930e-06 eta: 2 days, 20:09:58 time: 1.0836 data_time: 0.0364 memory: 21521 grad_norm: 3.4910 loss: 1.3003 caption_loss_cls: 2.1243 grounding_loss_reg: 2.5875 detection_loss_cls: 0.0330 detection_loss_reg: 0.3366 semantic_segmentation_loss_cls: 0.0083 instance_segmentation_loss_cls: 0.0338 instance_segmentation_loss_reg: 0.3375 instance_segmentation_loss_poly: 0.8649 +2023/11/05 04:02:24 - mmengine - INFO - Saving checkpoint at 414000 iterations +2023/11/05 04:11:48 - mmengine - INFO - Iter(train) [414500/640000] base_lr: 5.6706e-05 lr: 6.9733e-06 eta: 2 days, 20:02:36 time: 1.0919 data_time: 0.0370 memory: 21521 grad_norm: 3.4418 loss: 1.3002 caption_loss_cls: 2.1246 grounding_loss_reg: 2.5875 detection_loss_cls: 0.0331 detection_loss_reg: 0.3367 semantic_segmentation_loss_cls: 0.0083 instance_segmentation_loss_cls: 0.0338 instance_segmentation_loss_reg: 0.3384 instance_segmentation_loss_poly: 0.8657 +2023/11/05 04:21:23 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231104_135211 +2023/11/05 04:21:23 - mmengine - INFO - Iter(train) [415000/640000] base_lr: 5.6489e-05 lr: 6.9535e-06 eta: 2 days, 19:56:06 time: 1.1046 data_time: 0.0376 memory: 21521 grad_norm: 3.4022 loss: 1.2999 caption_loss_cls: 2.1262 grounding_loss_reg: 2.5912 detection_loss_cls: 0.0331 detection_loss_reg: 0.3370 semantic_segmentation_loss_cls: 0.0083 instance_segmentation_loss_cls: 0.0339 instance_segmentation_loss_reg: 0.3398 instance_segmentation_loss_poly: 0.8678 +2023/11/05 04:21:23 - mmengine - INFO - Saving checkpoint at 415000 iterations +2023/11/05 04:30:41 - mmengine - INFO - Iter(train) [415500/640000] base_lr: 5.6272e-05 lr: 6.9338e-06 eta: 2 days, 19:48:14 time: 1.1095 data_time: 0.0376 memory: 21521 grad_norm: 3.3701 loss: 1.2880 caption_loss_cls: 2.1263 grounding_loss_reg: 2.5925 detection_loss_cls: 0.0332 detection_loss_reg: 0.3381 semantic_segmentation_loss_cls: 0.0083 instance_segmentation_loss_cls: 0.0340 instance_segmentation_loss_reg: 0.3404 instance_segmentation_loss_poly: 0.8687 +2023/11/05 04:40:12 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231104_135211 +2023/11/05 04:40:12 - mmengine - INFO - Iter(train) [416000/640000] base_lr: 5.6055e-05 lr: 6.9141e-06 eta: 2 days, 19:41:16 time: 1.1115 data_time: 0.0375 memory: 21521 grad_norm: 3.3040 loss: 1.2785 caption_loss_cls: 2.1311 grounding_loss_reg: 2.5931 detection_loss_cls: 0.0332 detection_loss_reg: 0.3380 semantic_segmentation_loss_cls: 0.0083 instance_segmentation_loss_cls: 0.0339 instance_segmentation_loss_reg: 0.3396 instance_segmentation_loss_poly: 0.8664 +2023/11/05 04:40:12 - mmengine - INFO - Saving checkpoint at 416000 iterations +2023/11/05 04:49:26 - mmengine - INFO - Iter(train) [416500/640000] base_lr: 5.5839e-05 lr: 6.8945e-06 eta: 2 days, 19:32:58 time: 1.1130 data_time: 0.0376 memory: 21521 grad_norm: 3.2922 loss: 1.2755 caption_loss_cls: 2.1323 grounding_loss_reg: 2.5922 detection_loss_cls: 0.0332 detection_loss_reg: 0.3390 semantic_segmentation_loss_cls: 0.0083 instance_segmentation_loss_cls: 0.0339 instance_segmentation_loss_reg: 0.3391 instance_segmentation_loss_poly: 0.8645 +2023/11/05 04:58:41 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231104_135211 +2023/11/05 04:58:41 - mmengine - INFO - Iter(train) [417000/640000] base_lr: 5.5623e-05 lr: 6.8748e-06 eta: 2 days, 19:24:46 time: 1.1179 data_time: 0.0378 memory: 21521 grad_norm: 3.2828 loss: 1.2735 caption_loss_cls: 2.1357 grounding_loss_reg: 2.5929 detection_loss_cls: 0.0331 detection_loss_reg: 0.3379 semantic_segmentation_loss_cls: 0.0083 instance_segmentation_loss_cls: 0.0339 instance_segmentation_loss_reg: 0.3389 instance_segmentation_loss_poly: 0.8635 +2023/11/05 04:58:41 - mmengine - INFO - Saving checkpoint at 417000 iterations +2023/11/05 05:07:59 - mmengine - INFO - Iter(train) [417500/640000] base_lr: 5.5407e-05 lr: 6.8552e-06 eta: 2 days, 19:16:44 time: 1.1174 data_time: 0.0377 memory: 21521 grad_norm: 3.2868 loss: 1.2776 caption_loss_cls: 2.1372 grounding_loss_reg: 2.5936 detection_loss_cls: 0.0332 detection_loss_reg: 0.3382 semantic_segmentation_loss_cls: 0.0083 instance_segmentation_loss_cls: 0.0338 instance_segmentation_loss_reg: 0.3378 instance_segmentation_loss_poly: 0.8606 +2023/11/05 05:17:14 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231104_135211 +2023/11/05 05:17:14 - mmengine - INFO - Iter(train) [418000/640000] base_lr: 5.5192e-05 lr: 6.8356e-06 eta: 2 days, 19:08:24 time: 1.1216 data_time: 0.0376 memory: 21521 grad_norm: 3.2414 loss: 1.2555 caption_loss_cls: 2.1374 grounding_loss_reg: 2.5916 detection_loss_cls: 0.0330 detection_loss_reg: 0.3364 semantic_segmentation_loss_cls: 0.0083 instance_segmentation_loss_cls: 0.0337 instance_segmentation_loss_reg: 0.3366 instance_segmentation_loss_poly: 0.8587 +2023/11/05 05:17:14 - mmengine - INFO - Saving checkpoint at 418000 iterations +2023/11/05 05:26:26 - mmengine - INFO - Iter(train) [418500/640000] base_lr: 5.4976e-05 lr: 6.8160e-06 eta: 2 days, 18:59:51 time: 1.1187 data_time: 0.0372 memory: 21521 grad_norm: 3.2663 loss: 1.2498 caption_loss_cls: 2.1334 grounding_loss_reg: 2.5893 detection_loss_cls: 0.0329 detection_loss_reg: 0.3355 semantic_segmentation_loss_cls: 0.0083 instance_segmentation_loss_cls: 0.0337 instance_segmentation_loss_reg: 0.3363 instance_segmentation_loss_poly: 0.8576 +2023/11/05 05:35:38 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231104_135211 +2023/11/05 05:35:38 - mmengine - INFO - Iter(train) [419000/640000] base_lr: 5.4761e-05 lr: 6.7965e-06 eta: 2 days, 18:51:18 time: 1.1130 data_time: 0.0369 memory: 21521 grad_norm: 3.3076 loss: 1.2507 caption_loss_cls: 2.1299 grounding_loss_reg: 2.5896 detection_loss_cls: 0.0330 detection_loss_reg: 0.3352 semantic_segmentation_loss_cls: 0.0083 instance_segmentation_loss_cls: 0.0336 instance_segmentation_loss_reg: 0.3355 instance_segmentation_loss_poly: 0.8566 +2023/11/05 05:35:38 - mmengine - INFO - Saving checkpoint at 419000 iterations +2023/11/05 05:44:42 - mmengine - INFO - Iter(train) [419500/640000] base_lr: 5.4547e-05 lr: 6.7770e-06 eta: 2 days, 18:42:13 time: 1.1095 data_time: 0.0366 memory: 21521 grad_norm: 3.2958 loss: 1.2498 caption_loss_cls: 2.1346 grounding_loss_reg: 2.5899 detection_loss_cls: 0.0328 detection_loss_reg: 0.3347 semantic_segmentation_loss_cls: 0.0083 instance_segmentation_loss_cls: 0.0335 instance_segmentation_loss_reg: 0.3353 instance_segmentation_loss_poly: 0.8555 +2023/11/05 05:53:28 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231104_135211 +2023/11/05 05:53:28 - mmengine - INFO - Iter(train) [420000/640000] base_lr: 5.4332e-05 lr: 6.7575e-06 eta: 2 days, 18:31:45 time: 1.0983 data_time: 0.0364 memory: 21521 grad_norm: 3.3839 loss: 1.2567 caption_loss_cls: 2.1322 grounding_loss_reg: 2.5895 detection_loss_cls: 0.0328 detection_loss_reg: 0.3344 semantic_segmentation_loss_cls: 0.0083 instance_segmentation_loss_cls: 0.0335 instance_segmentation_loss_reg: 0.3350 instance_segmentation_loss_poly: 0.8540 +2023/11/05 05:53:28 - mmengine - INFO - Saving checkpoint at 420000 iterations +2023/11/05 06:02:09 - mmengine - INFO - Evaluating bbox... +2023/11/05 06:03:05 - mmengine - INFO - bbox_mAP_copypaste: 0.445 0.616 0.484 0.271 0.496 0.595 +2023/11/05 06:03:05 - mmengine - INFO - Evaluating segm... +2023/11/05 06:04:17 - mmengine - INFO - segm_mAP_copypaste: 0.297 0.534 0.289 0.142 0.343 0.469 +2023/11/05 06:10:10 - mmengine - INFO - per class results: +2023/11/05 06:10:11 - mmengine - INFO - ++---------------------+-------+-------+ +| Class | IoU | Acc | ++---------------------+-------+-------+ +| wall | 75.66 | 88.42 | +| building | 79.68 | 89.97 | +| sky | 92.69 | 97.7 | +| floor | 80.15 | 89.74 | +| tree | 73.01 | 85.33 | +| ceiling | 83.56 | 92.43 | +| road | 83.19 | 90.26 | +| bed | 86.8 | 94.47 | +| windowpane | 58.81 | 77.97 | +| grass | 65.8 | 89.34 | +| cabinet | 60.84 | 71.23 | +| sidewalk | 65.71 | 77.86 | +| person | 78.82 | 90.72 | +| earth | 37.09 | 50.94 | +| door | 47.67 | 61.63 | +| table | 58.52 | 74.62 | +| mountain | 53.32 | 62.61 | +| plant | 52.63 | 65.63 | +| curtain | 68.32 | 83.02 | +| chair | 55.79 | 73.0 | +| car | 81.11 | 92.79 | +| water | 49.47 | 64.25 | +| painting | 71.34 | 83.19 | +| sofa | 63.51 | 76.56 | +| shelf | 39.3 | 54.57 | +| house | 37.33 | 54.3 | +| sea | 45.56 | 71.68 | +| mirror | 62.71 | 72.79 | +| rug | 63.76 | 71.3 | +| field | 23.8 | 29.53 | +| armchair | 41.63 | 57.92 | +| seat | 66.42 | 78.67 | +| fence | 33.66 | 46.18 | +| desk | 45.83 | 68.86 | +| rock | 39.1 | 61.26 | +| wardrobe | 49.34 | 60.99 | +| lamp | 59.07 | 74.66 | +| bathtub | 69.92 | 78.55 | +| railing | 24.32 | 35.98 | +| cushion | 53.26 | 70.97 | +| base | 23.69 | 31.48 | +| box | 25.35 | 36.74 | +| column | 45.98 | 58.26 | +| signboard | 34.11 | 54.25 | +| chest of drawers | 34.67 | 50.5 | +| counter | 35.01 | 49.97 | +| sand | 35.39 | 50.46 | +| sink | 66.89 | 81.34 | +| skyscraper | 34.8 | 41.33 | +| fireplace | 73.57 | 85.21 | +| refrigerator | 73.49 | 77.96 | +| grandstand | 32.56 | 63.65 | +| path | 30.15 | 43.81 | +| stairs | 26.02 | 33.62 | +| runway | 74.32 | 94.71 | +| case | 38.71 | 58.63 | +| pool table | 89.23 | 95.01 | +| pillow | 48.86 | 57.7 | +| screen door | 64.02 | 68.15 | +| stairway | 32.35 | 39.6 | +| river | 13.03 | 22.68 | +| bridge | 67.37 | 81.33 | +| bookcase | 31.61 | 49.6 | +| blind | 19.39 | 20.73 | +| coffee table | 62.77 | 84.14 | +| toilet | 82.88 | 88.89 | +| flower | 33.1 | 47.39 | +| book | 44.82 | 69.16 | +| hill | 6.93 | 12.36 | +| bench | 42.01 | 46.65 | +| countertop | 50.08 | 69.24 | +| stove | 68.05 | 77.64 | +| palm | 44.57 | 58.44 | +| kitchen island | 35.48 | 84.43 | +| computer | 73.27 | 82.36 | +| swivel chair | 39.61 | 52.73 | +| boat | 70.8 | 86.88 | +| bar | 34.77 | 40.6 | +| arcade machine | 38.26 | 42.69 | +| hovel | 19.85 | 37.41 | +| bus | 83.8 | 95.53 | +| towel | 60.53 | 74.06 | +| light | 43.69 | 50.59 | +| truck | 38.69 | 46.01 | +| tower | 33.34 | 56.61 | +| chandelier | 55.65 | 60.34 | +| awning | 23.94 | 29.31 | +| streetlight | 23.5 | 28.27 | +| booth | 43.4 | 49.57 | +| television receiver | 69.33 | 79.38 | +| airplane | 58.8 | 66.62 | +| dirt track | 8.28 | 15.42 | +| apparel | 34.21 | 49.02 | +| pole | 29.83 | 40.16 | +| land | 0.11 | 0.15 | +| bannister | 10.15 | 13.03 | +| escalator | 29.97 | 37.2 | +| ottoman | 45.07 | 65.8 | +| bottle | 27.64 | 35.65 | +| buffet | 45.23 | 57.93 | +| poster | 24.91 | 38.31 | +| stage | 16.35 | 31.72 | +| van | 18.76 | 22.75 | +| ship | 68.02 | 70.26 | +| fountain | 16.22 | 17.0 | +| conveyer belt | 77.0 | 88.44 | +| canopy | 23.1 | 35.79 | +| washer | 56.26 | 69.98 | +| plaything | 29.79 | 45.12 | +| swimming pool | 49.18 | 62.77 | +| stool | 39.17 | 48.3 | +| barrel | 54.2 | 63.61 | +| basket | 27.27 | 37.0 | +| waterfall | 46.75 | 56.97 | +| tent | 83.78 | 97.63 | +| bag | 17.45 | 21.11 | +| minibike | 71.26 | 81.21 | +| cradle | 70.32 | 85.98 | +| oven | 32.68 | 39.28 | +| ball | 42.8 | 50.04 | +| food | 53.3 | 61.05 | +| step | 13.83 | 18.48 | +| tank | 36.79 | 45.16 | +| trade name | 13.39 | 14.65 | +| microwave | 77.71 | 85.39 | +| pot | 48.75 | 56.11 | +| animal | 62.5 | 65.01 | +| bicycle | 54.61 | 74.0 | +| lake | 37.75 | 41.71 | +| dishwasher | 58.35 | 70.82 | +| screen | 70.94 | 87.69 | +| blanket | 8.31 | 9.19 | +| sculpture | 57.24 | 73.42 | +| hood | 52.8 | 58.34 | +| sconce | 37.48 | 49.05 | +| vase | 38.56 | 52.14 | +| traffic light | 32.52 | 48.78 | +| tray | 6.64 | 10.33 | +| ashcan | 38.69 | 58.21 | +| fan | 50.76 | 61.35 | +| pier | 53.07 | 70.18 | +| crt screen | 12.54 | 25.76 | +| plate | 53.88 | 68.34 | +| monitor | 22.26 | 25.25 | +| bulletin board | 33.86 | 50.7 | +| shower | 3.01 | 15.15 | +| radiator | 42.32 | 44.54 | +| glass | 15.85 | 17.42 | +| clock | 24.47 | 28.43 | +| flag | 29.78 | 34.5 | ++---------------------+-------+-------+ +2023/11/05 06:10:26 - mmengine - INFO - Iter(val) [209/209] coco/bbox_mAP: 0.4450 coco/bbox_mAP_50: 0.6160 coco/bbox_mAP_75: 0.4840 coco/bbox_mAP_s: 0.2710 coco/bbox_mAP_m: 0.4960 coco/bbox_mAP_l: 0.5950 coco/segm_mAP: 0.2970 coco/segm_mAP_50: 0.5340 coco/segm_mAP_75: 0.2890 coco/segm_mAP_s: 0.1420 coco/segm_mAP_m: 0.3430 coco/segm_mAP_l: 0.4690 Bleu_1: 0.7349 Bleu_2: 0.5686 Bleu_3: 0.4288 Bleu_4: 0.3225 METEOR: 0.2607 ROUGE_L: 0.5429 CIDEr: 1.0318 SPICE: 0.1932 aAcc: 81.6700 mIoU: 46.3200 mAcc: 57.8300 visual-grounding/miou: 0.7715 visual-grounding/acc: 0.8409 data_time: 0.0046 time: 0.5234 +2023/11/05 06:19:26 - mmengine - INFO - Iter(train) [420500/640000] base_lr: 5.4118e-05 lr: 6.7380e-06 eta: 2 days, 18:22:30 time: 1.0953 data_time: 0.0329 memory: 21521 grad_norm: 3.3779 loss: 1.2382 caption_loss_cls: 2.1326 grounding_loss_reg: 2.5886 detection_loss_cls: 0.0328 detection_loss_reg: 0.3346 semantic_segmentation_loss_cls: 0.0083 instance_segmentation_loss_cls: 0.0335 instance_segmentation_loss_reg: 0.3366 instance_segmentation_loss_poly: 0.8572 +2023/11/05 06:28:35 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231104_135211 +2023/11/05 06:28:35 - mmengine - INFO - Iter(train) [421000/640000] base_lr: 5.3904e-05 lr: 6.7186e-06 eta: 2 days, 18:13:45 time: 1.0937 data_time: 0.0328 memory: 21521 grad_norm: 3.3999 loss: 1.2454 caption_loss_cls: 2.1368 grounding_loss_reg: 2.5857 detection_loss_cls: 0.0327 detection_loss_reg: 0.3346 semantic_segmentation_loss_cls: 0.0083 instance_segmentation_loss_cls: 0.0334 instance_segmentation_loss_reg: 0.3354 instance_segmentation_loss_poly: 0.8557 +2023/11/05 06:28:35 - mmengine - INFO - Saving checkpoint at 421000 iterations +2023/11/05 06:37:10 - mmengine - INFO - Iter(train) [421500/640000] base_lr: 5.3691e-05 lr: 6.6991e-06 eta: 2 days, 18:02:34 time: 1.0828 data_time: 0.0325 memory: 21521 grad_norm: 3.4250 loss: 1.2453 caption_loss_cls: 2.1338 grounding_loss_reg: 2.5827 detection_loss_cls: 0.0327 detection_loss_reg: 0.3353 semantic_segmentation_loss_cls: 0.0083 instance_segmentation_loss_cls: 0.0334 instance_segmentation_loss_reg: 0.3355 instance_segmentation_loss_poly: 0.8558 +2023/11/05 06:46:47 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231104_135211 +2023/11/05 06:46:47 - mmengine - INFO - Iter(train) [422000/640000] base_lr: 5.3477e-05 lr: 6.6797e-06 eta: 2 days, 17:55:45 time: 1.0886 data_time: 0.0327 memory: 21521 grad_norm: 3.4240 loss: 1.2506 caption_loss_cls: 2.1332 grounding_loss_reg: 2.5823 detection_loss_cls: 0.0326 detection_loss_reg: 0.3349 semantic_segmentation_loss_cls: 0.0083 instance_segmentation_loss_cls: 0.0334 instance_segmentation_loss_reg: 0.3358 instance_segmentation_loss_poly: 0.8568 +2023/11/05 06:46:47 - mmengine - INFO - Saving checkpoint at 422000 iterations +2023/11/05 06:55:55 - mmengine - INFO - Iter(train) [422500/640000] base_lr: 5.3264e-05 lr: 6.6604e-06 eta: 2 days, 17:46:54 time: 1.0876 data_time: 0.0329 memory: 21521 grad_norm: 3.4346 loss: 1.2634 caption_loss_cls: 2.1369 grounding_loss_reg: 2.5799 detection_loss_cls: 0.0325 detection_loss_reg: 0.3342 semantic_segmentation_loss_cls: 0.0082 instance_segmentation_loss_cls: 0.0336 instance_segmentation_loss_reg: 0.3371 instance_segmentation_loss_poly: 0.8586 +2023/11/05 07:04:55 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231104_135211 +2023/11/05 07:04:55 - mmengine - INFO - Iter(train) [423000/640000] base_lr: 5.3052e-05 lr: 6.6410e-06 eta: 2 days, 17:37:32 time: 1.0847 data_time: 0.0328 memory: 21521 grad_norm: 3.4283 loss: 1.2618 caption_loss_cls: 2.1352 grounding_loss_reg: 2.5795 detection_loss_cls: 0.0326 detection_loss_reg: 0.3347 semantic_segmentation_loss_cls: 0.0082 instance_segmentation_loss_cls: 0.0337 instance_segmentation_loss_reg: 0.3377 instance_segmentation_loss_poly: 0.8596 +2023/11/05 07:04:55 - mmengine - INFO - Saving checkpoint at 423000 iterations +2023/11/05 07:13:46 - mmengine - INFO - Iter(train) [423500/640000] base_lr: 5.2839e-05 lr: 6.6217e-06 eta: 2 days, 17:27:32 time: 1.0811 data_time: 0.0326 memory: 21521 grad_norm: 3.4373 loss: 1.2574 caption_loss_cls: 2.1341 grounding_loss_reg: 2.5802 detection_loss_cls: 0.0327 detection_loss_reg: 0.3361 semantic_segmentation_loss_cls: 0.0082 instance_segmentation_loss_cls: 0.0337 instance_segmentation_loss_reg: 0.3376 instance_segmentation_loss_poly: 0.8599 +2023/11/05 07:22:48 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231104_135211 +2023/11/05 07:22:48 - mmengine - INFO - Iter(train) [424000/640000] base_lr: 5.2627e-05 lr: 6.6024e-06 eta: 2 days, 17:18:18 time: 1.0853 data_time: 0.0328 memory: 21521 grad_norm: 3.4131 loss: 1.2656 caption_loss_cls: 2.1327 grounding_loss_reg: 2.5802 detection_loss_cls: 0.0328 detection_loss_reg: 0.3371 semantic_segmentation_loss_cls: 0.0082 instance_segmentation_loss_cls: 0.0338 instance_segmentation_loss_reg: 0.3376 instance_segmentation_loss_poly: 0.8607 +2023/11/05 07:22:48 - mmengine - INFO - Saving checkpoint at 424000 iterations +2023/11/05 07:31:48 - mmengine - INFO - Iter(train) [424500/640000] base_lr: 5.2415e-05 lr: 6.5832e-06 eta: 2 days, 17:08:56 time: 1.0848 data_time: 0.0359 memory: 21521 grad_norm: 3.4333 loss: 1.2752 caption_loss_cls: 2.1315 grounding_loss_reg: 2.5773 detection_loss_cls: 0.0328 detection_loss_reg: 0.3369 semantic_segmentation_loss_cls: 0.0082 instance_segmentation_loss_cls: 0.0338 instance_segmentation_loss_reg: 0.3386 instance_segmentation_loss_poly: 0.8626 +2023/11/05 07:39:48 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231104_135211 +2023/11/05 07:39:48 - mmengine - INFO - Iter(train) [425000/640000] base_lr: 5.2204e-05 lr: 6.5640e-06 eta: 2 days, 16:55:43 time: 1.0674 data_time: 0.0353 memory: 21521 grad_norm: 3.4820 loss: 1.2760 caption_loss_cls: 2.1332 grounding_loss_reg: 2.5753 detection_loss_cls: 0.0328 detection_loss_reg: 0.3367 semantic_segmentation_loss_cls: 0.0082 instance_segmentation_loss_cls: 0.0337 instance_segmentation_loss_reg: 0.3386 instance_segmentation_loss_poly: 0.8628 +2023/11/05 07:39:48 - mmengine - INFO - Saving checkpoint at 425000 iterations +2023/11/05 07:49:08 - mmengine - INFO - Iter(train) [425500/640000] base_lr: 5.1992e-05 lr: 6.5447e-06 eta: 2 days, 16:47:40 time: 1.0788 data_time: 0.0356 memory: 21521 grad_norm: 3.4324 loss: 1.2642 caption_loss_cls: 2.1303 grounding_loss_reg: 2.5736 detection_loss_cls: 0.0329 detection_loss_reg: 0.3378 semantic_segmentation_loss_cls: 0.0082 instance_segmentation_loss_cls: 0.0336 instance_segmentation_loss_reg: 0.3375 instance_segmentation_loss_poly: 0.8612 +2023/11/05 07:58:02 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231104_135211 +2023/11/05 07:58:02 - mmengine - INFO - Iter(train) [426000/640000] base_lr: 5.1781e-05 lr: 6.5256e-06 eta: 2 days, 16:38:00 time: 1.0681 data_time: 0.0353 memory: 21521 grad_norm: 3.4966 loss: 1.2753 caption_loss_cls: 2.1313 grounding_loss_reg: 2.5752 detection_loss_cls: 0.0329 detection_loss_reg: 0.3376 semantic_segmentation_loss_cls: 0.0082 instance_segmentation_loss_cls: 0.0338 instance_segmentation_loss_reg: 0.3390 instance_segmentation_loss_poly: 0.8642 +2023/11/05 07:58:02 - mmengine - INFO - Saving checkpoint at 426000 iterations +2023/11/05 08:07:03 - mmengine - INFO - Iter(train) [426500/640000] base_lr: 5.1571e-05 lr: 6.5064e-06 eta: 2 days, 16:28:45 time: 1.0663 data_time: 0.0351 memory: 21521 grad_norm: 3.4879 loss: 1.2659 caption_loss_cls: 2.1330 grounding_loss_reg: 2.5722 detection_loss_cls: 0.0328 detection_loss_reg: 0.3371 semantic_segmentation_loss_cls: 0.0082 instance_segmentation_loss_cls: 0.0339 instance_segmentation_loss_reg: 0.3393 instance_segmentation_loss_poly: 0.8642 +2023/11/05 08:15:44 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231104_135211 +2023/11/05 08:15:44 - mmengine - INFO - Iter(train) [427000/640000] base_lr: 5.1360e-05 lr: 6.4873e-06 eta: 2 days, 16:18:15 time: 1.0614 data_time: 0.0348 memory: 21521 grad_norm: 3.5209 loss: 1.2661 caption_loss_cls: 2.1363 grounding_loss_reg: 2.5698 detection_loss_cls: 0.0327 detection_loss_reg: 0.3370 semantic_segmentation_loss_cls: 0.0082 instance_segmentation_loss_cls: 0.0338 instance_segmentation_loss_reg: 0.3390 instance_segmentation_loss_poly: 0.8642 +2023/11/05 08:15:44 - mmengine - INFO - Saving checkpoint at 427000 iterations +2023/11/05 08:25:34 - mmengine - INFO - Iter(train) [427500/640000] base_lr: 5.1150e-05 lr: 6.4682e-06 eta: 2 days, 16:11:59 time: 1.0761 data_time: 0.0353 memory: 21521 grad_norm: 3.4776 loss: 1.2626 caption_loss_cls: 2.1388 grounding_loss_reg: 2.5651 detection_loss_cls: 0.0329 detection_loss_reg: 0.3374 semantic_segmentation_loss_cls: 0.0082 instance_segmentation_loss_cls: 0.0338 instance_segmentation_loss_reg: 0.3382 instance_segmentation_loss_poly: 0.8634 +2023/11/05 08:34:42 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231104_135211 +2023/11/05 08:34:42 - mmengine - INFO - Iter(train) [428000/640000] base_lr: 5.0940e-05 lr: 6.4491e-06 eta: 2 days, 16:03:08 time: 1.0776 data_time: 0.0354 memory: 21521 grad_norm: 3.4834 loss: 1.2619 caption_loss_cls: 2.1384 grounding_loss_reg: 2.5630 detection_loss_cls: 0.0329 detection_loss_reg: 0.3378 semantic_segmentation_loss_cls: 0.0082 instance_segmentation_loss_cls: 0.0338 instance_segmentation_loss_reg: 0.3383 instance_segmentation_loss_poly: 0.8632 +2023/11/05 08:34:42 - mmengine - INFO - Saving checkpoint at 428000 iterations +2023/11/05 08:44:03 - mmengine - INFO - Iter(train) [428500/640000] base_lr: 5.0731e-05 lr: 6.4301e-06 eta: 2 days, 15:55:07 time: 1.0830 data_time: 0.0354 memory: 21521 grad_norm: 3.4774 loss: 1.2578 caption_loss_cls: 2.1395 grounding_loss_reg: 2.5625 detection_loss_cls: 0.0327 detection_loss_reg: 0.3362 semantic_segmentation_loss_cls: 0.0082 instance_segmentation_loss_cls: 0.0336 instance_segmentation_loss_reg: 0.3375 instance_segmentation_loss_poly: 0.8616 +2023/11/05 08:53:03 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231104_135211 +2023/11/05 08:53:03 - mmengine - INFO - Iter(train) [429000/640000] base_lr: 5.0522e-05 lr: 6.4111e-06 eta: 2 days, 15:45:46 time: 1.0980 data_time: 0.0359 memory: 21521 grad_norm: 3.4310 loss: 1.2479 caption_loss_cls: 2.1356 grounding_loss_reg: 2.5581 detection_loss_cls: 0.0327 detection_loss_reg: 0.3360 semantic_segmentation_loss_cls: 0.0082 instance_segmentation_loss_cls: 0.0336 instance_segmentation_loss_reg: 0.3376 instance_segmentation_loss_poly: 0.8619 +2023/11/05 08:53:03 - mmengine - INFO - Saving checkpoint at 429000 iterations +2023/11/05 09:02:27 - mmengine - INFO - Iter(train) [429500/640000] base_lr: 5.0313e-05 lr: 6.3921e-06 eta: 2 days, 15:37:49 time: 1.0989 data_time: 0.0361 memory: 21521 grad_norm: 3.4680 loss: 1.2557 caption_loss_cls: 2.1380 grounding_loss_reg: 2.5537 detection_loss_cls: 0.0326 detection_loss_reg: 0.3359 semantic_segmentation_loss_cls: 0.0082 instance_segmentation_loss_cls: 0.0335 instance_segmentation_loss_reg: 0.3369 instance_segmentation_loss_poly: 0.8598 +2023/11/05 09:11:49 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231104_135211 +2023/11/05 09:11:49 - mmengine - INFO - Iter(train) [430000/640000] base_lr: 5.0104e-05 lr: 6.3731e-06 eta: 2 days, 15:29:48 time: 1.1060 data_time: 0.0363 memory: 21521 grad_norm: 3.4312 loss: 1.2468 caption_loss_cls: 2.1385 grounding_loss_reg: 2.5506 detection_loss_cls: 0.0326 detection_loss_reg: 0.3359 semantic_segmentation_loss_cls: 0.0082 instance_segmentation_loss_cls: 0.0334 instance_segmentation_loss_reg: 0.3373 instance_segmentation_loss_poly: 0.8609 +2023/11/05 09:11:49 - mmengine - INFO - Saving checkpoint at 430000 iterations +2023/11/05 09:21:25 - mmengine - INFO - Iter(train) [430500/640000] base_lr: 4.9896e-05 lr: 6.3542e-06 eta: 2 days, 15:22:29 time: 1.1146 data_time: 0.0366 memory: 21521 grad_norm: 3.4125 loss: 1.2389 caption_loss_cls: 2.1340 grounding_loss_reg: 2.5491 detection_loss_cls: 0.0325 detection_loss_reg: 0.3344 semantic_segmentation_loss_cls: 0.0081 instance_segmentation_loss_cls: 0.0334 instance_segmentation_loss_reg: 0.3375 instance_segmentation_loss_poly: 0.8609 +2023/11/05 09:29:55 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231104_135211 +2023/11/05 09:29:55 - mmengine - INFO - Iter(train) [431000/640000] base_lr: 4.9688e-05 lr: 6.3353e-06 eta: 2 days, 15:11:27 time: 1.1120 data_time: 0.0364 memory: 21521 grad_norm: 3.3657 loss: 1.2344 caption_loss_cls: 2.1345 grounding_loss_reg: 2.5484 detection_loss_cls: 0.0324 detection_loss_reg: 0.3337 semantic_segmentation_loss_cls: 0.0081 instance_segmentation_loss_cls: 0.0334 instance_segmentation_loss_reg: 0.3367 instance_segmentation_loss_poly: 0.8598 +2023/11/05 09:29:55 - mmengine - INFO - Saving checkpoint at 431000 iterations +2023/11/05 09:39:06 - mmengine - INFO - Iter(train) [431500/640000] base_lr: 4.9480e-05 lr: 6.3164e-06 eta: 2 days, 15:02:45 time: 1.1024 data_time: 0.0361 memory: 21521 grad_norm: 3.4010 loss: 1.2388 caption_loss_cls: 2.1334 grounding_loss_reg: 2.5459 detection_loss_cls: 0.0323 detection_loss_reg: 0.3335 semantic_segmentation_loss_cls: 0.0081 instance_segmentation_loss_cls: 0.0333 instance_segmentation_loss_reg: 0.3361 instance_segmentation_loss_poly: 0.8580 +2023/11/05 09:47:52 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231104_135211 +2023/11/05 09:47:52 - mmengine - INFO - Iter(train) [432000/640000] base_lr: 4.9273e-05 lr: 6.2976e-06 eta: 2 days, 14:52:40 time: 1.0969 data_time: 0.0359 memory: 21521 grad_norm: 3.4208 loss: 1.2374 caption_loss_cls: 2.1355 grounding_loss_reg: 2.5414 detection_loss_cls: 0.0323 detection_loss_reg: 0.3328 semantic_segmentation_loss_cls: 0.0081 instance_segmentation_loss_cls: 0.0332 instance_segmentation_loss_reg: 0.3353 instance_segmentation_loss_poly: 0.8565 +2023/11/05 09:47:52 - mmengine - INFO - Saving checkpoint at 432000 iterations +2023/11/05 09:57:07 - mmengine - INFO - Iter(train) [432500/640000] base_lr: 4.9066e-05 lr: 6.2787e-06 eta: 2 days, 14:44:09 time: 1.0952 data_time: 0.0360 memory: 21521 grad_norm: 3.4349 loss: 1.2422 caption_loss_cls: 2.1345 grounding_loss_reg: 2.5376 detection_loss_cls: 0.0323 detection_loss_reg: 0.3332 semantic_segmentation_loss_cls: 0.0081 instance_segmentation_loss_cls: 0.0331 instance_segmentation_loss_reg: 0.3338 instance_segmentation_loss_poly: 0.8546 +2023/11/05 10:06:33 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231104_135211 +2023/11/05 10:06:33 - mmengine - INFO - Iter(train) [433000/640000] base_lr: 4.8859e-05 lr: 6.2599e-06 eta: 2 days, 14:36:13 time: 1.1017 data_time: 0.0362 memory: 21521 grad_norm: 3.4308 loss: 1.2456 caption_loss_cls: 2.1343 grounding_loss_reg: 2.5351 detection_loss_cls: 0.0322 detection_loss_reg: 0.3322 semantic_segmentation_loss_cls: 0.0081 instance_segmentation_loss_cls: 0.0330 instance_segmentation_loss_reg: 0.3341 instance_segmentation_loss_poly: 0.8562 +2023/11/05 10:06:33 - mmengine - INFO - Saving checkpoint at 433000 iterations +2023/11/05 10:15:47 - mmengine - INFO - Iter(train) [433500/640000] base_lr: 4.8653e-05 lr: 6.2412e-06 eta: 2 days, 14:27:38 time: 1.0993 data_time: 0.0359 memory: 21521 grad_norm: 3.3905 loss: 1.2336 caption_loss_cls: 2.1326 grounding_loss_reg: 2.5358 detection_loss_cls: 0.0320 detection_loss_reg: 0.3307 semantic_segmentation_loss_cls: 0.0081 instance_segmentation_loss_cls: 0.0330 instance_segmentation_loss_reg: 0.3335 instance_segmentation_loss_poly: 0.8557 +2023/11/05 10:24:52 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231104_135211 +2023/11/05 10:24:52 - mmengine - INFO - Iter(train) [434000/640000] base_lr: 4.8447e-05 lr: 6.2224e-06 eta: 2 days, 14:18:36 time: 1.0950 data_time: 0.0360 memory: 21521 grad_norm: 3.4189 loss: 1.2408 caption_loss_cls: 2.1345 grounding_loss_reg: 2.5321 detection_loss_cls: 0.0320 detection_loss_reg: 0.3307 semantic_segmentation_loss_cls: 0.0081 instance_segmentation_loss_cls: 0.0330 instance_segmentation_loss_reg: 0.3339 instance_segmentation_loss_poly: 0.8569 +2023/11/05 10:24:52 - mmengine - INFO - Saving checkpoint at 434000 iterations +2023/11/05 10:34:16 - mmengine - INFO - Iter(train) [434500/640000] base_lr: 4.8241e-05 lr: 6.2037e-06 eta: 2 days, 14:10:30 time: 1.0920 data_time: 0.0360 memory: 21521 grad_norm: 3.4293 loss: 1.2500 caption_loss_cls: 2.1372 grounding_loss_reg: 2.5314 detection_loss_cls: 0.0320 detection_loss_reg: 0.3308 semantic_segmentation_loss_cls: 0.0081 instance_segmentation_loss_cls: 0.0329 instance_segmentation_loss_reg: 0.3327 instance_segmentation_loss_poly: 0.8545 +2023/11/05 10:43:11 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231104_135211 +2023/11/05 10:43:11 - mmengine - INFO - Iter(train) [435000/640000] base_lr: 4.8036e-05 lr: 6.1851e-06 eta: 2 days, 14:00:54 time: 1.0982 data_time: 0.0361 memory: 21521 grad_norm: 3.4227 loss: 1.2432 caption_loss_cls: 2.1344 grounding_loss_reg: 2.5277 detection_loss_cls: 0.0320 detection_loss_reg: 0.3315 semantic_segmentation_loss_cls: 0.0081 instance_segmentation_loss_cls: 0.0328 instance_segmentation_loss_reg: 0.3314 instance_segmentation_loss_poly: 0.8525 +2023/11/05 10:43:11 - mmengine - INFO - Saving checkpoint at 435000 iterations +2023/11/05 10:52:07 - mmengine - INFO - Iter(train) [435500/640000] base_lr: 4.7831e-05 lr: 6.1664e-06 eta: 2 days, 13:51:21 time: 1.0943 data_time: 0.0361 memory: 21521 grad_norm: 3.4177 loss: 1.2380 caption_loss_cls: 2.1312 grounding_loss_reg: 2.5240 detection_loss_cls: 0.0319 detection_loss_reg: 0.3302 semantic_segmentation_loss_cls: 0.0081 instance_segmentation_loss_cls: 0.0328 instance_segmentation_loss_reg: 0.3314 instance_segmentation_loss_poly: 0.8518 +2023/11/05 11:01:05 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231104_135211 +2023/11/05 11:01:05 - mmengine - INFO - Iter(train) [436000/640000] base_lr: 4.7626e-05 lr: 6.1478e-06 eta: 2 days, 13:41:59 time: 1.0975 data_time: 0.0361 memory: 21521 grad_norm: 3.3882 loss: 1.2350 caption_loss_cls: 2.1325 grounding_loss_reg: 2.5227 detection_loss_cls: 0.0318 detection_loss_reg: 0.3296 semantic_segmentation_loss_cls: 0.0081 instance_segmentation_loss_cls: 0.0327 instance_segmentation_loss_reg: 0.3308 instance_segmentation_loss_poly: 0.8511 +2023/11/05 11:01:05 - mmengine - INFO - Saving checkpoint at 436000 iterations +2023/11/05 11:10:03 - mmengine - INFO - Iter(train) [436500/640000] base_lr: 4.7421e-05 lr: 6.1292e-06 eta: 2 days, 13:32:33 time: 1.0932 data_time: 0.0359 memory: 21521 grad_norm: 3.3900 loss: 1.2333 caption_loss_cls: 2.1298 grounding_loss_reg: 2.5221 detection_loss_cls: 0.0317 detection_loss_reg: 0.3286 semantic_segmentation_loss_cls: 0.0081 instance_segmentation_loss_cls: 0.0326 instance_segmentation_loss_reg: 0.3305 instance_segmentation_loss_poly: 0.8510 +2023/11/05 11:19:13 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231104_135211 +2023/11/05 11:19:13 - mmengine - INFO - Iter(train) [437000/640000] base_lr: 4.7217e-05 lr: 6.1106e-06 eta: 2 days, 13:23:43 time: 1.0892 data_time: 0.0357 memory: 21521 grad_norm: 3.3752 loss: 1.2254 caption_loss_cls: 2.1289 grounding_loss_reg: 2.5195 detection_loss_cls: 0.0317 detection_loss_reg: 0.3289 semantic_segmentation_loss_cls: 0.0081 instance_segmentation_loss_cls: 0.0325 instance_segmentation_loss_reg: 0.3302 instance_segmentation_loss_poly: 0.8498 +2023/11/05 11:19:13 - mmengine - INFO - Saving checkpoint at 437000 iterations +2023/11/05 11:28:23 - mmengine - INFO - Iter(train) [437500/640000] base_lr: 4.7013e-05 lr: 6.0921e-06 eta: 2 days, 13:14:54 time: 1.0882 data_time: 0.0358 memory: 21521 grad_norm: 3.4278 loss: 1.2362 caption_loss_cls: 2.1238 grounding_loss_reg: 2.5168 detection_loss_cls: 0.0315 detection_loss_reg: 0.3276 semantic_segmentation_loss_cls: 0.0081 instance_segmentation_loss_cls: 0.0325 instance_segmentation_loss_reg: 0.3310 instance_segmentation_loss_poly: 0.8519 +2023/11/05 11:37:36 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231104_135211 +2023/11/05 11:37:36 - mmengine - INFO - Iter(train) [438000/640000] base_lr: 4.6810e-05 lr: 6.0736e-06 eta: 2 days, 13:06:15 time: 1.0901 data_time: 0.0357 memory: 21521 grad_norm: 3.3960 loss: 1.2278 caption_loss_cls: 2.1260 grounding_loss_reg: 2.5158 detection_loss_cls: 0.0315 detection_loss_reg: 0.3279 semantic_segmentation_loss_cls: 0.0081 instance_segmentation_loss_cls: 0.0325 instance_segmentation_loss_reg: 0.3313 instance_segmentation_loss_poly: 0.8522 +2023/11/05 11:37:36 - mmengine - INFO - Saving checkpoint at 438000 iterations +2023/11/05 11:46:46 - mmengine - INFO - Iter(train) [438500/640000] base_lr: 4.6607e-05 lr: 6.0551e-06 eta: 2 days, 12:57:24 time: 1.0867 data_time: 0.0357 memory: 21521 grad_norm: 3.4112 loss: 1.2287 caption_loss_cls: 2.1270 grounding_loss_reg: 2.5166 detection_loss_cls: 0.0315 detection_loss_reg: 0.3285 semantic_segmentation_loss_cls: 0.0081 instance_segmentation_loss_cls: 0.0325 instance_segmentation_loss_reg: 0.3314 instance_segmentation_loss_poly: 0.8524 +2023/11/05 11:56:03 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231104_135211 +2023/11/05 11:56:03 - mmengine - INFO - Iter(train) [439000/640000] base_lr: 4.6404e-05 lr: 6.0367e-06 eta: 2 days, 12:48:55 time: 1.0923 data_time: 0.0361 memory: 21521 grad_norm: 3.4136 loss: 1.2332 caption_loss_cls: 2.1246 grounding_loss_reg: 2.5150 detection_loss_cls: 0.0314 detection_loss_reg: 0.3285 semantic_segmentation_loss_cls: 0.0081 instance_segmentation_loss_cls: 0.0325 instance_segmentation_loss_reg: 0.3317 instance_segmentation_loss_poly: 0.8522 +2023/11/05 11:56:03 - mmengine - INFO - Saving checkpoint at 439000 iterations +2023/11/05 12:04:53 - mmengine - INFO - Iter(train) [439500/640000] base_lr: 4.6201e-05 lr: 6.0183e-06 eta: 2 days, 12:39:09 time: 1.0909 data_time: 0.0360 memory: 21521 grad_norm: 3.4389 loss: 1.2357 caption_loss_cls: 2.1230 grounding_loss_reg: 2.5132 detection_loss_cls: 0.0315 detection_loss_reg: 0.3291 semantic_segmentation_loss_cls: 0.0081 instance_segmentation_loss_cls: 0.0325 instance_segmentation_loss_reg: 0.3320 instance_segmentation_loss_poly: 0.8523 +2023/11/05 12:14:05 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231104_135211 +2023/11/05 12:14:05 - mmengine - INFO - Iter(train) [440000/640000] base_lr: 4.5999e-05 lr: 5.9999e-06 eta: 2 days, 12:30:23 time: 1.0941 data_time: 0.0362 memory: 21521 grad_norm: 3.4714 loss: 1.2353 caption_loss_cls: 2.1217 grounding_loss_reg: 2.5101 detection_loss_cls: 0.0315 detection_loss_reg: 0.3295 semantic_segmentation_loss_cls: 0.0081 instance_segmentation_loss_cls: 0.0325 instance_segmentation_loss_reg: 0.3322 instance_segmentation_loss_poly: 0.8526 +2023/11/05 12:14:05 - mmengine - INFO - Saving checkpoint at 440000 iterations +2023/11/05 12:22:57 - mmengine - INFO - Evaluating bbox... +2023/11/05 12:23:54 - mmengine - INFO - bbox_mAP_copypaste: 0.454 0.628 0.491 0.278 0.499 0.601 +2023/11/05 12:23:54 - mmengine - INFO - Evaluating segm... +2023/11/05 12:25:06 - mmengine - INFO - segm_mAP_copypaste: 0.308 0.550 0.301 0.152 0.350 0.477 +2023/11/05 12:29:56 - mmengine - INFO - per class results: +2023/11/05 12:29:56 - mmengine - INFO - ++---------------------+-------+-------+ +| Class | IoU | Acc | ++---------------------+-------+-------+ +| wall | 75.47 | 88.13 | +| building | 79.72 | 89.34 | +| sky | 92.88 | 97.66 | +| floor | 79.54 | 88.95 | +| tree | 72.27 | 87.68 | +| ceiling | 83.26 | 94.92 | +| road | 81.91 | 89.88 | +| bed | 86.72 | 95.38 | +| windowpane | 60.27 | 76.66 | +| grass | 68.81 | 84.96 | +| cabinet | 57.03 | 68.88 | +| sidewalk | 66.56 | 80.18 | +| person | 79.19 | 90.21 | +| earth | 39.27 | 54.3 | +| door | 49.32 | 67.57 | +| table | 59.16 | 74.32 | +| mountain | 52.8 | 65.33 | +| plant | 51.12 | 60.86 | +| curtain | 67.69 | 84.52 | +| chair | 56.02 | 69.3 | +| car | 83.31 | 90.73 | +| water | 46.23 | 57.89 | +| painting | 70.46 | 86.05 | +| sofa | 65.73 | 80.4 | +| shelf | 40.92 | 59.9 | +| house | 36.8 | 57.57 | +| sea | 49.55 | 81.99 | +| mirror | 61.07 | 76.43 | +| rug | 67.19 | 77.62 | +| field | 25.59 | 34.51 | +| armchair | 43.5 | 62.28 | +| seat | 62.56 | 79.97 | +| fence | 34.02 | 45.3 | +| desk | 45.76 | 66.08 | +| rock | 35.4 | 52.68 | +| wardrobe | 45.46 | 66.87 | +| lamp | 59.24 | 74.01 | +| bathtub | 76.81 | 82.4 | +| railing | 26.63 | 40.79 | +| cushion | 55.39 | 70.03 | +| base | 18.98 | 25.96 | +| box | 23.75 | 33.18 | +| column | 48.13 | 60.34 | +| signboard | 35.17 | 47.32 | +| chest of drawers | 35.77 | 49.64 | +| counter | 33.27 | 40.34 | +| sand | 36.48 | 48.74 | +| sink | 70.84 | 77.29 | +| skyscraper | 57.09 | 70.78 | +| fireplace | 73.03 | 89.82 | +| refrigerator | 71.81 | 76.47 | +| grandstand | 34.27 | 67.07 | +| path | 16.09 | 19.06 | +| stairs | 23.57 | 29.82 | +| runway | 64.06 | 78.74 | +| case | 41.97 | 54.6 | +| pool table | 87.42 | 95.4 | +| pillow | 53.88 | 65.51 | +| screen door | 62.72 | 67.47 | +| stairway | 29.87 | 41.91 | +| river | 20.93 | 31.1 | +| bridge | 62.4 | 73.51 | +| bookcase | 35.66 | 57.23 | +| blind | 21.09 | 22.57 | +| coffee table | 63.7 | 77.33 | +| toilet | 81.83 | 88.62 | +| flower | 32.75 | 45.79 | +| book | 46.87 | 64.1 | +| hill | 11.82 | 17.98 | +| bench | 45.19 | 52.51 | +| countertop | 51.36 | 60.3 | +| stove | 72.44 | 83.25 | +| palm | 41.32 | 49.91 | +| kitchen island | 38.84 | 75.26 | +| computer | 58.07 | 62.34 | +| swivel chair | 44.3 | 62.97 | +| boat | 74.26 | 82.65 | +| bar | 30.01 | 36.03 | +| arcade machine | 42.32 | 48.33 | +| hovel | 16.51 | 26.44 | +| bus | 78.96 | 95.98 | +| towel | 56.11 | 65.76 | +| light | 44.9 | 52.66 | +| truck | 40.92 | 60.64 | +| tower | 33.81 | 55.76 | +| chandelier | 62.18 | 75.65 | +| awning | 23.23 | 26.94 | +| streetlight | 25.44 | 32.18 | +| booth | 44.01 | 44.55 | +| television receiver | 68.58 | 81.9 | +| airplane | 55.03 | 64.06 | +| dirt track | 1.41 | 8.04 | +| apparel | 35.48 | 52.82 | +| pole | 28.55 | 37.81 | +| land | 2.66 | 3.36 | +| bannister | 12.27 | 16.07 | +| escalator | 21.94 | 22.77 | +| ottoman | 49.57 | 60.31 | +| bottle | 27.1 | 33.48 | +| buffet | 45.15 | 49.75 | +| poster | 15.06 | 16.76 | +| stage | 13.22 | 26.17 | +| van | 38.97 | 49.27 | +| ship | 72.27 | 73.22 | +| fountain | 6.59 | 6.75 | +| conveyer belt | 70.84 | 86.53 | +| canopy | 13.11 | 15.51 | +| washer | 60.01 | 62.48 | +| plaything | 29.4 | 43.6 | +| swimming pool | 61.64 | 90.1 | +| stool | 43.3 | 65.67 | +| barrel | 24.32 | 84.63 | +| basket | 28.17 | 41.61 | +| waterfall | 62.72 | 94.02 | +| tent | 94.23 | 97.93 | +| bag | 11.7 | 12.59 | +| minibike | 71.91 | 80.36 | +| cradle | 69.51 | 94.65 | +| oven | 34.05 | 43.77 | +| ball | 43.62 | 50.38 | +| food | 46.83 | 51.26 | +| step | 13.38 | 19.34 | +| tank | 41.94 | 42.83 | +| trade name | 24.8 | 30.87 | +| microwave | 75.27 | 80.83 | +| pot | 44.8 | 50.93 | +| animal | 62.89 | 66.3 | +| bicycle | 56.15 | 74.49 | +| lake | 58.84 | 67.8 | +| dishwasher | 55.87 | 72.71 | +| screen | 61.81 | 65.93 | +| blanket | 8.52 | 10.04 | +| sculpture | 57.01 | 67.73 | +| hood | 58.04 | 62.18 | +| sconce | 30.81 | 37.94 | +| vase | 37.98 | 51.79 | +| traffic light | 32.61 | 55.8 | +| tray | 9.58 | 13.85 | +| ashcan | 38.32 | 46.62 | +| fan | 54.0 | 65.88 | +| pier | 44.29 | 83.32 | +| crt screen | 5.55 | 11.27 | +| plate | 54.58 | 67.3 | +| monitor | 40.23 | 67.74 | +| bulletin board | 20.04 | 24.64 | +| shower | 2.29 | 4.43 | +| radiator | 48.07 | 52.72 | +| glass | 16.12 | 17.52 | +| clock | 24.05 | 32.12 | +| flag | 29.22 | 33.01 | ++---------------------+-------+-------+ +2023/11/05 12:30:11 - mmengine - INFO - Iter(val) [209/209] coco/bbox_mAP: 0.4540 coco/bbox_mAP_50: 0.6280 coco/bbox_mAP_75: 0.4910 coco/bbox_mAP_s: 0.2780 coco/bbox_mAP_m: 0.4990 coco/bbox_mAP_l: 0.6010 coco/segm_mAP: 0.3080 coco/segm_mAP_50: 0.5500 coco/segm_mAP_75: 0.3010 coco/segm_mAP_s: 0.1520 coco/segm_mAP_m: 0.3500 coco/segm_mAP_l: 0.4770 Bleu_1: 0.7375 Bleu_2: 0.5732 Bleu_3: 0.4360 Bleu_4: 0.3303 METEOR: 0.2630 ROUGE_L: 0.5467 CIDEr: 1.0508 SPICE: 0.1933 aAcc: 81.7100 mIoU: 46.5100 mAcc: 58.1100 visual-grounding/miou: 0.7714 visual-grounding/acc: 0.8427 data_time: 0.0043 time: 0.5213 +2023/11/05 12:38:53 - mmengine - INFO - Iter(train) [440500/640000] base_lr: 4.5797e-05 lr: 5.9816e-06 eta: 2 days, 12:20:20 time: 1.0907 data_time: 0.0332 memory: 21521 grad_norm: 3.4522 loss: 1.2299 caption_loss_cls: 2.1171 grounding_loss_reg: 2.5115 detection_loss_cls: 0.0315 detection_loss_reg: 0.3296 semantic_segmentation_loss_cls: 0.0080 instance_segmentation_loss_cls: 0.0325 instance_segmentation_loss_reg: 0.3317 instance_segmentation_loss_poly: 0.8517 +2023/11/05 12:47:39 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231104_135211 +2023/11/05 12:47:39 - mmengine - INFO - Iter(train) [441000/640000] base_lr: 4.5596e-05 lr: 5.9632e-06 eta: 2 days, 12:10:23 time: 1.0848 data_time: 0.0330 memory: 21521 grad_norm: 3.4595 loss: 1.2343 caption_loss_cls: 2.1194 grounding_loss_reg: 2.5140 detection_loss_cls: 0.0316 detection_loss_reg: 0.3290 semantic_segmentation_loss_cls: 0.0080 instance_segmentation_loss_cls: 0.0325 instance_segmentation_loss_reg: 0.3322 instance_segmentation_loss_poly: 0.8514 +2023/11/05 12:47:39 - mmengine - INFO - Saving checkpoint at 441000 iterations +2023/11/05 12:56:59 - mmengine - INFO - Iter(train) [441500/640000] base_lr: 4.5394e-05 lr: 5.9449e-06 eta: 2 days, 12:02:01 time: 1.0873 data_time: 0.0333 memory: 21521 grad_norm: 3.4495 loss: 1.2379 caption_loss_cls: 2.1203 grounding_loss_reg: 2.5148 detection_loss_cls: 0.0315 detection_loss_reg: 0.3283 semantic_segmentation_loss_cls: 0.0080 instance_segmentation_loss_cls: 0.0325 instance_segmentation_loss_reg: 0.3324 instance_segmentation_loss_poly: 0.8513 +2023/11/05 13:06:11 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231104_135211 +2023/11/05 13:06:11 - mmengine - INFO - Iter(train) [442000/640000] base_lr: 4.5193e-05 lr: 5.9267e-06 eta: 2 days, 11:53:16 time: 1.0869 data_time: 0.0333 memory: 21521 grad_norm: 3.4493 loss: 1.2373 caption_loss_cls: 2.1166 grounding_loss_reg: 2.5161 detection_loss_cls: 0.0316 detection_loss_reg: 0.3285 semantic_segmentation_loss_cls: 0.0080 instance_segmentation_loss_cls: 0.0324 instance_segmentation_loss_reg: 0.3320 instance_segmentation_loss_poly: 0.8504 +2023/11/05 13:06:11 - mmengine - INFO - Saving checkpoint at 442000 iterations +2023/11/05 13:15:28 - mmengine - INFO - Iter(train) [442500/640000] base_lr: 4.4993e-05 lr: 5.9085e-06 eta: 2 days, 11:44:45 time: 1.0888 data_time: 0.0332 memory: 21521 grad_norm: 3.4192 loss: 1.2282 caption_loss_cls: 2.1176 grounding_loss_reg: 2.5131 detection_loss_cls: 0.0315 detection_loss_reg: 0.3282 semantic_segmentation_loss_cls: 0.0080 instance_segmentation_loss_cls: 0.0324 instance_segmentation_loss_reg: 0.3318 instance_segmentation_loss_poly: 0.8499 +2023/11/05 13:24:32 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231104_135211 +2023/11/05 13:24:32 - mmengine - INFO - Iter(train) [443000/640000] base_lr: 4.4793e-05 lr: 5.8903e-06 eta: 2 days, 11:35:38 time: 1.0854 data_time: 0.0331 memory: 21521 grad_norm: 3.4399 loss: 1.2286 caption_loss_cls: 2.1159 grounding_loss_reg: 2.5139 detection_loss_cls: 0.0315 detection_loss_reg: 0.3287 semantic_segmentation_loss_cls: 0.0080 instance_segmentation_loss_cls: 0.0322 instance_segmentation_loss_reg: 0.3307 instance_segmentation_loss_poly: 0.8480 +2023/11/05 13:24:32 - mmengine - INFO - Saving checkpoint at 443000 iterations +2023/11/05 13:33:36 - mmengine - INFO - Iter(train) [443500/640000] base_lr: 4.4593e-05 lr: 5.8721e-06 eta: 2 days, 11:26:30 time: 1.0888 data_time: 0.0333 memory: 21521 grad_norm: 3.4595 loss: 1.2275 caption_loss_cls: 2.1126 grounding_loss_reg: 2.5124 detection_loss_cls: 0.0314 detection_loss_reg: 0.3278 semantic_segmentation_loss_cls: 0.0080 instance_segmentation_loss_cls: 0.0321 instance_segmentation_loss_reg: 0.3296 instance_segmentation_loss_poly: 0.8452 +2023/11/05 13:42:37 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231104_135211 +2023/11/05 13:42:37 - mmengine - INFO - Iter(train) [444000/640000] base_lr: 4.4393e-05 lr: 5.8539e-06 eta: 2 days, 11:17:16 time: 1.0862 data_time: 0.0332 memory: 21521 grad_norm: 3.4538 loss: 1.2232 caption_loss_cls: 2.1160 grounding_loss_reg: 2.5134 detection_loss_cls: 0.0313 detection_loss_reg: 0.3267 semantic_segmentation_loss_cls: 0.0080 instance_segmentation_loss_cls: 0.0320 instance_segmentation_loss_reg: 0.3292 instance_segmentation_loss_poly: 0.8439 +2023/11/05 13:42:37 - mmengine - INFO - Saving checkpoint at 444000 iterations +2023/11/05 17:50:34 - mmengine - INFO - Iter(train) [444500/640000] base_lr: 4.4194e-05 lr: 5.8358e-06 eta: 2 days, 14:44:56 time: 1.0998 data_time: 0.0330 memory: 21519 grad_norm: 3.4354 loss: 1.2250 caption_loss_cls: 2.1191 grounding_loss_reg: 2.5138 detection_loss_cls: 0.0313 detection_loss_reg: 0.3262 semantic_segmentation_loss_cls: 0.0080 instance_segmentation_loss_cls: 0.0319 instance_segmentation_loss_reg: 0.3288 instance_segmentation_loss_poly: 0.8429 +2023/11/05 17:59:50 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231105_173749 +2023/11/05 17:59:50 - mmengine - INFO - Iter(train) [445000/640000] base_lr: 4.3995e-05 lr: 5.8178e-06 eta: 2 days, 13:21:36 time: 1.1071 data_time: 0.0329 memory: 21519 grad_norm: 3.4663 loss: 1.2199 caption_loss_cls: 2.1186 grounding_loss_reg: 2.5132 detection_loss_cls: 0.0313 detection_loss_reg: 0.3265 semantic_segmentation_loss_cls: 0.0080 instance_segmentation_loss_cls: 0.0319 instance_segmentation_loss_reg: 0.3285 instance_segmentation_loss_poly: 0.8425 +2023/11/05 17:59:50 - mmengine - INFO - Saving checkpoint at 445000 iterations +2023/11/05 18:09:17 - mmengine - INFO - Iter(train) [445500/640000] base_lr: 4.3797e-05 lr: 5.7997e-06 eta: 2 days, 13:13:22 time: 1.1090 data_time: 0.0324 memory: 21519 grad_norm: 3.4500 loss: 1.2069 caption_loss_cls: 2.1202 grounding_loss_reg: 2.5130 detection_loss_cls: 0.0313 detection_loss_reg: 0.3255 semantic_segmentation_loss_cls: 0.0080 instance_segmentation_loss_cls: 0.0319 instance_segmentation_loss_reg: 0.3281 instance_segmentation_loss_poly: 0.8419 +2023/11/05 18:18:07 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231105_173749 +2023/11/05 18:18:07 - mmengine - INFO - Iter(train) [446000/640000] base_lr: 4.3599e-05 lr: 5.7817e-06 eta: 2 days, 12:04:25 time: 1.1036 data_time: 0.0319 memory: 21519 grad_norm: 3.4837 loss: 1.2061 caption_loss_cls: 2.1174 grounding_loss_reg: 2.5124 detection_loss_cls: 0.0313 detection_loss_reg: 0.3252 semantic_segmentation_loss_cls: 0.0080 instance_segmentation_loss_cls: 0.0318 instance_segmentation_loss_reg: 0.3279 instance_segmentation_loss_poly: 0.8417 +2023/11/05 18:18:07 - mmengine - INFO - Saving checkpoint at 446000 iterations +2023/11/05 18:27:35 - mmengine - INFO - Iter(train) [446500/640000] base_lr: 4.3401e-05 lr: 5.7637e-06 eta: 2 days, 12:07:32 time: 1.1061 data_time: 0.0316 memory: 21519 grad_norm: 3.4906 loss: 1.2057 caption_loss_cls: 2.1141 grounding_loss_reg: 2.5099 detection_loss_cls: 0.0314 detection_loss_reg: 0.3250 semantic_segmentation_loss_cls: 0.0080 instance_segmentation_loss_cls: 0.0316 instance_segmentation_loss_reg: 0.3263 instance_segmentation_loss_poly: 0.8394 +2023/11/05 18:37:04 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231105_173749 +2023/11/05 18:37:04 - mmengine - INFO - Iter(train) [447000/640000] base_lr: 4.3204e-05 lr: 5.7458e-06 eta: 2 days, 12:08:18 time: 1.1124 data_time: 0.0316 memory: 21519 grad_norm: 3.5077 loss: 1.2072 caption_loss_cls: 2.1097 grounding_loss_reg: 2.5098 detection_loss_cls: 0.0314 detection_loss_reg: 0.3252 semantic_segmentation_loss_cls: 0.0080 instance_segmentation_loss_cls: 0.0317 instance_segmentation_loss_reg: 0.3273 instance_segmentation_loss_poly: 0.8410 +2023/11/05 18:37:04 - mmengine - INFO - Saving checkpoint at 447000 iterations +2023/11/05 18:46:48 - mmengine - INFO - Iter(train) [447500/640000] base_lr: 4.3006e-05 lr: 5.7279e-06 eta: 2 days, 12:20:23 time: 1.1226 data_time: 0.0315 memory: 21519 grad_norm: 3.4603 loss: 1.1957 caption_loss_cls: 2.1078 grounding_loss_reg: 2.5064 detection_loss_cls: 0.0314 detection_loss_reg: 0.3250 semantic_segmentation_loss_cls: 0.0080 instance_segmentation_loss_cls: 0.0316 instance_segmentation_loss_reg: 0.3268 instance_segmentation_loss_poly: 0.8405 +2023/11/05 18:56:08 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231105_173749 +2023/11/05 18:56:08 - mmengine - INFO - Iter(train) [448000/640000] base_lr: 4.2810e-05 lr: 5.7100e-06 eta: 2 days, 12:07:01 time: 1.1272 data_time: 0.0317 memory: 21519 grad_norm: 3.4826 loss: 1.1999 caption_loss_cls: 2.1033 grounding_loss_reg: 2.5052 detection_loss_cls: 0.0314 detection_loss_reg: 0.3247 semantic_segmentation_loss_cls: 0.0080 instance_segmentation_loss_cls: 0.0315 instance_segmentation_loss_reg: 0.3269 instance_segmentation_loss_poly: 0.8407 +2023/11/05 18:56:08 - mmengine - INFO - Saving checkpoint at 448000 iterations +2023/11/05 19:05:45 - mmengine - INFO - Iter(train) [448500/640000] base_lr: 4.2613e-05 lr: 5.6921e-06 eta: 2 days, 12:06:47 time: 1.1269 data_time: 0.0351 memory: 21519 grad_norm: 3.5001 loss: 1.1990 caption_loss_cls: 2.1034 grounding_loss_reg: 2.5042 detection_loss_cls: 0.0315 detection_loss_reg: 0.3255 semantic_segmentation_loss_cls: 0.0080 instance_segmentation_loss_cls: 0.0315 instance_segmentation_loss_reg: 0.3270 instance_segmentation_loss_poly: 0.8400 +2023/11/05 19:13:53 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231105_173749 +2023/11/05 19:13:53 - mmengine - INFO - Iter(train) [449000/640000] base_lr: 4.2417e-05 lr: 5.6743e-06 eta: 2 days, 11:08:28 time: 1.1102 data_time: 0.0347 memory: 21519 grad_norm: 3.5542 loss: 1.2165 caption_loss_cls: 2.1017 grounding_loss_reg: 2.5001 detection_loss_cls: 0.0315 detection_loss_reg: 0.3256 semantic_segmentation_loss_cls: 0.0080 instance_segmentation_loss_cls: 0.0315 instance_segmentation_loss_reg: 0.3268 instance_segmentation_loss_poly: 0.8394 +2023/11/05 19:13:53 - mmengine - INFO - Saving checkpoint at 449000 iterations +2023/11/05 19:23:36 - mmengine - INFO - Iter(train) [449500/640000] base_lr: 4.2222e-05 lr: 5.6565e-06 eta: 2 days, 11:13:46 time: 1.1141 data_time: 0.0349 memory: 21519 grad_norm: 3.5680 loss: 1.2227 caption_loss_cls: 2.1016 grounding_loss_reg: 2.5004 detection_loss_cls: 0.0314 detection_loss_reg: 0.3257 semantic_segmentation_loss_cls: 0.0080 instance_segmentation_loss_cls: 0.0315 instance_segmentation_loss_reg: 0.3275 instance_segmentation_loss_poly: 0.8411 +2023/11/05 19:33:15 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231105_173749 +2023/11/05 19:33:15 - mmengine - INFO - Iter(train) [450000/640000] base_lr: 4.2026e-05 lr: 5.6387e-06 eta: 2 days, 11:14:06 time: 1.1261 data_time: 0.0351 memory: 21519 grad_norm: 3.5169 loss: 1.2102 caption_loss_cls: 2.0989 grounding_loss_reg: 2.5019 detection_loss_cls: 0.0313 detection_loss_reg: 0.3258 semantic_segmentation_loss_cls: 0.0080 instance_segmentation_loss_cls: 0.0315 instance_segmentation_loss_reg: 0.3278 instance_segmentation_loss_poly: 0.8413 +2023/11/05 19:33:15 - mmengine - INFO - Saving checkpoint at 450000 iterations +2023/11/05 19:43:02 - mmengine - INFO - Iter(train) [450500/640000] base_lr: 4.1831e-05 lr: 5.6210e-06 eta: 2 days, 11:17:08 time: 1.1311 data_time: 0.0357 memory: 21519 grad_norm: 3.5839 loss: 1.2237 caption_loss_cls: 2.1017 grounding_loss_reg: 2.5002 detection_loss_cls: 0.0314 detection_loss_reg: 0.3276 semantic_segmentation_loss_cls: 0.0080 instance_segmentation_loss_cls: 0.0316 instance_segmentation_loss_reg: 0.3289 instance_segmentation_loss_poly: 0.8423 +2023/11/05 19:52:17 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231105_173749 +2023/11/05 19:52:17 - mmengine - INFO - Iter(train) [451000/640000] base_lr: 4.1637e-05 lr: 5.6033e-06 eta: 2 days, 11:04:04 time: 1.1276 data_time: 0.0356 memory: 21519 grad_norm: 3.5890 loss: 1.2241 caption_loss_cls: 2.0979 grounding_loss_reg: 2.5005 detection_loss_cls: 0.0314 detection_loss_reg: 0.3277 semantic_segmentation_loss_cls: 0.0080 instance_segmentation_loss_cls: 0.0315 instance_segmentation_loss_reg: 0.3291 instance_segmentation_loss_poly: 0.8427 +2023/11/05 19:52:17 - mmengine - INFO - Saving checkpoint at 451000 iterations +2023/11/05 20:00:58 - mmengine - INFO - Iter(train) [451500/640000] base_lr: 4.1442e-05 lr: 5.5857e-06 eta: 2 days, 10:37:11 time: 1.1117 data_time: 0.0352 memory: 21519 grad_norm: 3.6741 loss: 1.2406 caption_loss_cls: 2.0946 grounding_loss_reg: 2.4987 detection_loss_cls: 0.0315 detection_loss_reg: 0.3282 semantic_segmentation_loss_cls: 0.0080 instance_segmentation_loss_cls: 0.0314 instance_segmentation_loss_reg: 0.3285 instance_segmentation_loss_poly: 0.8424 +2023/11/05 20:09:47 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231105_173749 +2023/11/05 20:09:47 - mmengine - INFO - Iter(train) [452000/640000] base_lr: 4.1248e-05 lr: 5.5680e-06 eta: 2 days, 10:15:24 time: 1.1039 data_time: 0.0348 memory: 21519 grad_norm: 3.7020 loss: 1.2440 caption_loss_cls: 2.0899 grounding_loss_reg: 2.4989 detection_loss_cls: 0.0314 detection_loss_reg: 0.3280 semantic_segmentation_loss_cls: 0.0080 instance_segmentation_loss_cls: 0.0312 instance_segmentation_loss_reg: 0.3283 instance_segmentation_loss_poly: 0.8414 +2023/11/05 20:09:47 - mmengine - INFO - Saving checkpoint at 452000 iterations +2023/11/05 20:18:41 - mmengine - INFO - Iter(train) [452500/640000] base_lr: 4.1055e-05 lr: 5.5504e-06 eta: 2 days, 9:57:13 time: 1.0932 data_time: 0.0346 memory: 21519 grad_norm: 3.7361 loss: 1.2557 caption_loss_cls: 2.0891 grounding_loss_reg: 2.4989 detection_loss_cls: 0.0313 detection_loss_reg: 0.3278 semantic_segmentation_loss_cls: 0.0080 instance_segmentation_loss_cls: 0.0312 instance_segmentation_loss_reg: 0.3285 instance_segmentation_loss_poly: 0.8423 +2023/11/05 20:27:55 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231105_173749 +2023/11/05 20:27:55 - mmengine - INFO - Iter(train) [453000/640000] base_lr: 4.0862e-05 lr: 5.5329e-06 eta: 2 days, 9:47:00 time: 1.1095 data_time: 0.0352 memory: 21519 grad_norm: 3.6649 loss: 1.2476 caption_loss_cls: 2.0894 grounding_loss_reg: 2.4983 detection_loss_cls: 0.0313 detection_loss_reg: 0.3277 semantic_segmentation_loss_cls: 0.0079 instance_segmentation_loss_cls: 0.0311 instance_segmentation_loss_reg: 0.3285 instance_segmentation_loss_poly: 0.8419 +2023/11/05 20:27:55 - mmengine - INFO - Saving checkpoint at 453000 iterations +2023/11/05 20:37:08 - mmengine - INFO - Iter(train) [453500/640000] base_lr: 4.0669e-05 lr: 5.5153e-06 eta: 2 days, 9:36:41 time: 1.1021 data_time: 0.0349 memory: 21519 grad_norm: 3.6749 loss: 1.2411 caption_loss_cls: 2.0864 grounding_loss_reg: 2.4983 detection_loss_cls: 0.0312 detection_loss_reg: 0.3271 semantic_segmentation_loss_cls: 0.0079 instance_segmentation_loss_cls: 0.0309 instance_segmentation_loss_reg: 0.3277 instance_segmentation_loss_poly: 0.8398 +2023/11/05 20:46:07 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231105_173749 +2023/11/05 20:46:07 - mmengine - INFO - Iter(train) [454000/640000] base_lr: 4.0476e-05 lr: 5.4978e-06 eta: 2 days, 9:21:53 time: 1.0922 data_time: 0.0351 memory: 21519 grad_norm: 3.7767 loss: 1.2681 caption_loss_cls: 2.0834 grounding_loss_reg: 2.4974 detection_loss_cls: 0.0312 detection_loss_reg: 0.3276 semantic_segmentation_loss_cls: 0.0080 instance_segmentation_loss_cls: 0.0308 instance_segmentation_loss_reg: 0.3269 instance_segmentation_loss_poly: 0.8390 +2023/11/05 20:46:07 - mmengine - INFO - Saving checkpoint at 454000 iterations +2023/11/05 20:55:39 - mmengine - INFO - Iter(train) [454500/640000] base_lr: 4.0284e-05 lr: 5.4804e-06 eta: 2 days, 9:17:37 time: 1.0885 data_time: 0.0348 memory: 21519 grad_norm: 3.7964 loss: 1.2667 caption_loss_cls: 2.0825 grounding_loss_reg: 2.4980 detection_loss_cls: 0.0311 detection_loss_reg: 0.3271 semantic_segmentation_loss_cls: 0.0080 instance_segmentation_loss_cls: 0.0308 instance_segmentation_loss_reg: 0.3261 instance_segmentation_loss_poly: 0.8383 +2023/11/05 21:04:23 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231105_173749 +2023/11/05 21:04:23 - mmengine - INFO - Iter(train) [455000/640000] base_lr: 4.0092e-05 lr: 5.4630e-06 eta: 2 days, 8:59:07 time: 1.0806 data_time: 0.0346 memory: 21519 grad_norm: 3.8177 loss: 1.2689 caption_loss_cls: 2.0787 grounding_loss_reg: 2.4966 detection_loss_cls: 0.0311 detection_loss_reg: 0.3267 semantic_segmentation_loss_cls: 0.0080 instance_segmentation_loss_cls: 0.0308 instance_segmentation_loss_reg: 0.3262 instance_segmentation_loss_poly: 0.8382 +2023/11/05 21:04:23 - mmengine - INFO - Saving checkpoint at 455000 iterations +2023/11/05 21:13:41 - mmengine - INFO - Iter(train) [455500/640000] base_lr: 3.9901e-05 lr: 5.4456e-06 eta: 2 days, 8:50:48 time: 1.0898 data_time: 0.0349 memory: 21519 grad_norm: 3.8094 loss: 1.2744 caption_loss_cls: 2.0778 grounding_loss_reg: 2.4950 detection_loss_cls: 0.0310 detection_loss_reg: 0.3257 semantic_segmentation_loss_cls: 0.0080 instance_segmentation_loss_cls: 0.0308 instance_segmentation_loss_reg: 0.3265 instance_segmentation_loss_poly: 0.8395 +2023/11/05 21:22:55 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231105_173749 +2023/11/05 21:22:55 - mmengine - INFO - Iter(train) [456000/640000] base_lr: 3.9710e-05 lr: 5.4282e-06 eta: 2 days, 8:41:26 time: 1.0964 data_time: 0.0351 memory: 21519 grad_norm: 3.7656 loss: 1.2632 caption_loss_cls: 2.0762 grounding_loss_reg: 2.4928 detection_loss_cls: 0.0310 detection_loss_reg: 0.3263 semantic_segmentation_loss_cls: 0.0080 instance_segmentation_loss_cls: 0.0308 instance_segmentation_loss_reg: 0.3270 instance_segmentation_loss_poly: 0.8399 +2023/11/05 21:22:55 - mmengine - INFO - Saving checkpoint at 456000 iterations +2023/11/05 21:32:37 - mmengine - INFO - Iter(train) [456500/640000] base_lr: 3.9519e-05 lr: 5.4109e-06 eta: 2 days, 8:38:38 time: 1.1082 data_time: 0.0352 memory: 21519 grad_norm: 3.7421 loss: 1.2477 caption_loss_cls: 2.0780 grounding_loss_reg: 2.4919 detection_loss_cls: 0.0311 detection_loss_reg: 0.3271 semantic_segmentation_loss_cls: 0.0080 instance_segmentation_loss_cls: 0.0308 instance_segmentation_loss_reg: 0.3273 instance_segmentation_loss_poly: 0.8398 +2023/11/05 21:41:54 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231105_173749 +2023/11/05 21:41:54 - mmengine - INFO - Iter(train) [457000/640000] base_lr: 3.9329e-05 lr: 5.3936e-06 eta: 2 days, 8:29:38 time: 1.1090 data_time: 0.0352 memory: 21519 grad_norm: 3.7595 loss: 1.2474 caption_loss_cls: 2.0758 grounding_loss_reg: 2.4914 detection_loss_cls: 0.0310 detection_loss_reg: 0.3271 semantic_segmentation_loss_cls: 0.0080 instance_segmentation_loss_cls: 0.0308 instance_segmentation_loss_reg: 0.3277 instance_segmentation_loss_poly: 0.8408 +2023/11/05 21:41:54 - mmengine - INFO - Saving checkpoint at 457000 iterations +2023/11/05 21:51:36 - mmengine - INFO - Iter(train) [457500/640000] base_lr: 3.9139e-05 lr: 5.3763e-06 eta: 2 days, 8:26:17 time: 1.1162 data_time: 0.0355 memory: 21519 grad_norm: 3.7358 loss: 1.2542 caption_loss_cls: 2.0747 grounding_loss_reg: 2.4920 detection_loss_cls: 0.0311 detection_loss_reg: 0.3277 semantic_segmentation_loss_cls: 0.0079 instance_segmentation_loss_cls: 0.0309 instance_segmentation_loss_reg: 0.3276 instance_segmentation_loss_poly: 0.8406 +2023/11/05 22:00:45 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231105_173749 +2023/11/05 22:00:45 - mmengine - INFO - Iter(train) [458000/640000] base_lr: 3.8950e-05 lr: 5.3591e-06 eta: 2 days, 8:15:13 time: 1.1188 data_time: 0.0352 memory: 21519 grad_norm: 3.6919 loss: 1.2400 caption_loss_cls: 2.0745 grounding_loss_reg: 2.4916 detection_loss_cls: 0.0310 detection_loss_reg: 0.3277 semantic_segmentation_loss_cls: 0.0079 instance_segmentation_loss_cls: 0.0308 instance_segmentation_loss_reg: 0.3275 instance_segmentation_loss_poly: 0.8398 +2023/11/05 22:00:45 - mmengine - INFO - Saving checkpoint at 458000 iterations +2023/11/05 22:10:25 - mmengine - INFO - Iter(train) [458500/640000] base_lr: 3.8761e-05 lr: 5.3419e-06 eta: 2 days, 8:10:51 time: 1.1207 data_time: 0.0349 memory: 21519 grad_norm: 3.6279 loss: 1.2188 caption_loss_cls: 2.0704 grounding_loss_reg: 2.4892 detection_loss_cls: 0.0309 detection_loss_reg: 0.3267 semantic_segmentation_loss_cls: 0.0079 instance_segmentation_loss_cls: 0.0308 instance_segmentation_loss_reg: 0.3268 instance_segmentation_loss_poly: 0.8387 +2023/11/05 22:19:28 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231105_173749 +2023/11/05 22:19:28 - mmengine - INFO - Iter(train) [459000/640000] base_lr: 3.8572e-05 lr: 5.3247e-06 eta: 2 days, 7:58:34 time: 1.1256 data_time: 0.0352 memory: 21519 grad_norm: 3.6278 loss: 1.2194 caption_loss_cls: 2.0686 grounding_loss_reg: 2.4873 detection_loss_cls: 0.0309 detection_loss_reg: 0.3258 semantic_segmentation_loss_cls: 0.0079 instance_segmentation_loss_cls: 0.0307 instance_segmentation_loss_reg: 0.3268 instance_segmentation_loss_poly: 0.8391 +2023/11/05 22:19:28 - mmengine - INFO - Saving checkpoint at 459000 iterations +2023/11/05 22:28:58 - mmengine - INFO - Iter(train) [459500/640000] base_lr: 3.8383e-05 lr: 5.3076e-06 eta: 2 days, 7:51:47 time: 1.1284 data_time: 0.0355 memory: 21519 grad_norm: 3.6319 loss: 1.2247 caption_loss_cls: 2.0705 grounding_loss_reg: 2.4888 detection_loss_cls: 0.0310 detection_loss_reg: 0.3274 semantic_segmentation_loss_cls: 0.0079 instance_segmentation_loss_cls: 0.0307 instance_segmentation_loss_reg: 0.3272 instance_segmentation_loss_poly: 0.8405 +2023/11/05 22:38:34 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231105_173749 +2023/11/05 22:38:34 - mmengine - INFO - Iter(train) [460000/640000] base_lr: 3.8195e-05 lr: 5.2905e-06 eta: 2 days, 7:46:04 time: 1.1339 data_time: 0.0357 memory: 21519 grad_norm: 3.6460 loss: 1.2302 caption_loss_cls: 2.0725 grounding_loss_reg: 2.4874 detection_loss_cls: 0.0310 detection_loss_reg: 0.3269 semantic_segmentation_loss_cls: 0.0079 instance_segmentation_loss_cls: 0.0307 instance_segmentation_loss_reg: 0.3264 instance_segmentation_loss_poly: 0.8401 +2023/11/05 22:38:34 - mmengine - INFO - Saving checkpoint at 460000 iterations +2023/11/05 22:47:04 - mmengine - INFO - Evaluating bbox... +2023/11/05 22:48:00 - mmengine - INFO - bbox_mAP_copypaste: 0.453 0.626 0.492 0.277 0.503 0.605 +2023/11/05 22:48:00 - mmengine - INFO - Evaluating segm... +2023/11/05 22:49:13 - mmengine - INFO - segm_mAP_copypaste: 0.306 0.546 0.298 0.150 0.354 0.477 +2023/11/05 22:53:58 - mmengine - INFO - per class results: +2023/11/05 22:53:58 - mmengine - INFO - ++---------------------+-------+-------+ +| Class | IoU | Acc | ++---------------------+-------+-------+ +| wall | 76.12 | 87.23 | +| building | 79.88 | 89.84 | +| sky | 92.86 | 98.02 | +| floor | 80.67 | 89.25 | +| tree | 72.31 | 86.67 | +| ceiling | 83.54 | 94.09 | +| road | 81.8 | 89.02 | +| bed | 86.36 | 94.39 | +| windowpane | 58.25 | 71.14 | +| grass | 67.41 | 82.86 | +| cabinet | 59.52 | 72.17 | +| sidewalk | 65.63 | 80.94 | +| person | 78.96 | 91.48 | +| earth | 37.19 | 48.9 | +| door | 47.81 | 63.16 | +| table | 57.35 | 72.14 | +| mountain | 52.52 | 64.99 | +| plant | 50.89 | 64.67 | +| curtain | 69.28 | 85.85 | +| chair | 55.08 | 68.27 | +| car | 81.12 | 91.33 | +| water | 51.04 | 64.68 | +| painting | 66.57 | 85.72 | +| sofa | 66.06 | 77.63 | +| shelf | 42.52 | 67.51 | +| house | 43.95 | 60.98 | +| sea | 48.66 | 70.83 | +| mirror | 63.74 | 71.86 | +| rug | 63.02 | 70.67 | +| field | 32.83 | 53.24 | +| armchair | 44.2 | 70.72 | +| seat | 62.93 | 79.03 | +| fence | 43.45 | 58.83 | +| desk | 41.93 | 69.5 | +| rock | 37.34 | 56.13 | +| wardrobe | 46.4 | 67.22 | +| lamp | 58.53 | 74.73 | +| bathtub | 78.99 | 84.98 | +| railing | 29.53 | 49.93 | +| cushion | 55.22 | 68.15 | +| base | 24.99 | 37.3 | +| box | 23.96 | 29.04 | +| column | 47.97 | 60.24 | +| signboard | 35.29 | 44.54 | +| chest of drawers | 35.21 | 46.99 | +| counter | 29.15 | 42.56 | +| sand | 35.2 | 44.46 | +| sink | 70.83 | 78.01 | +| skyscraper | 31.25 | 37.24 | +| fireplace | 69.04 | 86.93 | +| refrigerator | 76.52 | 84.75 | +| grandstand | 30.78 | 70.6 | +| path | 21.25 | 29.93 | +| stairs | 28.73 | 41.99 | +| runway | 71.9 | 89.01 | +| case | 42.16 | 49.29 | +| pool table | 88.08 | 95.51 | +| pillow | 53.92 | 65.13 | +| screen door | 68.08 | 76.53 | +| stairway | 28.04 | 38.74 | +| river | 12.33 | 25.51 | +| bridge | 50.2 | 59.47 | +| bookcase | 34.44 | 54.45 | +| blind | 25.81 | 30.71 | +| coffee table | 60.68 | 82.58 | +| toilet | 83.91 | 88.73 | +| flower | 32.5 | 45.72 | +| book | 44.15 | 73.25 | +| hill | 8.2 | 19.68 | +| bench | 43.73 | 50.0 | +| countertop | 51.58 | 64.69 | +| stove | 76.88 | 82.44 | +| palm | 42.97 | 57.95 | +| kitchen island | 38.57 | 86.07 | +| computer | 71.73 | 83.29 | +| swivel chair | 43.5 | 61.08 | +| boat | 74.12 | 82.18 | +| bar | 44.21 | 66.3 | +| arcade machine | 32.29 | 34.99 | +| hovel | 12.87 | 16.97 | +| bus | 87.57 | 94.48 | +| towel | 57.71 | 70.71 | +| light | 45.73 | 53.29 | +| truck | 41.25 | 54.15 | +| tower | 37.31 | 48.5 | +| chandelier | 55.85 | 65.07 | +| awning | 24.89 | 30.16 | +| streetlight | 25.64 | 36.26 | +| booth | 43.1 | 51.25 | +| television receiver | 70.83 | 84.28 | +| airplane | 53.69 | 68.76 | +| dirt track | 0.44 | 1.55 | +| apparel | 35.75 | 53.54 | +| pole | 24.6 | 30.44 | +| land | 2.82 | 3.88 | +| bannister | 10.55 | 16.83 | +| escalator | 45.28 | 62.29 | +| ottoman | 46.62 | 68.12 | +| bottle | 24.29 | 29.29 | +| buffet | 38.55 | 41.58 | +| poster | 23.59 | 53.68 | +| stage | 14.57 | 25.79 | +| van | 24.5 | 31.56 | +| ship | 66.24 | 70.07 | +| fountain | 16.39 | 17.16 | +| conveyer belt | 76.36 | 88.25 | +| canopy | 26.11 | 43.28 | +| washer | 69.13 | 71.0 | +| plaything | 19.83 | 36.11 | +| swimming pool | 52.19 | 69.07 | +| stool | 41.12 | 51.97 | +| barrel | 47.31 | 65.2 | +| basket | 26.42 | 38.0 | +| waterfall | 59.19 | 74.97 | +| tent | 78.43 | 97.95 | +| bag | 14.26 | 16.81 | +| minibike | 71.18 | 82.62 | +| cradle | 75.74 | 93.65 | +| oven | 44.49 | 57.39 | +| ball | 46.12 | 58.52 | +| food | 52.98 | 59.98 | +| step | 15.8 | 18.91 | +| tank | 42.52 | 52.1 | +| trade name | 17.81 | 18.97 | +| microwave | 79.59 | 87.32 | +| pot | 48.57 | 56.39 | +| animal | 65.9 | 71.26 | +| bicycle | 54.73 | 76.63 | +| lake | 63.25 | 67.47 | +| dishwasher | 53.02 | 74.84 | +| screen | 53.94 | 70.37 | +| blanket | 12.1 | 15.38 | +| sculpture | 64.21 | 75.38 | +| hood | 58.25 | 63.42 | +| sconce | 36.16 | 44.16 | +| vase | 42.5 | 57.27 | +| traffic light | 32.3 | 47.78 | +| tray | 12.52 | 19.3 | +| ashcan | 40.23 | 60.38 | +| fan | 55.15 | 70.02 | +| pier | 29.25 | 37.61 | +| crt screen | 10.0 | 28.2 | +| plate | 54.36 | 71.44 | +| monitor | 17.67 | 20.25 | +| bulletin board | 15.24 | 19.91 | +| shower | 6.68 | 15.25 | +| radiator | 47.06 | 50.79 | +| glass | 15.16 | 16.47 | +| clock | 25.2 | 31.76 | +| flag | 29.21 | 33.15 | ++---------------------+-------+-------+ +2023/11/05 22:54:14 - mmengine - INFO - Iter(val) [209/209] coco/bbox_mAP: 0.4530 coco/bbox_mAP_50: 0.6260 coco/bbox_mAP_75: 0.4920 coco/bbox_mAP_s: 0.2770 coco/bbox_mAP_m: 0.5030 coco/bbox_mAP_l: 0.6050 coco/segm_mAP: 0.3060 coco/segm_mAP_50: 0.5460 coco/segm_mAP_75: 0.2980 coco/segm_mAP_s: 0.1500 coco/segm_mAP_m: 0.3540 coco/segm_mAP_l: 0.4770 Bleu_1: 0.7497 Bleu_2: 0.5840 Bleu_3: 0.4421 Bleu_4: 0.3304 METEOR: 0.2630 ROUGE_L: 0.5492 CIDEr: 1.0591 SPICE: 0.1962 aAcc: 81.7200 mIoU: 46.8400 mAcc: 58.9600 visual-grounding/miou: 0.7792 visual-grounding/acc: 0.8507 data_time: 0.0100 time: 0.5277 +2023/11/05 23:03:03 - mmengine - INFO - Iter(train) [460500/640000] base_lr: 3.8008e-05 lr: 5.2734e-06 eta: 2 days, 7:31:51 time: 1.1213 data_time: 0.0326 memory: 21518 grad_norm: 3.6864 loss: 1.2402 caption_loss_cls: 2.0737 grounding_loss_reg: 2.4854 detection_loss_cls: 0.0309 detection_loss_reg: 0.3260 semantic_segmentation_loss_cls: 0.0079 instance_segmentation_loss_cls: 0.0306 instance_segmentation_loss_reg: 0.3266 instance_segmentation_loss_poly: 0.8402 +2023/11/05 23:11:50 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231105_173749 +2023/11/05 23:11:50 - mmengine - INFO - Iter(train) [461000/640000] base_lr: 3.7821e-05 lr: 5.2564e-06 eta: 2 days, 7:17:19 time: 1.1139 data_time: 0.0322 memory: 21518 grad_norm: 3.6822 loss: 1.2298 caption_loss_cls: 2.0714 grounding_loss_reg: 2.4824 detection_loss_cls: 0.0309 detection_loss_reg: 0.3260 semantic_segmentation_loss_cls: 0.0079 instance_segmentation_loss_cls: 0.0306 instance_segmentation_loss_reg: 0.3262 instance_segmentation_loss_poly: 0.8399 +2023/11/05 23:11:50 - mmengine - INFO - Saving checkpoint at 461000 iterations +2023/11/05 23:21:11 - mmengine - INFO - Iter(train) [461500/640000] base_lr: 3.7634e-05 lr: 5.2394e-06 eta: 2 days, 7:08:45 time: 1.1084 data_time: 0.0320 memory: 21518 grad_norm: 3.6700 loss: 1.2235 caption_loss_cls: 2.0743 grounding_loss_reg: 2.4816 detection_loss_cls: 0.0308 detection_loss_reg: 0.3255 semantic_segmentation_loss_cls: 0.0079 instance_segmentation_loss_cls: 0.0306 instance_segmentation_loss_reg: 0.3257 instance_segmentation_loss_poly: 0.8388 +2023/11/05 23:30:10 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231105_173749 +2023/11/05 23:30:10 - mmengine - INFO - Iter(train) [462000/640000] base_lr: 3.7447e-05 lr: 5.2225e-06 eta: 2 days, 6:56:35 time: 1.1060 data_time: 0.0322 memory: 21518 grad_norm: 3.7156 loss: 1.2309 caption_loss_cls: 2.0763 grounding_loss_reg: 2.4800 detection_loss_cls: 0.0308 detection_loss_reg: 0.3259 semantic_segmentation_loss_cls: 0.0079 instance_segmentation_loss_cls: 0.0307 instance_segmentation_loss_reg: 0.3260 instance_segmentation_loss_poly: 0.8393 +2023/11/05 23:30:10 - mmengine - INFO - Saving checkpoint at 462000 iterations +2023/11/05 23:39:34 - mmengine - INFO - Iter(train) [462500/640000] base_lr: 3.7261e-05 lr: 5.2055e-06 eta: 2 days, 6:48:36 time: 1.1019 data_time: 0.0325 memory: 21518 grad_norm: 3.7426 loss: 1.2449 caption_loss_cls: 2.0736 grounding_loss_reg: 2.4800 detection_loss_cls: 0.0308 detection_loss_reg: 0.3256 semantic_segmentation_loss_cls: 0.0079 instance_segmentation_loss_cls: 0.0307 instance_segmentation_loss_reg: 0.3254 instance_segmentation_loss_poly: 0.8378 +2023/11/05 23:48:51 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231105_173749 +2023/11/05 23:48:51 - mmengine - INFO - Iter(train) [463000/640000] base_lr: 3.7075e-05 lr: 5.1887e-06 eta: 2 days, 6:39:31 time: 1.1055 data_time: 0.0325 memory: 21518 grad_norm: 3.7342 loss: 1.2368 caption_loss_cls: 2.0748 grounding_loss_reg: 2.4780 detection_loss_cls: 0.0307 detection_loss_reg: 0.3248 semantic_segmentation_loss_cls: 0.0079 instance_segmentation_loss_cls: 0.0307 instance_segmentation_loss_reg: 0.3261 instance_segmentation_loss_poly: 0.8391 +2023/11/05 23:48:51 - mmengine - INFO - Saving checkpoint at 463000 iterations +2023/11/05 23:57:57 - mmengine - INFO - Iter(train) [463500/640000] base_lr: 3.6890e-05 lr: 5.1718e-06 eta: 2 days, 6:28:40 time: 1.0995 data_time: 0.0320 memory: 21518 grad_norm: 3.7239 loss: 1.2157 caption_loss_cls: 2.0750 grounding_loss_reg: 2.4715 detection_loss_cls: 0.0308 detection_loss_reg: 0.3244 semantic_segmentation_loss_cls: 0.0079 instance_segmentation_loss_cls: 0.0307 instance_segmentation_loss_reg: 0.3256 instance_segmentation_loss_poly: 0.8381 +2023/11/06 00:07:09 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231105_173749 +2023/11/06 00:07:09 - mmengine - INFO - Iter(train) [464000/640000] base_lr: 3.6705e-05 lr: 5.1550e-06 eta: 2 days, 6:18:49 time: 1.0934 data_time: 0.0317 memory: 21518 grad_norm: 3.7216 loss: 1.2098 caption_loss_cls: 2.0693 grounding_loss_reg: 2.4677 detection_loss_cls: 0.0307 detection_loss_reg: 0.3247 semantic_segmentation_loss_cls: 0.0079 instance_segmentation_loss_cls: 0.0308 instance_segmentation_loss_reg: 0.3262 instance_segmentation_loss_poly: 0.8399 +2023/11/06 00:07:09 - mmengine - INFO - Saving checkpoint at 464000 iterations +2023/11/06 00:16:54 - mmengine - INFO - Iter(train) [464500/640000] base_lr: 3.6520e-05 lr: 5.1382e-06 eta: 2 days, 6:13:44 time: 1.1069 data_time: 0.0352 memory: 21518 grad_norm: 3.7211 loss: 1.2063 caption_loss_cls: 2.0704 grounding_loss_reg: 2.4650 detection_loss_cls: 0.0308 detection_loss_reg: 0.3256 semantic_segmentation_loss_cls: 0.0079 instance_segmentation_loss_cls: 0.0309 instance_segmentation_loss_reg: 0.3266 instance_segmentation_loss_poly: 0.8403 +2023/11/06 00:26:05 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231105_173749 +2023/11/06 00:26:05 - mmengine - INFO - Iter(train) [465000/640000] base_lr: 3.6336e-05 lr: 5.1215e-06 eta: 2 days, 6:03:41 time: 1.1128 data_time: 0.0354 memory: 21518 grad_norm: 3.6956 loss: 1.2054 caption_loss_cls: 2.0694 grounding_loss_reg: 2.4655 detection_loss_cls: 0.0307 detection_loss_reg: 0.3250 semantic_segmentation_loss_cls: 0.0079 instance_segmentation_loss_cls: 0.0307 instance_segmentation_loss_reg: 0.3255 instance_segmentation_loss_poly: 0.8382 +2023/11/06 00:26:05 - mmengine - INFO - Saving checkpoint at 465000 iterations +2023/11/06 00:35:01 - mmengine - INFO - Iter(train) [465500/640000] base_lr: 3.6152e-05 lr: 5.1048e-06 eta: 2 days, 5:51:38 time: 1.1067 data_time: 0.0354 memory: 21518 grad_norm: 3.7826 loss: 1.2191 caption_loss_cls: 2.0718 grounding_loss_reg: 2.4666 detection_loss_cls: 0.0307 detection_loss_reg: 0.3258 semantic_segmentation_loss_cls: 0.0079 instance_segmentation_loss_cls: 0.0308 instance_segmentation_loss_reg: 0.3268 instance_segmentation_loss_poly: 0.8394 +2023/11/06 00:44:25 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231105_173749 +2023/11/06 00:44:25 - mmengine - INFO - Iter(train) [466000/640000] base_lr: 3.5969e-05 lr: 5.0881e-06 eta: 2 days, 5:43:24 time: 1.1129 data_time: 0.0359 memory: 21518 grad_norm: 3.7354 loss: 1.2149 caption_loss_cls: 2.0704 grounding_loss_reg: 2.4656 detection_loss_cls: 0.0308 detection_loss_reg: 0.3265 semantic_segmentation_loss_cls: 0.0079 instance_segmentation_loss_cls: 0.0309 instance_segmentation_loss_reg: 0.3282 instance_segmentation_loss_poly: 0.8411 +2023/11/06 00:44:25 - mmengine - INFO - Saving checkpoint at 466000 iterations +2023/11/06 00:53:54 - mmengine - INFO - Iter(train) [466500/640000] base_lr: 3.5786e-05 lr: 5.0715e-06 eta: 2 days, 5:35:50 time: 1.1142 data_time: 0.0359 memory: 21518 grad_norm: 3.7824 loss: 1.2155 caption_loss_cls: 2.0682 grounding_loss_reg: 2.4654 detection_loss_cls: 0.0308 detection_loss_reg: 0.3274 semantic_segmentation_loss_cls: 0.0079 instance_segmentation_loss_cls: 0.0311 instance_segmentation_loss_reg: 0.3286 instance_segmentation_loss_poly: 0.8414 +2023/11/06 01:03:44 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231105_173749 +2023/11/06 01:03:44 - mmengine - INFO - Iter(train) [467000/640000] base_lr: 3.5603e-05 lr: 5.0549e-06 eta: 2 days, 5:30:43 time: 1.1223 data_time: 0.0360 memory: 21518 grad_norm: 3.7500 loss: 1.2137 caption_loss_cls: 2.0674 grounding_loss_reg: 2.4648 detection_loss_cls: 0.0307 detection_loss_reg: 0.3276 semantic_segmentation_loss_cls: 0.0079 instance_segmentation_loss_cls: 0.0311 instance_segmentation_loss_reg: 0.3290 instance_segmentation_loss_poly: 0.8418 +2023/11/06 01:03:44 - mmengine - INFO - Saving checkpoint at 467000 iterations +2023/11/06 01:13:28 - mmengine - INFO - Iter(train) [467500/640000] base_lr: 3.5421e-05 lr: 5.0383e-06 eta: 2 days, 5:24:45 time: 1.1319 data_time: 0.0379 memory: 21518 grad_norm: 3.7356 loss: 1.2270 caption_loss_cls: 2.0675 grounding_loss_reg: 2.4660 detection_loss_cls: 0.0308 detection_loss_reg: 0.3281 semantic_segmentation_loss_cls: 0.0079 instance_segmentation_loss_cls: 0.0312 instance_segmentation_loss_reg: 0.3296 instance_segmentation_loss_poly: 0.8421 +2023/11/06 01:22:27 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231105_173749 +2023/11/06 01:22:27 - mmengine - INFO - Iter(train) [468000/640000] base_lr: 3.5239e-05 lr: 5.0218e-06 eta: 2 days, 5:13:11 time: 1.1286 data_time: 0.0380 memory: 21518 grad_norm: 3.7653 loss: 1.2382 caption_loss_cls: 2.0672 grounding_loss_reg: 2.4636 detection_loss_cls: 0.0309 detection_loss_reg: 0.3292 semantic_segmentation_loss_cls: 0.0079 instance_segmentation_loss_cls: 0.0312 instance_segmentation_loss_reg: 0.3295 instance_segmentation_loss_poly: 0.8421 +2023/11/06 01:22:27 - mmengine - INFO - Saving checkpoint at 468000 iterations +2023/11/06 01:32:20 - mmengine - INFO - Iter(train) [468500/640000] base_lr: 3.5058e-05 lr: 5.0053e-06 eta: 2 days, 5:08:06 time: 1.1307 data_time: 0.0379 memory: 21518 grad_norm: 3.6801 loss: 1.2295 caption_loss_cls: 2.0700 grounding_loss_reg: 2.4636 detection_loss_cls: 0.0309 detection_loss_reg: 0.3287 semantic_segmentation_loss_cls: 0.0079 instance_segmentation_loss_cls: 0.0312 instance_segmentation_loss_reg: 0.3298 instance_segmentation_loss_poly: 0.8422 +2023/11/06 01:42:13 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231105_173749 +2023/11/06 01:42:13 - mmengine - INFO - Iter(train) [469000/640000] base_lr: 3.4877e-05 lr: 4.9888e-06 eta: 2 days, 5:02:46 time: 1.1411 data_time: 0.0385 memory: 21518 grad_norm: 3.6672 loss: 1.2222 caption_loss_cls: 2.0703 grounding_loss_reg: 2.4614 detection_loss_cls: 0.0309 detection_loss_reg: 0.3291 semantic_segmentation_loss_cls: 0.0079 instance_segmentation_loss_cls: 0.0312 instance_segmentation_loss_reg: 0.3301 instance_segmentation_loss_poly: 0.8429 +2023/11/06 01:42:13 - mmengine - INFO - Saving checkpoint at 469000 iterations +2023/11/06 01:51:42 - mmengine - INFO - Iter(train) [469500/640000] base_lr: 3.4696e-05 lr: 4.9724e-06 eta: 2 days, 4:54:34 time: 1.1494 data_time: 0.0387 memory: 21518 grad_norm: 3.6320 loss: 1.2106 caption_loss_cls: 2.0702 grounding_loss_reg: 2.4593 detection_loss_cls: 0.0308 detection_loss_reg: 0.3287 semantic_segmentation_loss_cls: 0.0079 instance_segmentation_loss_cls: 0.0312 instance_segmentation_loss_reg: 0.3296 instance_segmentation_loss_poly: 0.8423 +2023/11/06 02:01:21 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231105_173749 +2023/11/06 02:01:21 - mmengine - INFO - Iter(train) [470000/640000] base_lr: 3.4516e-05 lr: 4.9560e-06 eta: 2 days, 4:47:32 time: 1.1534 data_time: 0.0386 memory: 21518 grad_norm: 3.5965 loss: 1.2006 caption_loss_cls: 2.0686 grounding_loss_reg: 2.4583 detection_loss_cls: 0.0309 detection_loss_reg: 0.3289 semantic_segmentation_loss_cls: 0.0079 instance_segmentation_loss_cls: 0.0311 instance_segmentation_loss_reg: 0.3296 instance_segmentation_loss_poly: 0.8426 +2023/11/06 02:01:21 - mmengine - INFO - Saving checkpoint at 470000 iterations +2023/11/06 02:10:39 - mmengine - INFO - Iter(train) [470500/640000] base_lr: 3.4336e-05 lr: 4.9397e-06 eta: 2 days, 4:38:01 time: 1.1504 data_time: 0.0384 memory: 21518 grad_norm: 3.5210 loss: 1.1940 caption_loss_cls: 2.0663 grounding_loss_reg: 2.4565 detection_loss_cls: 0.0309 detection_loss_reg: 0.3288 semantic_segmentation_loss_cls: 0.0079 instance_segmentation_loss_cls: 0.0311 instance_segmentation_loss_reg: 0.3293 instance_segmentation_loss_poly: 0.8430 +2023/11/06 02:19:54 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231105_173749 +2023/11/06 02:19:54 - mmengine - INFO - Iter(train) [471000/640000] base_lr: 3.4157e-05 lr: 4.9233e-06 eta: 2 days, 4:28:17 time: 1.1418 data_time: 0.0383 memory: 21518 grad_norm: 3.5779 loss: 1.1975 caption_loss_cls: 2.0679 grounding_loss_reg: 2.4525 detection_loss_cls: 0.0308 detection_loss_reg: 0.3281 semantic_segmentation_loss_cls: 0.0079 instance_segmentation_loss_cls: 0.0311 instance_segmentation_loss_reg: 0.3288 instance_segmentation_loss_poly: 0.8415 +2023/11/06 02:19:54 - mmengine - INFO - Saving checkpoint at 471000 iterations +2023/11/06 02:29:22 - mmengine - INFO - Iter(train) [471500/640000] base_lr: 3.3978e-05 lr: 4.9071e-06 eta: 2 days, 4:19:49 time: 1.1377 data_time: 0.0366 memory: 21518 grad_norm: 3.5796 loss: 1.1885 caption_loss_cls: 2.0698 grounding_loss_reg: 2.4508 detection_loss_cls: 0.0307 detection_loss_reg: 0.3281 semantic_segmentation_loss_cls: 0.0079 instance_segmentation_loss_cls: 0.0311 instance_segmentation_loss_reg: 0.3294 instance_segmentation_loss_poly: 0.8428 +2023/11/06 02:38:47 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231105_173749 +2023/11/06 02:38:47 - mmengine - INFO - Iter(train) [472000/640000] base_lr: 3.3799e-05 lr: 4.8908e-06 eta: 2 days, 4:11:01 time: 1.1442 data_time: 0.0367 memory: 21518 grad_norm: 3.5486 loss: 1.1797 caption_loss_cls: 2.0686 grounding_loss_reg: 2.4502 detection_loss_cls: 0.0308 detection_loss_reg: 0.3289 semantic_segmentation_loss_cls: 0.0079 instance_segmentation_loss_cls: 0.0312 instance_segmentation_loss_reg: 0.3298 instance_segmentation_loss_poly: 0.8434 +2023/11/06 02:38:47 - mmengine - INFO - Saving checkpoint at 472000 iterations +2023/11/06 02:48:05 - mmengine - INFO - Iter(train) [472500/640000] base_lr: 3.3621e-05 lr: 4.8746e-06 eta: 2 days, 4:01:38 time: 1.1355 data_time: 0.0364 memory: 21518 grad_norm: 3.6212 loss: 1.1811 caption_loss_cls: 2.0661 grounding_loss_reg: 2.4481 detection_loss_cls: 0.0307 detection_loss_reg: 0.3282 semantic_segmentation_loss_cls: 0.0078 instance_segmentation_loss_cls: 0.0312 instance_segmentation_loss_reg: 0.3297 instance_segmentation_loss_poly: 0.8435 +2023/11/06 02:56:43 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231105_173749 +2023/11/06 02:56:43 - mmengine - INFO - Iter(train) [473000/640000] base_lr: 3.3443e-05 lr: 4.8585e-06 eta: 2 days, 3:48:16 time: 1.1166 data_time: 0.0358 memory: 21518 grad_norm: 3.7032 loss: 1.2036 caption_loss_cls: 2.0635 grounding_loss_reg: 2.4475 detection_loss_cls: 0.0307 detection_loss_reg: 0.3291 semantic_segmentation_loss_cls: 0.0079 instance_segmentation_loss_cls: 0.0313 instance_segmentation_loss_reg: 0.3309 instance_segmentation_loss_poly: 0.8457 +2023/11/06 02:56:43 - mmengine - INFO - Saving checkpoint at 473000 iterations +2023/11/06 03:06:08 - mmengine - INFO - Iter(train) [473500/640000] base_lr: 3.3266e-05 lr: 4.8423e-06 eta: 2 days, 3:39:33 time: 1.1157 data_time: 0.0358 memory: 21518 grad_norm: 3.7323 loss: 1.2075 caption_loss_cls: 2.0601 grounding_loss_reg: 2.4448 detection_loss_cls: 0.0308 detection_loss_reg: 0.3303 semantic_segmentation_loss_cls: 0.0078 instance_segmentation_loss_cls: 0.0314 instance_segmentation_loss_reg: 0.3312 instance_segmentation_loss_poly: 0.8466 +2023/11/06 03:15:10 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231105_173749 +2023/11/06 03:15:10 - mmengine - INFO - Iter(train) [474000/640000] base_lr: 3.3089e-05 lr: 4.8262e-06 eta: 2 days, 3:28:41 time: 1.1062 data_time: 0.0356 memory: 21518 grad_norm: 3.8054 loss: 1.2198 caption_loss_cls: 2.0617 grounding_loss_reg: 2.4437 detection_loss_cls: 0.0308 detection_loss_reg: 0.3305 semantic_segmentation_loss_cls: 0.0078 instance_segmentation_loss_cls: 0.0313 instance_segmentation_loss_reg: 0.3310 instance_segmentation_loss_poly: 0.8450 +2023/11/06 03:15:10 - mmengine - INFO - Saving checkpoint at 474000 iterations +2023/11/06 03:24:41 - mmengine - INFO - Iter(train) [474500/640000] base_lr: 3.2912e-05 lr: 4.8102e-06 eta: 2 days, 3:20:29 time: 1.1096 data_time: 0.0357 memory: 21518 grad_norm: 3.8281 loss: 1.2220 caption_loss_cls: 2.0590 grounding_loss_reg: 2.4400 detection_loss_cls: 0.0308 detection_loss_reg: 0.3306 semantic_segmentation_loss_cls: 0.0078 instance_segmentation_loss_cls: 0.0313 instance_segmentation_loss_reg: 0.3305 instance_segmentation_loss_poly: 0.8435 +2023/11/06 03:34:21 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231105_173749 +2023/11/06 03:34:21 - mmengine - INFO - Iter(train) [475000/640000] base_lr: 3.2736e-05 lr: 4.7942e-06 eta: 2 days, 3:13:07 time: 1.1159 data_time: 0.0364 memory: 21518 grad_norm: 3.7992 loss: 1.2225 caption_loss_cls: 2.0615 grounding_loss_reg: 2.4380 detection_loss_cls: 0.0307 detection_loss_reg: 0.3301 semantic_segmentation_loss_cls: 0.0078 instance_segmentation_loss_cls: 0.0313 instance_segmentation_loss_reg: 0.3296 instance_segmentation_loss_poly: 0.8421 +2023/11/06 03:34:21 - mmengine - INFO - Saving checkpoint at 475000 iterations +2023/11/06 03:43:43 - mmengine - INFO - Iter(train) [475500/640000] base_lr: 3.2560e-05 lr: 4.7782e-06 eta: 2 days, 3:04:00 time: 1.1143 data_time: 0.0362 memory: 21518 grad_norm: 3.7627 loss: 1.2072 caption_loss_cls: 2.0596 grounding_loss_reg: 2.4381 detection_loss_cls: 0.0307 detection_loss_reg: 0.3294 semantic_segmentation_loss_cls: 0.0078 instance_segmentation_loss_cls: 0.0312 instance_segmentation_loss_reg: 0.3290 instance_segmentation_loss_poly: 0.8410 +2023/11/06 03:52:58 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231105_173749 +2023/11/06 03:52:58 - mmengine - INFO - Iter(train) [476000/640000] base_lr: 3.2385e-05 lr: 4.7622e-06 eta: 2 days, 2:54:21 time: 1.1120 data_time: 0.0362 memory: 21518 grad_norm: 3.7851 loss: 1.2093 caption_loss_cls: 2.0586 grounding_loss_reg: 2.4361 detection_loss_cls: 0.0306 detection_loss_reg: 0.3287 semantic_segmentation_loss_cls: 0.0077 instance_segmentation_loss_cls: 0.0311 instance_segmentation_loss_reg: 0.3289 instance_segmentation_loss_poly: 0.8405 +2023/11/06 03:52:58 - mmengine - INFO - Saving checkpoint at 476000 iterations +2023/11/06 04:02:41 - mmengine - INFO - Iter(train) [476500/640000] base_lr: 3.2210e-05 lr: 4.7463e-06 eta: 2 days, 2:47:00 time: 1.1180 data_time: 0.0363 memory: 21518 grad_norm: 3.7397 loss: 1.2045 caption_loss_cls: 2.0550 grounding_loss_reg: 2.4357 detection_loss_cls: 0.0305 detection_loss_reg: 0.3282 semantic_segmentation_loss_cls: 0.0078 instance_segmentation_loss_cls: 0.0310 instance_segmentation_loss_reg: 0.3284 instance_segmentation_loss_poly: 0.8391 +2023/11/06 04:11:48 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231105_173749 +2023/11/06 04:11:48 - mmengine - INFO - Iter(train) [477000/640000] base_lr: 3.2035e-05 lr: 4.7305e-06 eta: 2 days, 2:36:42 time: 1.1255 data_time: 0.0362 memory: 21518 grad_norm: 3.6994 loss: 1.1827 caption_loss_cls: 2.0523 grounding_loss_reg: 2.4361 detection_loss_cls: 0.0304 detection_loss_reg: 0.3268 semantic_segmentation_loss_cls: 0.0077 instance_segmentation_loss_cls: 0.0308 instance_segmentation_loss_reg: 0.3266 instance_segmentation_loss_poly: 0.8359 +2023/11/06 04:11:48 - mmengine - INFO - Saving checkpoint at 477000 iterations +2023/11/06 04:20:53 - mmengine - INFO - Iter(train) [477500/640000] base_lr: 3.1861e-05 lr: 4.7146e-06 eta: 2 days, 2:26:13 time: 1.1205 data_time: 0.0361 memory: 21518 grad_norm: 3.7146 loss: 1.1821 caption_loss_cls: 2.0504 grounding_loss_reg: 2.4328 detection_loss_cls: 0.0302 detection_loss_reg: 0.3251 semantic_segmentation_loss_cls: 0.0077 instance_segmentation_loss_cls: 0.0307 instance_segmentation_loss_reg: 0.3257 instance_segmentation_loss_poly: 0.8330 +2023/11/06 04:30:14 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231105_173749 +2023/11/06 04:30:14 - mmengine - INFO - Iter(train) [478000/640000] base_lr: 3.1687e-05 lr: 4.6989e-06 eta: 2 days, 2:17:04 time: 1.1252 data_time: 0.0361 memory: 21518 grad_norm: 3.6962 loss: 1.1722 caption_loss_cls: 2.0483 grounding_loss_reg: 2.4330 detection_loss_cls: 0.0302 detection_loss_reg: 0.3246 semantic_segmentation_loss_cls: 0.0077 instance_segmentation_loss_cls: 0.0306 instance_segmentation_loss_reg: 0.3251 instance_segmentation_loss_poly: 0.8319 +2023/11/06 04:30:14 - mmengine - INFO - Saving checkpoint at 478000 iterations +2023/11/06 04:39:49 - mmengine - INFO - Iter(train) [478500/640000] base_lr: 3.1514e-05 lr: 4.6831e-06 eta: 2 days, 2:08:57 time: 1.1261 data_time: 0.0364 memory: 21518 grad_norm: 3.7090 loss: 1.1822 caption_loss_cls: 2.0484 grounding_loss_reg: 2.4332 detection_loss_cls: 0.0301 detection_loss_reg: 0.3244 semantic_segmentation_loss_cls: 0.0077 instance_segmentation_loss_cls: 0.0307 instance_segmentation_loss_reg: 0.3253 instance_segmentation_loss_poly: 0.8327 +2023/11/06 04:48:54 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231105_173749 +2023/11/06 04:48:54 - mmengine - INFO - Iter(train) [479000/640000] base_lr: 3.1341e-05 lr: 4.6674e-06 eta: 2 days, 1:58:34 time: 1.1174 data_time: 0.0358 memory: 21518 grad_norm: 3.7153 loss: 1.1836 caption_loss_cls: 2.0507 grounding_loss_reg: 2.4321 detection_loss_cls: 0.0301 detection_loss_reg: 0.3244 semantic_segmentation_loss_cls: 0.0077 instance_segmentation_loss_cls: 0.0306 instance_segmentation_loss_reg: 0.3244 instance_segmentation_loss_poly: 0.8307 +2023/11/06 04:48:54 - mmengine - INFO - Saving checkpoint at 479000 iterations +2023/11/06 04:58:09 - mmengine - INFO - Iter(train) [479500/640000] base_lr: 3.1169e-05 lr: 4.6517e-06 eta: 2 days, 1:48:56 time: 1.1157 data_time: 0.0357 memory: 21518 grad_norm: 3.7566 loss: 1.1946 caption_loss_cls: 2.0484 grounding_loss_reg: 2.4303 detection_loss_cls: 0.0301 detection_loss_reg: 0.3241 semantic_segmentation_loss_cls: 0.0077 instance_segmentation_loss_cls: 0.0307 instance_segmentation_loss_reg: 0.3247 instance_segmentation_loss_poly: 0.8302 +2023/11/06 05:07:18 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231105_173749 +2023/11/06 05:07:18 - mmengine - INFO - Iter(train) [480000/640000] base_lr: 3.0997e-05 lr: 4.6361e-06 eta: 2 days, 1:38:52 time: 1.1141 data_time: 0.0357 memory: 21518 grad_norm: 3.7441 loss: 1.1857 caption_loss_cls: 2.0413 grounding_loss_reg: 2.4285 detection_loss_cls: 0.0301 detection_loss_reg: 0.3240 semantic_segmentation_loss_cls: 0.0077 instance_segmentation_loss_cls: 0.0307 instance_segmentation_loss_reg: 0.3253 instance_segmentation_loss_poly: 0.8313 +2023/11/06 05:07:18 - mmengine - INFO - Saving checkpoint at 480000 iterations +2023/11/06 05:16:10 - mmengine - INFO - Evaluating bbox... +2023/11/06 05:17:07 - mmengine - INFO - bbox_mAP_copypaste: 0.457 0.631 0.496 0.281 0.508 0.605 +2023/11/06 05:17:07 - mmengine - INFO - Evaluating segm... +2023/11/06 05:18:19 - mmengine - INFO - segm_mAP_copypaste: 0.308 0.549 0.300 0.154 0.352 0.477 +2023/11/06 05:23:10 - mmengine - INFO - per class results: +2023/11/06 05:23:10 - mmengine - INFO - ++---------------------+-------+-------+ +| Class | IoU | Acc | ++---------------------+-------+-------+ +| wall | 76.19 | 87.96 | +| building | 80.18 | 90.5 | +| sky | 92.94 | 97.48 | +| floor | 80.08 | 88.75 | +| tree | 73.24 | 86.62 | +| ceiling | 83.09 | 93.95 | +| road | 82.51 | 88.35 | +| bed | 86.38 | 95.04 | +| windowpane | 60.52 | 76.04 | +| grass | 62.86 | 79.22 | +| cabinet | 58.69 | 68.89 | +| sidewalk | 66.0 | 84.57 | +| person | 78.84 | 92.14 | +| earth | 36.04 | 48.49 | +| door | 49.46 | 65.51 | +| table | 58.75 | 77.38 | +| mountain | 52.07 | 65.06 | +| plant | 47.81 | 57.42 | +| curtain | 67.94 | 83.29 | +| chair | 56.31 | 71.21 | +| car | 80.55 | 90.19 | +| water | 50.91 | 61.77 | +| painting | 68.76 | 87.49 | +| sofa | 65.49 | 80.84 | +| shelf | 41.93 | 63.58 | +| house | 38.97 | 58.95 | +| sea | 54.45 | 86.65 | +| mirror | 63.65 | 73.26 | +| rug | 65.47 | 74.64 | +| field | 28.67 | 48.8 | +| armchair | 43.2 | 58.7 | +| seat | 60.65 | 81.77 | +| fence | 38.76 | 55.91 | +| desk | 44.42 | 62.8 | +| rock | 40.63 | 63.96 | +| wardrobe | 43.76 | 63.12 | +| lamp | 59.06 | 73.96 | +| bathtub | 78.28 | 84.87 | +| railing | 29.2 | 47.43 | +| cushion | 56.06 | 65.51 | +| base | 25.05 | 35.26 | +| box | 26.8 | 35.94 | +| column | 46.54 | 61.66 | +| signboard | 36.2 | 48.99 | +| chest of drawers | 37.71 | 60.93 | +| counter | 25.68 | 33.81 | +| sand | 33.96 | 49.86 | +| sink | 71.16 | 78.14 | +| skyscraper | 44.11 | 53.06 | +| fireplace | 72.86 | 88.64 | +| refrigerator | 76.4 | 84.57 | +| grandstand | 42.53 | 68.11 | +| path | 27.42 | 34.55 | +| stairs | 27.96 | 35.22 | +| runway | 69.15 | 84.78 | +| case | 41.4 | 45.36 | +| pool table | 85.72 | 96.04 | +| pillow | 54.54 | 68.84 | +| screen door | 66.77 | 72.49 | +| stairway | 29.73 | 40.97 | +| river | 17.67 | 27.39 | +| bridge | 53.26 | 63.24 | +| bookcase | 34.37 | 57.41 | +| blind | 24.23 | 26.55 | +| coffee table | 64.23 | 78.29 | +| toilet | 84.08 | 88.84 | +| flower | 28.16 | 62.39 | +| book | 46.28 | 64.77 | +| hill | 8.87 | 16.07 | +| bench | 43.06 | 49.35 | +| countertop | 51.52 | 62.89 | +| stove | 73.93 | 86.58 | +| palm | 44.52 | 58.31 | +| kitchen island | 39.12 | 68.09 | +| computer | 69.69 | 84.28 | +| swivel chair | 44.55 | 62.27 | +| boat | 73.45 | 84.69 | +| bar | 27.57 | 39.09 | +| arcade machine | 42.25 | 45.44 | +| hovel | 7.58 | 10.28 | +| bus | 87.47 | 95.13 | +| towel | 61.2 | 68.82 | +| light | 46.28 | 54.15 | +| truck | 34.19 | 54.77 | +| tower | 41.4 | 50.34 | +| chandelier | 61.8 | 73.88 | +| awning | 23.14 | 26.6 | +| streetlight | 25.5 | 34.0 | +| booth | 48.13 | 49.14 | +| television receiver | 67.1 | 81.38 | +| airplane | 56.46 | 66.81 | +| dirt track | 0.79 | 1.91 | +| apparel | 32.02 | 47.36 | +| pole | 29.18 | 37.88 | +| land | 2.34 | 2.96 | +| bannister | 10.4 | 13.5 | +| escalator | 28.71 | 34.93 | +| ottoman | 46.91 | 64.0 | +| bottle | 28.19 | 36.01 | +| buffet | 43.48 | 47.18 | +| poster | 24.84 | 33.32 | +| stage | 12.0 | 25.32 | +| van | 44.53 | 63.86 | +| ship | 45.84 | 47.01 | +| fountain | 14.74 | 14.99 | +| conveyer belt | 76.29 | 88.62 | +| canopy | 24.39 | 32.49 | +| washer | 67.43 | 69.8 | +| plaything | 29.34 | 44.52 | +| swimming pool | 52.58 | 65.65 | +| stool | 41.32 | 54.14 | +| barrel | 21.79 | 24.45 | +| basket | 27.55 | 38.09 | +| waterfall | 52.92 | 62.78 | +| tent | 88.95 | 97.09 | +| bag | 10.72 | 12.35 | +| minibike | 72.07 | 81.48 | +| cradle | 72.9 | 91.16 | +| oven | 38.69 | 49.1 | +| ball | 49.11 | 60.29 | +| food | 52.34 | 58.97 | +| step | 11.94 | 14.84 | +| tank | 46.84 | 53.49 | +| trade name | 24.63 | 29.52 | +| microwave | 81.22 | 88.83 | +| pot | 45.86 | 51.07 | +| animal | 60.71 | 64.65 | +| bicycle | 55.33 | 74.39 | +| lake | 53.43 | 64.44 | +| dishwasher | 54.63 | 73.33 | +| screen | 64.08 | 86.79 | +| blanket | 8.37 | 10.06 | +| sculpture | 52.39 | 62.68 | +| hood | 59.04 | 64.83 | +| sconce | 36.73 | 46.71 | +| vase | 40.62 | 52.45 | +| traffic light | 34.94 | 56.78 | +| tray | 11.64 | 19.94 | +| ashcan | 40.62 | 60.04 | +| fan | 55.36 | 72.41 | +| pier | 39.87 | 49.24 | +| crt screen | 6.31 | 13.91 | +| plate | 54.57 | 69.34 | +| monitor | 20.17 | 25.77 | +| bulletin board | 34.59 | 43.71 | +| shower | 1.79 | 4.69 | +| radiator | 51.71 | 59.1 | +| glass | 16.0 | 17.54 | +| clock | 27.36 | 32.12 | +| flag | 27.97 | 31.49 | ++---------------------+-------+-------+ +2023/11/06 05:23:29 - mmengine - INFO - Iter(val) [209/209] coco/bbox_mAP: 0.4570 coco/bbox_mAP_50: 0.6310 coco/bbox_mAP_75: 0.4960 coco/bbox_mAP_s: 0.2810 coco/bbox_mAP_m: 0.5080 coco/bbox_mAP_l: 0.6050 coco/segm_mAP: 0.3080 coco/segm_mAP_50: 0.5490 coco/segm_mAP_75: 0.3000 coco/segm_mAP_s: 0.1540 coco/segm_mAP_m: 0.3520 coco/segm_mAP_l: 0.4770 Bleu_1: 0.7448 Bleu_2: 0.5806 Bleu_3: 0.4417 Bleu_4: 0.3347 METEOR: 0.2659 ROUGE_L: 0.5485 CIDEr: 1.0662 SPICE: 0.1976 aAcc: 81.7800 mIoU: 46.9100 mAcc: 58.3100 visual-grounding/miou: 0.7824 visual-grounding/acc: 0.8523 data_time: 0.0211 time: 0.5469 +2023/11/06 05:32:59 - mmengine - INFO - Iter(train) [480500/640000] base_lr: 3.0825e-05 lr: 4.6205e-06 eta: 2 days, 1:30:27 time: 1.1113 data_time: 0.0329 memory: 21518 grad_norm: 3.7875 loss: 1.2018 caption_loss_cls: 2.0407 grounding_loss_reg: 2.4269 detection_loss_cls: 0.0301 detection_loss_reg: 0.3245 semantic_segmentation_loss_cls: 0.0077 instance_segmentation_loss_cls: 0.0307 instance_segmentation_loss_reg: 0.3254 instance_segmentation_loss_poly: 0.8311 +2023/11/06 05:42:35 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231105_173749 +2023/11/06 05:42:35 - mmengine - INFO - Iter(train) [481000/640000] base_lr: 3.0654e-05 lr: 4.6049e-06 eta: 2 days, 1:22:22 time: 1.1185 data_time: 0.0334 memory: 21518 grad_norm: 3.8097 loss: 1.2171 caption_loss_cls: 2.0421 grounding_loss_reg: 2.4295 detection_loss_cls: 0.0301 detection_loss_reg: 0.3252 semantic_segmentation_loss_cls: 0.0077 instance_segmentation_loss_cls: 0.0306 instance_segmentation_loss_reg: 0.3254 instance_segmentation_loss_poly: 0.8316 +2023/11/06 05:42:35 - mmengine - INFO - Saving checkpoint at 481000 iterations +2023/11/06 05:51:19 - mmengine - INFO - Iter(train) [481500/640000] base_lr: 3.0483e-05 lr: 4.5894e-06 eta: 2 days, 1:10:35 time: 1.1133 data_time: 0.0332 memory: 21518 grad_norm: 3.8184 loss: 1.2257 caption_loss_cls: 2.0376 grounding_loss_reg: 2.4303 detection_loss_cls: 0.0302 detection_loss_reg: 0.3258 semantic_segmentation_loss_cls: 0.0077 instance_segmentation_loss_cls: 0.0306 instance_segmentation_loss_reg: 0.3259 instance_segmentation_loss_poly: 0.8322 +2023/11/06 06:00:54 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231105_173749 +2023/11/06 06:00:54 - mmengine - INFO - Iter(train) [482000/640000] base_lr: 3.0313e-05 lr: 4.5739e-06 eta: 2 days, 1:02:23 time: 1.1168 data_time: 0.0335 memory: 21518 grad_norm: 3.7954 loss: 1.2299 caption_loss_cls: 2.0345 grounding_loss_reg: 2.4254 detection_loss_cls: 0.0301 detection_loss_reg: 0.3262 semantic_segmentation_loss_cls: 0.0077 instance_segmentation_loss_cls: 0.0306 instance_segmentation_loss_reg: 0.3260 instance_segmentation_loss_poly: 0.8326 +2023/11/06 06:00:54 - mmengine - INFO - Saving checkpoint at 482000 iterations +2023/11/06 06:11:07 - mmengine - INFO - Iter(train) [482500/640000] base_lr: 3.0143e-05 lr: 4.5585e-06 eta: 2 days, 0:56:45 time: 1.1264 data_time: 0.0336 memory: 21518 grad_norm: 3.7754 loss: 1.2165 caption_loss_cls: 2.0310 grounding_loss_reg: 2.4246 detection_loss_cls: 0.0300 detection_loss_reg: 0.3253 semantic_segmentation_loss_cls: 0.0077 instance_segmentation_loss_cls: 0.0305 instance_segmentation_loss_reg: 0.3260 instance_segmentation_loss_poly: 0.8332 +2023/11/06 06:20:13 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231105_173749 +2023/11/06 06:20:13 - mmengine - INFO - Iter(train) [483000/640000] base_lr: 2.9974e-05 lr: 4.5430e-06 eta: 2 days, 0:46:29 time: 1.1265 data_time: 0.0336 memory: 21518 grad_norm: 3.7912 loss: 1.2176 caption_loss_cls: 2.0310 grounding_loss_reg: 2.4253 detection_loss_cls: 0.0302 detection_loss_reg: 0.3266 semantic_segmentation_loss_cls: 0.0077 instance_segmentation_loss_cls: 0.0306 instance_segmentation_loss_reg: 0.3270 instance_segmentation_loss_poly: 0.8345 +2023/11/06 06:20:13 - mmengine - INFO - Saving checkpoint at 483000 iterations +2023/11/06 06:29:36 - mmengine - INFO - Iter(train) [483500/640000] base_lr: 2.9804e-05 lr: 4.5277e-06 eta: 2 days, 0:37:24 time: 1.1285 data_time: 0.0339 memory: 21518 grad_norm: 3.7926 loss: 1.2220 caption_loss_cls: 2.0305 grounding_loss_reg: 2.4258 detection_loss_cls: 0.0301 detection_loss_reg: 0.3267 semantic_segmentation_loss_cls: 0.0077 instance_segmentation_loss_cls: 0.0305 instance_segmentation_loss_reg: 0.3269 instance_segmentation_loss_poly: 0.8342 +2023/11/06 06:38:44 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231105_173749 +2023/11/06 06:38:44 - mmengine - INFO - Iter(train) [484000/640000] base_lr: 2.9636e-05 lr: 4.5123e-06 eta: 2 days, 0:27:20 time: 1.1284 data_time: 0.0337 memory: 21518 grad_norm: 3.8135 loss: 1.2243 caption_loss_cls: 2.0287 grounding_loss_reg: 2.4234 detection_loss_cls: 0.0301 detection_loss_reg: 0.3278 semantic_segmentation_loss_cls: 0.0077 instance_segmentation_loss_cls: 0.0305 instance_segmentation_loss_reg: 0.3271 instance_segmentation_loss_poly: 0.8349 +2023/11/06 06:38:44 - mmengine - INFO - Saving checkpoint at 484000 iterations +2023/11/06 06:47:34 - mmengine - INFO - Iter(train) [484500/640000] base_lr: 2.9468e-05 lr: 4.4971e-06 eta: 2 days, 0:16:07 time: 1.1180 data_time: 0.0363 memory: 21518 grad_norm: 3.8225 loss: 1.2146 caption_loss_cls: 2.0263 grounding_loss_reg: 2.4214 detection_loss_cls: 0.0301 detection_loss_reg: 0.3280 semantic_segmentation_loss_cls: 0.0077 instance_segmentation_loss_cls: 0.0305 instance_segmentation_loss_reg: 0.3271 instance_segmentation_loss_poly: 0.8351 +2023/11/06 06:56:38 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231105_173749 +2023/11/06 06:56:38 - mmengine - INFO - Iter(train) [485000/640000] base_lr: 2.9300e-05 lr: 4.4818e-06 eta: 2 days, 0:05:50 time: 1.1099 data_time: 0.0360 memory: 21518 grad_norm: 3.7833 loss: 1.2105 caption_loss_cls: 2.0263 grounding_loss_reg: 2.4196 detection_loss_cls: 0.0300 detection_loss_reg: 0.3280 semantic_segmentation_loss_cls: 0.0077 instance_segmentation_loss_cls: 0.0305 instance_segmentation_loss_reg: 0.3267 instance_segmentation_loss_poly: 0.8350 +2023/11/06 06:56:38 - mmengine - INFO - Saving checkpoint at 485000 iterations +2023/11/06 07:05:42 - mmengine - INFO - Iter(train) [485500/640000] base_lr: 2.9133e-05 lr: 4.4666e-06 eta: 1 day, 23:55:36 time: 1.1149 data_time: 0.0359 memory: 21518 grad_norm: 3.7649 loss: 1.1989 caption_loss_cls: 2.0245 grounding_loss_reg: 2.4186 detection_loss_cls: 0.0301 detection_loss_reg: 0.3282 semantic_segmentation_loss_cls: 0.0077 instance_segmentation_loss_cls: 0.0304 instance_segmentation_loss_reg: 0.3252 instance_segmentation_loss_poly: 0.8328 +2023/11/06 07:14:42 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231105_173749 +2023/11/06 07:14:42 - mmengine - INFO - Iter(train) [486000/640000] base_lr: 2.8966e-05 lr: 4.4514e-06 eta: 1 day, 23:45:10 time: 1.1062 data_time: 0.0355 memory: 21518 grad_norm: 3.8165 loss: 1.2046 caption_loss_cls: 2.0291 grounding_loss_reg: 2.4175 detection_loss_cls: 0.0301 detection_loss_reg: 0.3274 semantic_segmentation_loss_cls: 0.0077 instance_segmentation_loss_cls: 0.0303 instance_segmentation_loss_reg: 0.3249 instance_segmentation_loss_poly: 0.8327 +2023/11/06 07:14:42 - mmengine - INFO - Saving checkpoint at 486000 iterations +2023/11/06 07:24:01 - mmengine - INFO - Iter(train) [486500/640000] base_lr: 2.8799e-05 lr: 4.4363e-06 eta: 1 day, 23:35:52 time: 1.0926 data_time: 0.0353 memory: 21518 grad_norm: 3.8878 loss: 1.2197 caption_loss_cls: 2.0308 grounding_loss_reg: 2.4187 detection_loss_cls: 0.0299 detection_loss_reg: 0.3261 semantic_segmentation_loss_cls: 0.0077 instance_segmentation_loss_cls: 0.0302 instance_segmentation_loss_reg: 0.3247 instance_segmentation_loss_poly: 0.8317 +2023/11/06 07:33:38 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231105_173749 +2023/11/06 07:33:38 - mmengine - INFO - Iter(train) [487000/640000] base_lr: 2.8633e-05 lr: 4.4212e-06 eta: 1 day, 23:27:40 time: 1.1005 data_time: 0.0354 memory: 21518 grad_norm: 3.8566 loss: 1.2124 caption_loss_cls: 2.0330 grounding_loss_reg: 2.4148 detection_loss_cls: 0.0299 detection_loss_reg: 0.3265 semantic_segmentation_loss_cls: 0.0077 instance_segmentation_loss_cls: 0.0302 instance_segmentation_loss_reg: 0.3254 instance_segmentation_loss_poly: 0.8324 +2023/11/06 07:33:38 - mmengine - INFO - Saving checkpoint at 487000 iterations +2023/11/06 07:43:07 - mmengine - INFO - Iter(train) [487500/640000] base_lr: 2.8468e-05 lr: 4.4061e-06 eta: 1 day, 23:18:56 time: 1.1018 data_time: 0.0355 memory: 21518 grad_norm: 3.8815 loss: 1.2237 caption_loss_cls: 2.0345 grounding_loss_reg: 2.4177 detection_loss_cls: 0.0297 detection_loss_reg: 0.3251 semantic_segmentation_loss_cls: 0.0077 instance_segmentation_loss_cls: 0.0302 instance_segmentation_loss_reg: 0.3255 instance_segmentation_loss_poly: 0.8331 +2023/11/06 07:52:23 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231105_173749 +2023/11/06 07:52:23 - mmengine - INFO - Iter(train) [488000/640000] base_lr: 2.8302e-05 lr: 4.3911e-06 eta: 1 day, 23:09:27 time: 1.1037 data_time: 0.0356 memory: 21518 grad_norm: 3.8800 loss: 1.2355 caption_loss_cls: 2.0378 grounding_loss_reg: 2.4167 detection_loss_cls: 0.0297 detection_loss_reg: 0.3248 semantic_segmentation_loss_cls: 0.0077 instance_segmentation_loss_cls: 0.0302 instance_segmentation_loss_reg: 0.3253 instance_segmentation_loss_poly: 0.8339 +2023/11/06 07:52:23 - mmengine - INFO - Saving checkpoint at 488000 iterations +2023/11/06 08:01:56 - mmengine - INFO - Iter(train) [488500/640000] base_lr: 2.8138e-05 lr: 4.3762e-06 eta: 1 day, 23:00:59 time: 1.1147 data_time: 0.0358 memory: 21518 grad_norm: 3.8663 loss: 1.2331 caption_loss_cls: 2.0322 grounding_loss_reg: 2.4158 detection_loss_cls: 0.0297 detection_loss_reg: 0.3253 semantic_segmentation_loss_cls: 0.0077 instance_segmentation_loss_cls: 0.0302 instance_segmentation_loss_reg: 0.3248 instance_segmentation_loss_poly: 0.8328 +2023/11/06 08:11:10 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231105_173749 +2023/11/06 08:11:10 - mmengine - INFO - Iter(train) [489000/640000] base_lr: 2.7973e-05 lr: 4.3612e-06 eta: 1 day, 22:51:23 time: 1.1173 data_time: 0.0360 memory: 21518 grad_norm: 3.9084 loss: 1.2357 caption_loss_cls: 2.0330 grounding_loss_reg: 2.4164 detection_loss_cls: 0.0296 detection_loss_reg: 0.3244 semantic_segmentation_loss_cls: 0.0077 instance_segmentation_loss_cls: 0.0302 instance_segmentation_loss_reg: 0.3250 instance_segmentation_loss_poly: 0.8327 +2023/11/06 08:11:10 - mmengine - INFO - Saving checkpoint at 489000 iterations +2023/11/06 08:20:49 - mmengine - INFO - Iter(train) [489500/640000] base_lr: 2.7810e-05 lr: 4.3463e-06 eta: 1 day, 22:43:09 time: 1.1258 data_time: 0.0364 memory: 21518 grad_norm: 3.8581 loss: 1.2365 caption_loss_cls: 2.0363 grounding_loss_reg: 2.4163 detection_loss_cls: 0.0297 detection_loss_reg: 0.3242 semantic_segmentation_loss_cls: 0.0077 instance_segmentation_loss_cls: 0.0302 instance_segmentation_loss_reg: 0.3246 instance_segmentation_loss_poly: 0.8310 +2023/11/06 08:30:37 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231105_173749 +2023/11/06 08:30:37 - mmengine - INFO - Iter(train) [490000/640000] base_lr: 2.7646e-05 lr: 4.3315e-06 eta: 1 day, 22:35:25 time: 1.1378 data_time: 0.0368 memory: 21518 grad_norm: 3.8135 loss: 1.2298 caption_loss_cls: 2.0376 grounding_loss_reg: 2.4165 detection_loss_cls: 0.0297 detection_loss_reg: 0.3243 semantic_segmentation_loss_cls: 0.0076 instance_segmentation_loss_cls: 0.0302 instance_segmentation_loss_reg: 0.3248 instance_segmentation_loss_poly: 0.8315 +2023/11/06 08:30:37 - mmengine - INFO - Saving checkpoint at 490000 iterations +2023/11/06 08:40:31 - mmengine - INFO - Iter(train) [490500/640000] base_lr: 2.7483e-05 lr: 4.3167e-06 eta: 1 day, 22:27:56 time: 1.1466 data_time: 0.0373 memory: 21518 grad_norm: 3.7842 loss: 1.2168 caption_loss_cls: 2.0366 grounding_loss_reg: 2.4182 detection_loss_cls: 0.0297 detection_loss_reg: 0.3245 semantic_segmentation_loss_cls: 0.0076 instance_segmentation_loss_cls: 0.0302 instance_segmentation_loss_reg: 0.3243 instance_segmentation_loss_poly: 0.8302 +2023/11/06 08:50:34 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231105_173749 +2023/11/06 08:50:34 - mmengine - INFO - Iter(train) [491000/640000] base_lr: 2.7321e-05 lr: 4.3019e-06 eta: 1 day, 22:20:52 time: 1.1530 data_time: 0.0374 memory: 21518 grad_norm: 3.7149 loss: 1.2091 caption_loss_cls: 2.0382 grounding_loss_reg: 2.4201 detection_loss_cls: 0.0297 detection_loss_reg: 0.3244 semantic_segmentation_loss_cls: 0.0076 instance_segmentation_loss_cls: 0.0302 instance_segmentation_loss_reg: 0.3235 instance_segmentation_loss_poly: 0.8287 +2023/11/06 08:50:34 - mmengine - INFO - Saving checkpoint at 491000 iterations +2023/11/06 09:00:14 - mmengine - INFO - Iter(train) [491500/640000] base_lr: 2.7159e-05 lr: 4.2871e-06 eta: 1 day, 22:12:37 time: 1.1561 data_time: 0.0389 memory: 21518 grad_norm: 3.7080 loss: 1.2077 caption_loss_cls: 2.0361 grounding_loss_reg: 2.4214 detection_loss_cls: 0.0297 detection_loss_reg: 0.3233 semantic_segmentation_loss_cls: 0.0076 instance_segmentation_loss_cls: 0.0302 instance_segmentation_loss_reg: 0.3238 instance_segmentation_loss_poly: 0.8292 +2023/11/06 09:10:13 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231105_173749 +2023/11/06 09:10:13 - mmengine - INFO - Iter(train) [492000/640000] base_lr: 2.6997e-05 lr: 4.2725e-06 eta: 1 day, 22:05:13 time: 1.1667 data_time: 0.0392 memory: 21518 grad_norm: 3.6802 loss: 1.1936 caption_loss_cls: 2.0368 grounding_loss_reg: 2.4202 detection_loss_cls: 0.0297 detection_loss_reg: 0.3230 semantic_segmentation_loss_cls: 0.0076 instance_segmentation_loss_cls: 0.0301 instance_segmentation_loss_reg: 0.3224 instance_segmentation_loss_poly: 0.8266 +2023/11/06 09:10:13 - mmengine - INFO - Saving checkpoint at 492000 iterations +2023/11/06 09:19:46 - mmengine - INFO - Iter(train) [492500/640000] base_lr: 2.6836e-05 lr: 4.2578e-06 eta: 1 day, 21:56:28 time: 1.1664 data_time: 0.0391 memory: 21518 grad_norm: 3.7001 loss: 1.1939 caption_loss_cls: 2.0403 grounding_loss_reg: 2.4188 detection_loss_cls: 0.0297 detection_loss_reg: 0.3230 semantic_segmentation_loss_cls: 0.0076 instance_segmentation_loss_cls: 0.0300 instance_segmentation_loss_reg: 0.3205 instance_segmentation_loss_poly: 0.8224 +2023/11/06 09:29:14 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231105_173749 +2023/11/06 09:29:14 - mmengine - INFO - Iter(train) [493000/640000] base_lr: 2.6675e-05 lr: 4.2432e-06 eta: 1 day, 21:47:30 time: 1.1701 data_time: 0.0391 memory: 21518 grad_norm: 3.6385 loss: 1.1819 caption_loss_cls: 2.0413 grounding_loss_reg: 2.4177 detection_loss_cls: 0.0297 detection_loss_reg: 0.3218 semantic_segmentation_loss_cls: 0.0076 instance_segmentation_loss_cls: 0.0300 instance_segmentation_loss_reg: 0.3213 instance_segmentation_loss_poly: 0.8236 +2023/11/06 09:29:14 - mmengine - INFO - Saving checkpoint at 493000 iterations +2023/11/06 09:38:40 - mmengine - INFO - Iter(train) [493500/640000] base_lr: 2.6515e-05 lr: 4.2286e-06 eta: 1 day, 21:38:22 time: 1.1668 data_time: 0.0391 memory: 21518 grad_norm: 3.6567 loss: 1.1739 caption_loss_cls: 2.0404 grounding_loss_reg: 2.4178 detection_loss_cls: 0.0296 detection_loss_reg: 0.3197 semantic_segmentation_loss_cls: 0.0076 instance_segmentation_loss_cls: 0.0300 instance_segmentation_loss_reg: 0.3213 instance_segmentation_loss_poly: 0.8239 +2023/11/06 09:48:12 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231105_173749 +2023/11/06 09:48:12 - mmengine - INFO - Iter(train) [494000/640000] base_lr: 2.6355e-05 lr: 4.2141e-06 eta: 1 day, 21:29:34 time: 1.1629 data_time: 0.0389 memory: 21518 grad_norm: 3.6973 loss: 1.1827 caption_loss_cls: 2.0410 grounding_loss_reg: 2.4179 detection_loss_cls: 0.0296 detection_loss_reg: 0.3203 semantic_segmentation_loss_cls: 0.0076 instance_segmentation_loss_cls: 0.0300 instance_segmentation_loss_reg: 0.3218 instance_segmentation_loss_poly: 0.8253 +2023/11/06 09:48:12 - mmengine - INFO - Saving checkpoint at 494000 iterations +2023/11/06 09:57:35 - mmengine - INFO - Iter(train) [494500/640000] base_lr: 2.6196e-05 lr: 4.1996e-06 eta: 1 day, 21:20:18 time: 1.1551 data_time: 0.0383 memory: 21518 grad_norm: 3.6856 loss: 1.1880 caption_loss_cls: 2.0436 grounding_loss_reg: 2.4181 detection_loss_cls: 0.0296 detection_loss_reg: 0.3200 semantic_segmentation_loss_cls: 0.0076 instance_segmentation_loss_cls: 0.0300 instance_segmentation_loss_reg: 0.3229 instance_segmentation_loss_poly: 0.8277 +2023/11/06 10:06:34 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231105_173749 +2023/11/06 10:06:34 - mmengine - INFO - Iter(train) [495000/640000] base_lr: 2.6037e-05 lr: 4.1851e-06 eta: 1 day, 21:09:53 time: 1.1392 data_time: 0.0380 memory: 21518 grad_norm: 3.7765 loss: 1.1991 caption_loss_cls: 2.0441 grounding_loss_reg: 2.4162 detection_loss_cls: 0.0296 detection_loss_reg: 0.3208 semantic_segmentation_loss_cls: 0.0076 instance_segmentation_loss_cls: 0.0300 instance_segmentation_loss_reg: 0.3232 instance_segmentation_loss_poly: 0.8282 +2023/11/06 10:06:34 - mmengine - INFO - Saving checkpoint at 495000 iterations +2023/11/06 10:16:38 - mmengine - INFO - Iter(train) [495500/640000] base_lr: 2.5878e-05 lr: 4.1707e-06 eta: 1 day, 21:02:33 time: 1.1450 data_time: 0.0372 memory: 21518 grad_norm: 3.7569 loss: 1.1755 caption_loss_cls: 2.0434 grounding_loss_reg: 2.4146 detection_loss_cls: 0.0296 detection_loss_reg: 0.3216 semantic_segmentation_loss_cls: 0.0077 instance_segmentation_loss_cls: 0.0300 instance_segmentation_loss_reg: 0.3225 instance_segmentation_loss_poly: 0.8274 +2023/11/06 10:26:02 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231105_173749 +2023/11/06 10:26:02 - mmengine - INFO - Iter(train) [496000/640000] base_lr: 2.5720e-05 lr: 4.1564e-06 eta: 1 day, 20:53:20 time: 1.1364 data_time: 0.0370 memory: 21518 grad_norm: 3.7882 loss: 1.1877 caption_loss_cls: 2.0446 grounding_loss_reg: 2.4149 detection_loss_cls: 0.0296 detection_loss_reg: 0.3222 semantic_segmentation_loss_cls: 0.0077 instance_segmentation_loss_cls: 0.0301 instance_segmentation_loss_reg: 0.3223 instance_segmentation_loss_poly: 0.8269 +2023/11/06 10:26:02 - mmengine - INFO - Saving checkpoint at 496000 iterations +2023/11/06 10:35:33 - mmengine - INFO - Iter(train) [496500/640000] base_lr: 2.5563e-05 lr: 4.1420e-06 eta: 1 day, 20:44:23 time: 1.1359 data_time: 0.0391 memory: 21518 grad_norm: 3.8092 loss: 1.1969 caption_loss_cls: 2.0498 grounding_loss_reg: 2.4092 detection_loss_cls: 0.0297 detection_loss_reg: 0.3218 semantic_segmentation_loss_cls: 0.0077 instance_segmentation_loss_cls: 0.0302 instance_segmentation_loss_reg: 0.3240 instance_segmentation_loss_poly: 0.8306 +2023/11/06 10:45:24 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231105_173749 +2023/11/06 10:45:24 - mmengine - INFO - Iter(train) [497000/640000] base_lr: 2.5405e-05 lr: 4.1278e-06 eta: 1 day, 20:36:23 time: 1.1417 data_time: 0.0393 memory: 21518 grad_norm: 3.8134 loss: 1.1995 caption_loss_cls: 2.0515 grounding_loss_reg: 2.4084 detection_loss_cls: 0.0297 detection_loss_reg: 0.3220 semantic_segmentation_loss_cls: 0.0077 instance_segmentation_loss_cls: 0.0302 instance_segmentation_loss_reg: 0.3250 instance_segmentation_loss_poly: 0.8328 +2023/11/06 10:45:25 - mmengine - INFO - Saving checkpoint at 497000 iterations +2023/11/06 10:54:48 - mmengine - INFO - Iter(train) [497500/640000] base_lr: 2.5249e-05 lr: 4.1135e-06 eta: 1 day, 20:27:06 time: 1.1412 data_time: 0.0394 memory: 21518 grad_norm: 3.8235 loss: 1.2109 caption_loss_cls: 2.0528 grounding_loss_reg: 2.4068 detection_loss_cls: 0.0298 detection_loss_reg: 0.3235 semantic_segmentation_loss_cls: 0.0076 instance_segmentation_loss_cls: 0.0303 instance_segmentation_loss_reg: 0.3264 instance_segmentation_loss_poly: 0.8352 +2023/11/06 11:04:05 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231105_173749 +2023/11/06 11:04:05 - mmengine - INFO - Iter(train) [498000/640000] base_lr: 2.5093e-05 lr: 4.0993e-06 eta: 1 day, 20:17:32 time: 1.1374 data_time: 0.0392 memory: 21518 grad_norm: 3.8222 loss: 1.2014 caption_loss_cls: 2.0527 grounding_loss_reg: 2.4061 detection_loss_cls: 0.0299 detection_loss_reg: 0.3245 semantic_segmentation_loss_cls: 0.0076 instance_segmentation_loss_cls: 0.0302 instance_segmentation_loss_reg: 0.3260 instance_segmentation_loss_poly: 0.8334 +2023/11/06 11:04:05 - mmengine - INFO - Saving checkpoint at 498000 iterations +2023/11/06 11:13:30 - mmengine - INFO - Iter(train) [498500/640000] base_lr: 2.4937e-05 lr: 4.0852e-06 eta: 1 day, 20:08:19 time: 1.1379 data_time: 0.0402 memory: 21518 grad_norm: 3.8358 loss: 1.1956 caption_loss_cls: 2.0501 grounding_loss_reg: 2.4062 detection_loss_cls: 0.0299 detection_loss_reg: 0.3255 semantic_segmentation_loss_cls: 0.0076 instance_segmentation_loss_cls: 0.0303 instance_segmentation_loss_reg: 0.3265 instance_segmentation_loss_poly: 0.8346 +2023/11/06 11:22:47 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231105_173749 +2023/11/06 11:22:47 - mmengine - INFO - Iter(train) [499000/640000] base_lr: 2.4781e-05 lr: 4.0710e-06 eta: 1 day, 19:58:43 time: 1.1423 data_time: 0.0404 memory: 21518 grad_norm: 3.8376 loss: 1.1985 caption_loss_cls: 2.0494 grounding_loss_reg: 2.4052 detection_loss_cls: 0.0299 detection_loss_reg: 0.3262 semantic_segmentation_loss_cls: 0.0076 instance_segmentation_loss_cls: 0.0301 instance_segmentation_loss_reg: 0.3257 instance_segmentation_loss_poly: 0.8331 +2023/11/06 11:22:47 - mmengine - INFO - Saving checkpoint at 499000 iterations +2023/11/06 11:32:00 - mmengine - INFO - Iter(train) [499500/640000] base_lr: 2.4627e-05 lr: 4.0570e-06 eta: 1 day, 19:49:00 time: 1.1296 data_time: 0.0395 memory: 21518 grad_norm: 3.8650 loss: 1.2156 caption_loss_cls: 2.0544 grounding_loss_reg: 2.4042 detection_loss_cls: 0.0299 detection_loss_reg: 0.3264 semantic_segmentation_loss_cls: 0.0076 instance_segmentation_loss_cls: 0.0301 instance_segmentation_loss_reg: 0.3252 instance_segmentation_loss_poly: 0.8310 +2023/11/06 11:40:43 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231105_173749 +2023/11/06 11:40:43 - mmengine - INFO - Iter(train) [500000/640000] base_lr: 2.4472e-05 lr: 4.0429e-06 eta: 1 day, 19:38:01 time: 1.1193 data_time: 0.0413 memory: 21518 grad_norm: 3.9262 loss: 1.2169 caption_loss_cls: 2.0520 grounding_loss_reg: 2.4024 detection_loss_cls: 0.0298 detection_loss_reg: 0.3254 semantic_segmentation_loss_cls: 0.0076 instance_segmentation_loss_cls: 0.0302 instance_segmentation_loss_reg: 0.3259 instance_segmentation_loss_poly: 0.8329 +2023/11/06 11:40:43 - mmengine - INFO - Saving checkpoint at 500000 iterations +2023/11/06 11:49:32 - mmengine - INFO - Evaluating bbox... +2023/11/06 11:50:29 - mmengine - INFO - bbox_mAP_copypaste: 0.461 0.635 0.501 0.287 0.508 0.605 +2023/11/06 11:50:29 - mmengine - INFO - Evaluating segm... +2023/11/06 11:51:43 - mmengine - INFO - segm_mAP_copypaste: 0.313 0.556 0.308 0.158 0.355 0.482 +2023/11/06 11:57:01 - mmengine - INFO - per class results: +2023/11/06 11:57:01 - mmengine - INFO - ++---------------------+-------+-------+ +| Class | IoU | Acc | ++---------------------+-------+-------+ +| wall | 75.07 | 90.05 | +| building | 79.71 | 92.71 | +| sky | 92.77 | 97.65 | +| floor | 80.4 | 90.4 | +| tree | 72.69 | 84.4 | +| ceiling | 83.35 | 93.26 | +| road | 82.92 | 89.88 | +| bed | 87.48 | 94.27 | +| windowpane | 59.26 | 72.79 | +| grass | 66.62 | 83.11 | +| cabinet | 58.24 | 69.39 | +| sidewalk | 66.39 | 78.07 | +| person | 78.66 | 89.92 | +| earth | 38.93 | 56.32 | +| door | 47.93 | 59.04 | +| table | 59.85 | 75.98 | +| mountain | 51.0 | 65.03 | +| plant | 50.46 | 61.34 | +| curtain | 69.9 | 82.77 | +| chair | 56.18 | 68.34 | +| car | 82.54 | 89.69 | +| water | 50.92 | 65.43 | +| painting | 71.31 | 83.86 | +| sofa | 66.1 | 81.32 | +| shelf | 43.81 | 63.89 | +| house | 27.52 | 30.43 | +| sea | 47.1 | 72.49 | +| mirror | 64.94 | 75.87 | +| rug | 61.12 | 67.34 | +| field | 30.69 | 40.05 | +| armchair | 42.85 | 61.55 | +| seat | 60.56 | 77.43 | +| fence | 44.02 | 60.13 | +| desk | 46.01 | 62.2 | +| rock | 35.87 | 51.52 | +| wardrobe | 47.3 | 66.63 | +| lamp | 60.45 | 73.27 | +| bathtub | 76.18 | 83.22 | +| railing | 24.89 | 34.36 | +| cushion | 56.5 | 66.67 | +| base | 22.43 | 30.09 | +| box | 25.21 | 33.03 | +| column | 44.9 | 55.52 | +| signboard | 36.51 | 45.92 | +| chest of drawers | 36.73 | 55.75 | +| counter | 30.99 | 40.03 | +| sand | 33.89 | 48.28 | +| sink | 70.76 | 77.73 | +| skyscraper | 42.54 | 52.27 | +| fireplace | 72.83 | 85.29 | +| refrigerator | 75.45 | 82.67 | +| grandstand | 30.43 | 69.66 | +| path | 24.19 | 31.01 | +| stairs | 24.97 | 30.89 | +| runway | 74.94 | 91.57 | +| case | 45.67 | 54.62 | +| pool table | 89.0 | 95.44 | +| pillow | 56.63 | 69.69 | +| screen door | 59.35 | 61.54 | +| stairway | 33.26 | 38.43 | +| river | 20.09 | 34.16 | +| bridge | 39.3 | 45.71 | +| bookcase | 35.55 | 56.16 | +| blind | 22.11 | 23.19 | +| coffee table | 64.24 | 83.61 | +| toilet | 83.71 | 88.93 | +| flower | 32.1 | 41.62 | +| book | 46.28 | 69.18 | +| hill | 9.53 | 20.21 | +| bench | 41.36 | 48.53 | +| countertop | 49.81 | 59.84 | +| stove | 75.9 | 84.68 | +| palm | 41.39 | 53.53 | +| kitchen island | 34.99 | 54.69 | +| computer | 72.48 | 81.65 | +| swivel chair | 46.4 | 62.02 | +| boat | 70.19 | 80.18 | +| bar | 36.54 | 45.33 | +| arcade machine | 29.1 | 30.56 | +| hovel | 14.42 | 19.16 | +| bus | 86.28 | 93.89 | +| towel | 60.42 | 71.24 | +| light | 43.6 | 49.25 | +| truck | 40.82 | 51.66 | +| tower | 32.85 | 41.12 | +| chandelier | 60.58 | 73.91 | +| awning | 20.68 | 22.83 | +| streetlight | 24.76 | 30.13 | +| booth | 46.77 | 47.97 | +| television receiver | 71.12 | 79.56 | +| airplane | 55.51 | 65.55 | +| dirt track | 1.26 | 5.59 | +| apparel | 38.04 | 54.44 | +| pole | 30.48 | 44.3 | +| land | 0.03 | 0.04 | +| bannister | 15.25 | 20.39 | +| escalator | 27.94 | 29.38 | +| ottoman | 49.73 | 63.89 | +| bottle | 27.54 | 34.17 | +| buffet | 42.49 | 53.09 | +| poster | 27.27 | 39.98 | +| stage | 16.55 | 24.94 | +| van | 42.73 | 56.24 | +| ship | 53.9 | 58.0 | +| fountain | 16.14 | 16.59 | +| conveyer belt | 79.05 | 88.05 | +| canopy | 21.7 | 24.05 | +| washer | 63.53 | 65.59 | +| plaything | 28.86 | 38.25 | +| swimming pool | 46.69 | 64.26 | +| stool | 43.62 | 56.45 | +| barrel | 51.16 | 68.8 | +| basket | 27.83 | 36.84 | +| waterfall | 50.88 | 57.05 | +| tent | 87.97 | 98.37 | +| bag | 12.49 | 14.55 | +| minibike | 70.85 | 79.36 | +| cradle | 71.23 | 89.37 | +| oven | 35.55 | 47.06 | +| ball | 41.0 | 45.35 | +| food | 59.78 | 69.63 | +| step | 18.78 | 22.75 | +| tank | 43.19 | 51.43 | +| trade name | 21.6 | 23.9 | +| microwave | 76.21 | 84.83 | +| pot | 44.96 | 49.97 | +| animal | 63.73 | 67.67 | +| bicycle | 54.93 | 70.28 | +| lake | 52.39 | 55.25 | +| dishwasher | 49.46 | 64.89 | +| screen | 55.02 | 67.79 | +| blanket | 7.22 | 9.35 | +| sculpture | 55.79 | 66.3 | +| hood | 53.74 | 57.01 | +| sconce | 34.43 | 42.24 | +| vase | 44.83 | 58.91 | +| traffic light | 35.3 | 57.79 | +| tray | 11.51 | 16.57 | +| ashcan | 42.26 | 55.21 | +| fan | 53.34 | 66.88 | +| pier | 47.77 | 78.96 | +| crt screen | 9.41 | 29.55 | +| plate | 55.36 | 71.11 | +| monitor | 16.96 | 19.42 | +| bulletin board | 40.72 | 51.21 | +| shower | 4.36 | 12.66 | +| radiator | 39.65 | 41.7 | +| glass | 16.16 | 17.84 | +| clock | 26.59 | 30.9 | +| flag | 29.65 | 34.76 | ++---------------------+-------+-------+ +2023/11/06 11:57:49 - mmengine - INFO - Iter(val) [209/209] coco/bbox_mAP: 0.4610 coco/bbox_mAP_50: 0.6350 coco/bbox_mAP_75: 0.5010 coco/bbox_mAP_s: 0.2870 coco/bbox_mAP_m: 0.5080 coco/bbox_mAP_l: 0.6050 coco/segm_mAP: 0.3130 coco/segm_mAP_50: 0.5560 coco/segm_mAP_75: 0.3080 coco/segm_mAP_s: 0.1580 coco/segm_mAP_m: 0.3550 coco/segm_mAP_l: 0.4820 Bleu_1: 0.7495 Bleu_2: 0.5851 Bleu_3: 0.4469 Bleu_4: 0.3399 METEOR: 0.2660 ROUGE_L: 0.5517 CIDEr: 1.0772 SPICE: 0.1974 aAcc: 81.8700 mIoU: 46.8300 mAcc: 57.2200 visual-grounding/miou: 0.7851 visual-grounding/acc: 0.8549 data_time: 0.1567 time: 0.6749 +2023/11/06 12:07:11 - mmengine - INFO - Iter(train) [500500/640000] base_lr: 2.4318e-05 lr: 4.0289e-06 eta: 1 day, 19:28:50 time: 1.1180 data_time: 0.0368 memory: 21518 grad_norm: 3.8710 loss: 1.2025 caption_loss_cls: 2.0492 grounding_loss_reg: 2.3989 detection_loss_cls: 0.0298 detection_loss_reg: 0.3258 semantic_segmentation_loss_cls: 0.0076 instance_segmentation_loss_cls: 0.0301 instance_segmentation_loss_reg: 0.3253 instance_segmentation_loss_poly: 0.8313 +2023/11/06 12:16:24 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231105_173749 +2023/11/06 12:16:24 - mmengine - INFO - Iter(train) [501000/640000] base_lr: 2.4165e-05 lr: 4.0150e-06 eta: 1 day, 19:19:07 time: 1.1082 data_time: 0.0365 memory: 21518 grad_norm: 3.9582 loss: 1.2132 caption_loss_cls: 2.0523 grounding_loss_reg: 2.3972 detection_loss_cls: 0.0297 detection_loss_reg: 0.3247 semantic_segmentation_loss_cls: 0.0076 instance_segmentation_loss_cls: 0.0301 instance_segmentation_loss_reg: 0.3250 instance_segmentation_loss_poly: 0.8311 +2023/11/06 12:16:24 - mmengine - INFO - Saving checkpoint at 501000 iterations +2023/11/06 12:25:37 - mmengine - INFO - Iter(train) [501500/640000] base_lr: 2.4012e-05 lr: 4.0011e-06 eta: 1 day, 19:09:27 time: 1.1057 data_time: 0.0362 memory: 21518 grad_norm: 3.9528 loss: 1.2073 caption_loss_cls: 2.0552 grounding_loss_reg: 2.3942 detection_loss_cls: 0.0296 detection_loss_reg: 0.3244 semantic_segmentation_loss_cls: 0.0076 instance_segmentation_loss_cls: 0.0301 instance_segmentation_loss_reg: 0.3248 instance_segmentation_loss_poly: 0.8299 +2023/11/06 12:34:30 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231105_173749 +2023/11/06 12:34:30 - mmengine - INFO - Iter(train) [502000/640000] base_lr: 2.3859e-05 lr: 3.9872e-06 eta: 1 day, 18:58:59 time: 1.0996 data_time: 0.0361 memory: 21518 grad_norm: 3.9796 loss: 1.2069 caption_loss_cls: 2.0543 grounding_loss_reg: 2.3945 detection_loss_cls: 0.0296 detection_loss_reg: 0.3243 semantic_segmentation_loss_cls: 0.0076 instance_segmentation_loss_cls: 0.0299 instance_segmentation_loss_reg: 0.3242 instance_segmentation_loss_poly: 0.8289 +2023/11/06 12:34:30 - mmengine - INFO - Saving checkpoint at 502000 iterations +2023/11/06 12:44:34 - mmengine - INFO - Iter(train) [502500/640000] base_lr: 2.3707e-05 lr: 3.9734e-06 eta: 1 day, 18:51:18 time: 1.1093 data_time: 0.0354 memory: 21518 grad_norm: 3.9263 loss: 1.1993 caption_loss_cls: 2.0519 grounding_loss_reg: 2.3927 detection_loss_cls: 0.0296 detection_loss_reg: 0.3246 semantic_segmentation_loss_cls: 0.0076 instance_segmentation_loss_cls: 0.0298 instance_segmentation_loss_reg: 0.3228 instance_segmentation_loss_poly: 0.8258 +2023/11/06 12:53:53 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231105_173749 +2023/11/06 12:53:53 - mmengine - INFO - Iter(train) [503000/640000] base_lr: 2.3556e-05 lr: 3.9596e-06 eta: 1 day, 18:41:51 time: 1.1099 data_time: 0.0352 memory: 21518 grad_norm: 3.9202 loss: 1.1970 caption_loss_cls: 2.0534 grounding_loss_reg: 2.3921 detection_loss_cls: 0.0296 detection_loss_reg: 0.3245 semantic_segmentation_loss_cls: 0.0076 instance_segmentation_loss_cls: 0.0298 instance_segmentation_loss_reg: 0.3220 instance_segmentation_loss_poly: 0.8248 +2023/11/06 12:53:53 - mmengine - INFO - Saving checkpoint at 503000 iterations +2023/11/06 13:03:51 - mmengine - INFO - Iter(train) [503500/640000] base_lr: 2.3405e-05 lr: 3.9459e-06 eta: 1 day, 18:33:54 time: 1.1210 data_time: 0.0369 memory: 21518 grad_norm: 3.9073 loss: 1.1893 caption_loss_cls: 2.0545 grounding_loss_reg: 2.3924 detection_loss_cls: 0.0294 detection_loss_reg: 0.3228 semantic_segmentation_loss_cls: 0.0076 instance_segmentation_loss_cls: 0.0297 instance_segmentation_loss_reg: 0.3217 instance_segmentation_loss_poly: 0.8233 +2023/11/06 13:13:06 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231105_173749 +2023/11/06 13:13:06 - mmengine - INFO - Iter(train) [504000/640000] base_lr: 2.3254e-05 lr: 3.9322e-06 eta: 1 day, 18:24:18 time: 1.1292 data_time: 0.0350 memory: 21518 grad_norm: 3.8476 loss: 1.1802 caption_loss_cls: 2.0541 grounding_loss_reg: 2.3935 detection_loss_cls: 0.0293 detection_loss_reg: 0.3213 semantic_segmentation_loss_cls: 0.0076 instance_segmentation_loss_cls: 0.0296 instance_segmentation_loss_reg: 0.3214 instance_segmentation_loss_poly: 0.8231 +2023/11/06 13:13:06 - mmengine - INFO - Saving checkpoint at 504000 iterations +2023/11/06 13:23:21 - mmengine - INFO - Iter(train) [504500/640000] base_lr: 2.3104e-05 lr: 3.9185e-06 eta: 1 day, 18:16:57 time: 1.1417 data_time: 0.0377 memory: 21518 grad_norm: 3.8952 loss: 1.1929 caption_loss_cls: 2.0522 grounding_loss_reg: 2.3975 detection_loss_cls: 0.0293 detection_loss_reg: 0.3210 semantic_segmentation_loss_cls: 0.0076 instance_segmentation_loss_cls: 0.0296 instance_segmentation_loss_reg: 0.3217 instance_segmentation_loss_poly: 0.8225 +2023/11/06 13:43:41 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231105_173749 +2023/11/06 13:43:41 - mmengine - INFO - Iter(train) [505000/640000] base_lr: 2.2954e-05 lr: 3.9049e-06 eta: 1 day, 18:31:50 time: 1.3084 data_time: 0.0687 memory: 21518 grad_norm: 3.8429 loss: 1.1813 caption_loss_cls: 2.0501 grounding_loss_reg: 2.3982 detection_loss_cls: 0.0292 detection_loss_reg: 0.3203 semantic_segmentation_loss_cls: 0.0076 instance_segmentation_loss_cls: 0.0296 instance_segmentation_loss_reg: 0.3226 instance_segmentation_loss_poly: 0.8240 +2023/11/06 13:43:41 - mmengine - INFO - Saving checkpoint at 505000 iterations +2023/11/06 13:53:30 - mmengine - INFO - Iter(train) [505500/640000] base_lr: 2.2805e-05 lr: 3.8913e-06 eta: 1 day, 18:23:09 time: 1.3171 data_time: 0.0690 memory: 21518 grad_norm: 3.8323 loss: 1.1805 caption_loss_cls: 2.0467 grounding_loss_reg: 2.3975 detection_loss_cls: 0.0292 detection_loss_reg: 0.3206 semantic_segmentation_loss_cls: 0.0076 instance_segmentation_loss_cls: 0.0296 instance_segmentation_loss_reg: 0.3229 instance_segmentation_loss_poly: 0.8242 +2023/11/06 14:02:16 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231105_173749 +2023/11/06 14:02:16 - mmengine - INFO - Iter(train) [506000/640000] base_lr: 2.2656e-05 lr: 3.8778e-06 eta: 1 day, 18:12:13 time: 1.3155 data_time: 0.0688 memory: 21518 grad_norm: 3.7909 loss: 1.1761 caption_loss_cls: 2.0436 grounding_loss_reg: 2.3986 detection_loss_cls: 0.0291 detection_loss_reg: 0.3209 semantic_segmentation_loss_cls: 0.0076 instance_segmentation_loss_cls: 0.0296 instance_segmentation_loss_reg: 0.3220 instance_segmentation_loss_poly: 0.8229 +2023/11/06 14:02:16 - mmengine - INFO - Saving checkpoint at 506000 iterations +2023/11/06 14:11:39 - mmengine - INFO - Iter(train) [506500/640000] base_lr: 2.2508e-05 lr: 3.8643e-06 eta: 1 day, 18:02:36 time: 1.3054 data_time: 0.0686 memory: 21518 grad_norm: 3.8355 loss: 1.1876 caption_loss_cls: 2.0419 grounding_loss_reg: 2.3969 detection_loss_cls: 0.0291 detection_loss_reg: 0.3214 semantic_segmentation_loss_cls: 0.0076 instance_segmentation_loss_cls: 0.0296 instance_segmentation_loss_reg: 0.3220 instance_segmentation_loss_poly: 0.8222 +2023/11/06 14:20:41 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231105_173749 +2023/11/06 14:20:41 - mmengine - INFO - Iter(train) [507000/640000] base_lr: 2.2360e-05 lr: 3.8509e-06 eta: 1 day, 17:52:16 time: 1.3012 data_time: 0.0686 memory: 21518 grad_norm: 3.8452 loss: 1.1856 caption_loss_cls: 2.0401 grounding_loss_reg: 2.3932 detection_loss_cls: 0.0290 detection_loss_reg: 0.3199 semantic_segmentation_loss_cls: 0.0075 instance_segmentation_loss_cls: 0.0296 instance_segmentation_loss_reg: 0.3213 instance_segmentation_loss_poly: 0.8203 +2023/11/06 14:20:41 - mmengine - INFO - Saving checkpoint at 507000 iterations +2023/11/06 14:31:45 - mmengine - INFO - Iter(train) [507500/640000] base_lr: 2.2212e-05 lr: 3.8375e-06 eta: 1 day, 17:46:12 time: 1.3177 data_time: 0.0688 memory: 21518 grad_norm: 3.8773 loss: 1.1926 caption_loss_cls: 2.0382 grounding_loss_reg: 2.3905 detection_loss_cls: 0.0290 detection_loss_reg: 0.3208 semantic_segmentation_loss_cls: 0.0076 instance_segmentation_loss_cls: 0.0296 instance_segmentation_loss_reg: 0.3216 instance_segmentation_loss_poly: 0.8200 +2023/11/06 14:41:25 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231105_173749 +2023/11/06 14:41:25 - mmengine - INFO - Iter(train) [508000/640000] base_lr: 2.2066e-05 lr: 3.8241e-06 eta: 1 day, 17:37:09 time: 1.3238 data_time: 0.0691 memory: 21518 grad_norm: 3.8705 loss: 1.1937 caption_loss_cls: 2.0371 grounding_loss_reg: 2.3848 detection_loss_cls: 0.0289 detection_loss_reg: 0.3201 semantic_segmentation_loss_cls: 0.0076 instance_segmentation_loss_cls: 0.0296 instance_segmentation_loss_reg: 0.3225 instance_segmentation_loss_poly: 0.8211 +2023/11/06 14:41:25 - mmengine - INFO - Saving checkpoint at 508000 iterations +2023/11/06 14:50:56 - mmengine - INFO - Iter(train) [508500/640000] base_lr: 2.1919e-05 lr: 3.8108e-06 eta: 1 day, 17:27:49 time: 1.3129 data_time: 0.0687 memory: 21518 grad_norm: 3.8227 loss: 1.1770 caption_loss_cls: 2.0367 grounding_loss_reg: 2.3836 detection_loss_cls: 0.0289 detection_loss_reg: 0.3201 semantic_segmentation_loss_cls: 0.0076 instance_segmentation_loss_cls: 0.0296 instance_segmentation_loss_reg: 0.3226 instance_segmentation_loss_poly: 0.8226 +2023/11/06 15:00:20 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231105_173749 +2023/11/06 15:00:20 - mmengine - INFO - Iter(train) [509000/640000] base_lr: 2.1773e-05 lr: 3.7976e-06 eta: 1 day, 17:18:13 time: 1.1490 data_time: 0.0379 memory: 21518 grad_norm: 3.8546 loss: 1.1799 caption_loss_cls: 2.0338 grounding_loss_reg: 2.3830 detection_loss_cls: 0.0289 detection_loss_reg: 0.3203 semantic_segmentation_loss_cls: 0.0076 instance_segmentation_loss_cls: 0.0296 instance_segmentation_loss_reg: 0.3217 instance_segmentation_loss_poly: 0.8213 +2023/11/06 15:00:20 - mmengine - INFO - Saving checkpoint at 509000 iterations +2023/11/06 15:12:44 - mmengine - INFO - Iter(train) [509500/640000] base_lr: 2.1628e-05 lr: 3.7843e-06 eta: 1 day, 17:14:34 time: 1.1876 data_time: 0.0452 memory: 21518 grad_norm: 3.8523 loss: 1.1793 caption_loss_cls: 2.0327 grounding_loss_reg: 2.3820 detection_loss_cls: 0.0290 detection_loss_reg: 0.3218 semantic_segmentation_loss_cls: 0.0076 instance_segmentation_loss_cls: 0.0295 instance_segmentation_loss_reg: 0.3208 instance_segmentation_loss_poly: 0.8190 +2023/11/06 15:21:54 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231105_173749 +2023/11/06 15:21:54 - mmengine - INFO - Iter(train) [510000/640000] base_lr: 2.1483e-05 lr: 3.7712e-06 eta: 1 day, 17:04:29 time: 1.1937 data_time: 0.0453 memory: 21518 grad_norm: 3.8334 loss: 1.1755 caption_loss_cls: 2.0325 grounding_loss_reg: 2.3796 detection_loss_cls: 0.0289 detection_loss_reg: 0.3205 semantic_segmentation_loss_cls: 0.0076 instance_segmentation_loss_cls: 0.0294 instance_segmentation_loss_reg: 0.3208 instance_segmentation_loss_poly: 0.8192 +2023/11/06 15:21:54 - mmengine - INFO - Saving checkpoint at 510000 iterations +2023/11/06 15:31:08 - mmengine - INFO - Iter(train) [510500/640000] base_lr: 2.1338e-05 lr: 3.7580e-06 eta: 1 day, 16:54:30 time: 1.1913 data_time: 0.0451 memory: 21518 grad_norm: 3.8188 loss: 1.1681 caption_loss_cls: 2.0318 grounding_loss_reg: 2.3773 detection_loss_cls: 0.0288 detection_loss_reg: 0.3204 semantic_segmentation_loss_cls: 0.0076 instance_segmentation_loss_cls: 0.0294 instance_segmentation_loss_reg: 0.3206 instance_segmentation_loss_poly: 0.8189 +2023/11/06 15:40:25 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231105_173749 +2023/11/06 15:40:25 - mmengine - INFO - Iter(train) [511000/640000] base_lr: 2.1194e-05 lr: 3.7449e-06 eta: 1 day, 16:44:37 time: 1.1950 data_time: 0.0451 memory: 21518 grad_norm: 3.7933 loss: 1.1636 caption_loss_cls: 2.0307 grounding_loss_reg: 2.3745 detection_loss_cls: 0.0287 detection_loss_reg: 0.3196 semantic_segmentation_loss_cls: 0.0076 instance_segmentation_loss_cls: 0.0293 instance_segmentation_loss_reg: 0.3201 instance_segmentation_loss_poly: 0.8175 +2023/11/06 15:40:25 - mmengine - INFO - Saving checkpoint at 511000 iterations +2023/11/06 15:49:38 - mmengine - INFO - Iter(train) [511500/640000] base_lr: 2.1051e-05 lr: 3.7319e-06 eta: 1 day, 16:34:40 time: 1.1674 data_time: 0.0435 memory: 21518 grad_norm: 3.7863 loss: 1.1610 caption_loss_cls: 2.0302 grounding_loss_reg: 2.3735 detection_loss_cls: 0.0287 detection_loss_reg: 0.3196 semantic_segmentation_loss_cls: 0.0076 instance_segmentation_loss_cls: 0.0293 instance_segmentation_loss_reg: 0.3203 instance_segmentation_loss_poly: 0.8178 +2023/11/06 15:59:12 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231105_173749 +2023/11/06 15:59:12 - mmengine - INFO - Iter(train) [512000/640000] base_lr: 2.0908e-05 lr: 3.7189e-06 eta: 1 day, 16:25:21 time: 1.1660 data_time: 0.0432 memory: 21518 grad_norm: 3.7763 loss: 1.1525 caption_loss_cls: 2.0281 grounding_loss_reg: 2.3692 detection_loss_cls: 0.0287 detection_loss_reg: 0.3197 semantic_segmentation_loss_cls: 0.0076 instance_segmentation_loss_cls: 0.0294 instance_segmentation_loss_reg: 0.3210 instance_segmentation_loss_poly: 0.8186 +2023/11/06 15:59:12 - mmengine - INFO - Saving checkpoint at 512000 iterations +2023/11/06 16:08:37 - mmengine - INFO - Iter(train) [512500/640000] base_lr: 2.0765e-05 lr: 3.7059e-06 eta: 1 day, 16:15:46 time: 1.1643 data_time: 0.0434 memory: 21518 grad_norm: 3.8379 loss: 1.1646 caption_loss_cls: 2.0239 grounding_loss_reg: 2.3689 detection_loss_cls: 0.0287 detection_loss_reg: 0.3198 semantic_segmentation_loss_cls: 0.0076 instance_segmentation_loss_cls: 0.0293 instance_segmentation_loss_reg: 0.3221 instance_segmentation_loss_poly: 0.8207 +2023/11/06 16:18:24 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231105_173749 +2023/11/06 16:18:24 - mmengine - INFO - Iter(train) [513000/640000] base_lr: 2.0623e-05 lr: 3.6930e-06 eta: 1 day, 16:06:50 time: 1.1700 data_time: 0.0438 memory: 21518 grad_norm: 3.7962 loss: 1.1610 caption_loss_cls: 2.0267 grounding_loss_reg: 2.3682 detection_loss_cls: 0.0286 detection_loss_reg: 0.3202 semantic_segmentation_loss_cls: 0.0076 instance_segmentation_loss_cls: 0.0293 instance_segmentation_loss_reg: 0.3213 instance_segmentation_loss_poly: 0.8191 +2023/11/06 16:18:24 - mmengine - INFO - Saving checkpoint at 513000 iterations +2023/11/06 16:27:54 - mmengine - INFO - Iter(train) [513500/640000] base_lr: 2.0481e-05 lr: 3.6801e-06 eta: 1 day, 15:57:22 time: 1.1266 data_time: 0.0363 memory: 21518 grad_norm: 3.8362 loss: 1.1595 caption_loss_cls: 2.0251 grounding_loss_reg: 2.3666 detection_loss_cls: 0.0286 detection_loss_reg: 0.3208 semantic_segmentation_loss_cls: 0.0076 instance_segmentation_loss_cls: 0.0292 instance_segmentation_loss_reg: 0.3200 instance_segmentation_loss_poly: 0.8163 +2023/11/06 16:37:56 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231105_173749 +2023/11/06 16:37:56 - mmengine - INFO - Iter(train) [514000/640000] base_lr: 2.0340e-05 lr: 3.6673e-06 eta: 1 day, 15:48:54 time: 1.1395 data_time: 0.0368 memory: 21518 grad_norm: 3.8443 loss: 1.1645 caption_loss_cls: 2.0217 grounding_loss_reg: 2.3669 detection_loss_cls: 0.0286 detection_loss_reg: 0.3198 semantic_segmentation_loss_cls: 0.0076 instance_segmentation_loss_cls: 0.0292 instance_segmentation_loss_reg: 0.3193 instance_segmentation_loss_poly: 0.8142 +2023/11/06 16:37:56 - mmengine - INFO - Saving checkpoint at 514000 iterations +2023/11/06 16:47:01 - mmengine - INFO - Iter(train) [514500/640000] base_lr: 2.0200e-05 lr: 3.6545e-06 eta: 1 day, 15:38:42 time: 1.1374 data_time: 0.0368 memory: 21518 grad_norm: 3.8837 loss: 1.1723 caption_loss_cls: 2.0218 grounding_loss_reg: 2.3651 detection_loss_cls: 0.0285 detection_loss_reg: 0.3187 semantic_segmentation_loss_cls: 0.0076 instance_segmentation_loss_cls: 0.0293 instance_segmentation_loss_reg: 0.3198 instance_segmentation_loss_poly: 0.8155 +2023/11/06 16:56:29 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231105_173749 +2023/11/06 16:56:29 - mmengine - INFO - Iter(train) [515000/640000] base_lr: 2.0059e-05 lr: 3.6418e-06 eta: 1 day, 15:29:11 time: 1.1401 data_time: 0.0369 memory: 21518 grad_norm: 3.9181 loss: 1.1771 caption_loss_cls: 2.0260 grounding_loss_reg: 2.3649 detection_loss_cls: 0.0285 detection_loss_reg: 0.3185 semantic_segmentation_loss_cls: 0.0076 instance_segmentation_loss_cls: 0.0293 instance_segmentation_loss_reg: 0.3203 instance_segmentation_loss_poly: 0.8152 +2023/11/06 16:56:29 - mmengine - INFO - Saving checkpoint at 515000 iterations +2023/11/06 17:05:43 - mmengine - INFO - Iter(train) [515500/640000] base_lr: 1.9920e-05 lr: 3.6291e-06 eta: 1 day, 15:19:17 time: 1.1404 data_time: 0.0367 memory: 21518 grad_norm: 3.9008 loss: 1.1703 caption_loss_cls: 2.0228 grounding_loss_reg: 2.3656 detection_loss_cls: 0.0285 detection_loss_reg: 0.3183 semantic_segmentation_loss_cls: 0.0076 instance_segmentation_loss_cls: 0.0292 instance_segmentation_loss_reg: 0.3199 instance_segmentation_loss_poly: 0.8144 +2023/11/06 17:14:52 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231105_173749 +2023/11/06 17:14:52 - mmengine - INFO - Iter(train) [516000/640000] base_lr: 1.9781e-05 lr: 3.6164e-06 eta: 1 day, 15:09:15 time: 1.1341 data_time: 0.0365 memory: 21518 grad_norm: 3.9188 loss: 1.1747 caption_loss_cls: 2.0200 grounding_loss_reg: 2.3650 detection_loss_cls: 0.0286 detection_loss_reg: 0.3179 semantic_segmentation_loss_cls: 0.0076 instance_segmentation_loss_cls: 0.0292 instance_segmentation_loss_reg: 0.3195 instance_segmentation_loss_poly: 0.8135 +2023/11/06 17:14:52 - mmengine - INFO - Saving checkpoint at 516000 iterations +2023/11/06 17:24:24 - mmengine - INFO - Iter(train) [516500/640000] base_lr: 1.9642e-05 lr: 3.6038e-06 eta: 1 day, 14:59:51 time: 1.1358 data_time: 0.0367 memory: 21518 grad_norm: 3.8947 loss: 1.1757 caption_loss_cls: 2.0195 grounding_loss_reg: 2.3638 detection_loss_cls: 0.0286 detection_loss_reg: 0.3179 semantic_segmentation_loss_cls: 0.0076 instance_segmentation_loss_cls: 0.0293 instance_segmentation_loss_reg: 0.3202 instance_segmentation_loss_poly: 0.8140 +2023/11/06 17:33:50 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231105_173749 +2023/11/06 17:33:50 - mmengine - INFO - Iter(train) [517000/640000] base_lr: 1.9504e-05 lr: 3.5912e-06 eta: 1 day, 14:50:17 time: 1.1304 data_time: 0.0363 memory: 21518 grad_norm: 3.9093 loss: 1.1782 caption_loss_cls: 2.0193 grounding_loss_reg: 2.3645 detection_loss_cls: 0.0285 detection_loss_reg: 0.3174 semantic_segmentation_loss_cls: 0.0075 instance_segmentation_loss_cls: 0.0293 instance_segmentation_loss_reg: 0.3195 instance_segmentation_loss_poly: 0.8131 +2023/11/06 17:33:50 - mmengine - INFO - Saving checkpoint at 517000 iterations +2023/11/06 19:50:53 - mmengine - INFO - Iter(train) [517500/640000] base_lr: 1.9366e-05 lr: 3.5787e-06 eta: 1 day, 14:51:49 time: 1.1310 data_time: 0.0328 memory: 21520 grad_norm: 3.8871 loss: 1.1761 caption_loss_cls: 2.0195 grounding_loss_reg: 2.3618 detection_loss_cls: 0.0286 detection_loss_reg: 0.3179 semantic_segmentation_loss_cls: 0.0075 instance_segmentation_loss_cls: 0.0293 instance_segmentation_loss_reg: 0.3195 instance_segmentation_loss_poly: 0.8139 +2023/11/06 20:00:07 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231106_193813 +2023/11/06 20:00:07 - mmengine - INFO - Iter(train) [518000/640000] base_lr: 1.9229e-05 lr: 3.5662e-06 eta: 1 day, 14:06:04 time: 1.1188 data_time: 0.0324 memory: 21520 grad_norm: 3.9559 loss: 1.1717 caption_loss_cls: 2.0184 grounding_loss_reg: 2.3603 detection_loss_cls: 0.0285 detection_loss_reg: 0.3176 semantic_segmentation_loss_cls: 0.0075 instance_segmentation_loss_cls: 0.0294 instance_segmentation_loss_reg: 0.3203 instance_segmentation_loss_poly: 0.8157 +2023/11/06 20:00:07 - mmengine - INFO - Saving checkpoint at 518000 iterations +2023/11/06 20:09:35 - mmengine - INFO - Iter(train) [518500/640000] base_lr: 1.9092e-05 lr: 3.5538e-06 eta: 1 day, 14:03:36 time: 1.1244 data_time: 0.0324 memory: 21520 grad_norm: 3.9276 loss: 1.1648 caption_loss_cls: 2.0179 grounding_loss_reg: 2.3598 detection_loss_cls: 0.0285 detection_loss_reg: 0.3178 semantic_segmentation_loss_cls: 0.0075 instance_segmentation_loss_cls: 0.0293 instance_segmentation_loss_reg: 0.3202 instance_segmentation_loss_poly: 0.8154 +2023/11/06 20:18:25 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231106_193813 +2023/11/06 20:18:25 - mmengine - INFO - Iter(train) [519000/640000] base_lr: 1.8956e-05 lr: 3.5414e-06 eta: 1 day, 13:20:12 time: 1.1152 data_time: 0.0320 memory: 21520 grad_norm: 3.9219 loss: 1.1624 caption_loss_cls: 2.0146 grounding_loss_reg: 2.3593 detection_loss_cls: 0.0285 detection_loss_reg: 0.3177 semantic_segmentation_loss_cls: 0.0075 instance_segmentation_loss_cls: 0.0293 instance_segmentation_loss_reg: 0.3200 instance_segmentation_loss_poly: 0.8156 +2023/11/06 20:18:25 - mmengine - INFO - Saving checkpoint at 519000 iterations +2023/11/06 20:27:57 - mmengine - INFO - Iter(train) [519500/640000] base_lr: 1.8820e-05 lr: 3.5291e-06 eta: 1 day, 13:23:21 time: 1.1194 data_time: 0.0323 memory: 21520 grad_norm: 3.8798 loss: 1.1640 caption_loss_cls: 2.0143 grounding_loss_reg: 2.3564 detection_loss_cls: 0.0286 detection_loss_reg: 0.3180 semantic_segmentation_loss_cls: 0.0075 instance_segmentation_loss_cls: 0.0293 instance_segmentation_loss_reg: 0.3209 instance_segmentation_loss_poly: 0.8182 +2023/11/06 20:37:24 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231106_193813 +2023/11/06 20:37:24 - mmengine - INFO - Iter(train) [520000/640000] base_lr: 1.8685e-05 lr: 3.5168e-06 eta: 1 day, 13:19:25 time: 1.1238 data_time: 0.0323 memory: 21520 grad_norm: 3.8833 loss: 1.1579 caption_loss_cls: 2.0143 grounding_loss_reg: 2.3517 detection_loss_cls: 0.0285 detection_loss_reg: 0.3177 semantic_segmentation_loss_cls: 0.0075 instance_segmentation_loss_cls: 0.0291 instance_segmentation_loss_reg: 0.3188 instance_segmentation_loss_poly: 0.8146 +2023/11/06 20:37:24 - mmengine - INFO - Saving checkpoint at 520000 iterations +2023/11/06 20:45:55 - mmengine - INFO - Evaluating bbox... +2023/11/06 20:46:51 - mmengine - INFO - bbox_mAP_copypaste: 0.461 0.636 0.500 0.282 0.511 0.605 +2023/11/06 20:46:51 - mmengine - INFO - Evaluating segm... +2023/11/06 20:48:04 - mmengine - INFO - segm_mAP_copypaste: 0.314 0.558 0.307 0.155 0.359 0.485 +2023/11/06 20:52:49 - mmengine - INFO - per class results: +2023/11/06 20:52:49 - mmengine - INFO - ++---------------------+-------+-------+ +| Class | IoU | Acc | ++---------------------+-------+-------+ +| wall | 75.98 | 89.4 | +| building | 80.8 | 90.38 | +| sky | 92.93 | 97.63 | +| floor | 80.41 | 89.57 | +| tree | 73.19 | 85.54 | +| ceiling | 83.37 | 93.92 | +| road | 82.34 | 88.86 | +| bed | 88.04 | 94.39 | +| windowpane | 59.03 | 73.26 | +| grass | 67.3 | 83.02 | +| cabinet | 57.85 | 71.77 | +| sidewalk | 66.26 | 82.82 | +| person | 79.25 | 90.79 | +| earth | 36.8 | 50.47 | +| door | 49.44 | 63.7 | +| table | 59.34 | 76.72 | +| mountain | 51.86 | 67.12 | +| plant | 51.9 | 64.52 | +| curtain | 66.43 | 83.72 | +| chair | 56.95 | 71.71 | +| car | 83.48 | 92.07 | +| water | 50.77 | 63.76 | +| painting | 69.72 | 85.85 | +| sofa | 67.18 | 81.3 | +| shelf | 42.61 | 60.96 | +| house | 39.33 | 55.62 | +| sea | 51.16 | 80.17 | +| mirror | 62.8 | 71.54 | +| rug | 64.09 | 75.43 | +| field | 30.16 | 43.97 | +| armchair | 43.55 | 63.89 | +| seat | 62.04 | 80.97 | +| fence | 41.02 | 60.82 | +| desk | 43.95 | 62.11 | +| rock | 33.56 | 50.84 | +| wardrobe | 44.32 | 63.66 | +| lamp | 60.59 | 73.38 | +| bathtub | 78.47 | 87.24 | +| railing | 28.41 | 40.99 | +| cushion | 56.3 | 65.46 | +| base | 25.51 | 34.94 | +| box | 26.04 | 36.63 | +| column | 43.21 | 51.4 | +| signboard | 37.15 | 45.98 | +| chest of drawers | 32.35 | 53.7 | +| counter | 35.73 | 48.76 | +| sand | 31.68 | 50.47 | +| sink | 71.54 | 77.75 | +| skyscraper | 51.2 | 61.78 | +| fireplace | 69.5 | 80.98 | +| refrigerator | 69.84 | 74.04 | +| grandstand | 34.82 | 69.02 | +| path | 26.04 | 32.85 | +| stairs | 23.97 | 30.15 | +| runway | 66.9 | 82.58 | +| case | 45.8 | 58.81 | +| pool table | 88.38 | 95.3 | +| pillow | 54.36 | 67.81 | +| screen door | 64.77 | 72.36 | +| stairway | 32.35 | 37.24 | +| river | 18.31 | 28.25 | +| bridge | 65.94 | 76.06 | +| bookcase | 33.75 | 58.31 | +| blind | 23.36 | 25.25 | +| coffee table | 60.47 | 73.8 | +| toilet | 84.32 | 89.25 | +| flower | 34.34 | 47.21 | +| book | 45.84 | 68.75 | +| hill | 7.23 | 10.15 | +| bench | 42.77 | 50.54 | +| countertop | 49.7 | 64.23 | +| stove | 76.68 | 84.53 | +| palm | 43.13 | 57.71 | +| kitchen island | 39.88 | 68.86 | +| computer | 72.84 | 84.36 | +| swivel chair | 39.51 | 48.32 | +| boat | 74.45 | 86.14 | +| bar | 34.83 | 39.63 | +| arcade machine | 31.36 | 33.21 | +| hovel | 12.45 | 14.89 | +| bus | 83.96 | 94.84 | +| towel | 61.58 | 73.28 | +| light | 45.53 | 51.34 | +| truck | 39.39 | 47.25 | +| tower | 38.6 | 51.6 | +| chandelier | 63.1 | 77.74 | +| awning | 25.5 | 30.41 | +| streetlight | 26.28 | 32.84 | +| booth | 43.43 | 44.05 | +| television receiver | 68.58 | 79.11 | +| airplane | 55.59 | 64.26 | +| dirt track | 1.45 | 6.54 | +| apparel | 35.26 | 52.31 | +| pole | 30.74 | 40.36 | +| land | 2.33 | 3.05 | +| bannister | 13.7 | 17.19 | +| escalator | 24.09 | 27.43 | +| ottoman | 46.9 | 65.15 | +| bottle | 26.71 | 32.22 | +| buffet | 36.29 | 38.65 | +| poster | 26.91 | 36.32 | +| stage | 10.76 | 16.91 | +| van | 36.14 | 48.57 | +| ship | 80.76 | 82.02 | +| fountain | 13.67 | 14.01 | +| conveyer belt | 75.48 | 80.98 | +| canopy | 18.59 | 22.26 | +| washer | 66.92 | 68.05 | +| plaything | 25.98 | 36.17 | +| swimming pool | 59.32 | 76.94 | +| stool | 40.35 | 56.89 | +| barrel | 39.41 | 50.95 | +| basket | 28.32 | 41.79 | +| waterfall | 51.48 | 63.02 | +| tent | 85.93 | 97.63 | +| bag | 13.28 | 16.56 | +| minibike | 72.26 | 82.2 | +| cradle | 74.3 | 92.93 | +| oven | 40.8 | 47.5 | +| ball | 36.76 | 41.13 | +| food | 53.0 | 58.1 | +| step | 17.68 | 20.6 | +| tank | 44.15 | 48.67 | +| trade name | 17.71 | 18.84 | +| microwave | 81.69 | 89.52 | +| pot | 46.62 | 52.74 | +| animal | 63.9 | 67.82 | +| bicycle | 54.91 | 71.51 | +| lake | 60.63 | 64.99 | +| dishwasher | 51.27 | 73.13 | +| screen | 61.1 | 83.47 | +| blanket | 13.17 | 16.43 | +| sculpture | 55.67 | 63.05 | +| hood | 53.16 | 57.9 | +| sconce | 35.11 | 43.09 | +| vase | 42.24 | 53.64 | +| traffic light | 33.8 | 48.73 | +| tray | 11.58 | 17.94 | +| ashcan | 37.87 | 48.14 | +| fan | 54.05 | 69.21 | +| pier | 48.46 | 73.12 | +| crt screen | 5.96 | 15.97 | +| plate | 55.58 | 70.21 | +| monitor | 14.35 | 17.44 | +| bulletin board | 32.64 | 40.3 | +| shower | 3.93 | 8.69 | +| radiator | 45.37 | 50.48 | +| glass | 14.51 | 16.86 | +| clock | 25.48 | 29.8 | +| flag | 29.75 | 33.87 | ++---------------------+-------+-------+ +2023/11/06 20:53:31 - mmengine - INFO - Iter(val) [209/209] coco/bbox_mAP: 0.4610 coco/bbox_mAP_50: 0.6360 coco/bbox_mAP_75: 0.5000 coco/bbox_mAP_s: 0.2820 coco/bbox_mAP_m: 0.5110 coco/bbox_mAP_l: 0.6050 coco/segm_mAP: 0.3140 coco/segm_mAP_50: 0.5580 coco/segm_mAP_75: 0.3070 coco/segm_mAP_s: 0.1550 coco/segm_mAP_m: 0.3590 coco/segm_mAP_l: 0.4850 Bleu_1: 0.7505 Bleu_2: 0.5851 Bleu_3: 0.4446 Bleu_4: 0.3353 METEOR: 0.2669 ROUGE_L: 0.5535 CIDEr: 1.0810 SPICE: 0.1982 aAcc: 82.0400 mIoU: 47.1100 mAcc: 57.7900 visual-grounding/miou: 0.7857 visual-grounding/acc: 0.8558 data_time: 0.1290 time: 0.6470 +2023/11/06 21:02:58 - mmengine - INFO - Iter(train) [520500/640000] base_lr: 1.8550e-05 lr: 3.5045e-06 eta: 1 day, 13:15:42 time: 1.1234 data_time: 0.0295 memory: 21519 grad_norm: 3.8447 loss: 1.1423 caption_loss_cls: 2.0124 grounding_loss_reg: 2.3530 detection_loss_cls: 0.0285 detection_loss_reg: 0.3174 semantic_segmentation_loss_cls: 0.0075 instance_segmentation_loss_cls: 0.0290 instance_segmentation_loss_reg: 0.3186 instance_segmentation_loss_poly: 0.8135 +2023/11/06 21:12:18 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231106_193813 +2023/11/06 21:12:18 - mmengine - INFO - Iter(train) [521000/640000] base_lr: 1.8416e-05 lr: 3.4923e-06 eta: 1 day, 13:05:24 time: 1.1221 data_time: 0.0295 memory: 21519 grad_norm: 3.8971 loss: 1.1451 caption_loss_cls: 2.0069 grounding_loss_reg: 2.3521 detection_loss_cls: 0.0285 detection_loss_reg: 0.3168 semantic_segmentation_loss_cls: 0.0075 instance_segmentation_loss_cls: 0.0289 instance_segmentation_loss_reg: 0.3185 instance_segmentation_loss_poly: 0.8140 +2023/11/06 21:12:18 - mmengine - INFO - Saving checkpoint at 521000 iterations +2023/11/06 21:22:01 - mmengine - INFO - Iter(train) [521500/640000] base_lr: 1.8282e-05 lr: 3.4802e-06 eta: 1 day, 13:05:22 time: 1.1249 data_time: 0.0331 memory: 21519 grad_norm: 3.9161 loss: 1.1527 caption_loss_cls: 2.0093 grounding_loss_reg: 2.3502 detection_loss_cls: 0.0285 detection_loss_reg: 0.3181 semantic_segmentation_loss_cls: 0.0075 instance_segmentation_loss_cls: 0.0290 instance_segmentation_loss_reg: 0.3192 instance_segmentation_loss_poly: 0.8150 +2023/11/06 21:30:32 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231106_193813 +2023/11/06 21:30:32 - mmengine - INFO - Iter(train) [522000/640000] base_lr: 1.8149e-05 lr: 3.4681e-06 eta: 1 day, 12:35:13 time: 1.1142 data_time: 0.0341 memory: 21519 grad_norm: 3.9585 loss: 1.1717 caption_loss_cls: 2.0082 grounding_loss_reg: 2.3493 detection_loss_cls: 0.0284 detection_loss_reg: 0.3170 semantic_segmentation_loss_cls: 0.0075 instance_segmentation_loss_cls: 0.0290 instance_segmentation_loss_reg: 0.3194 instance_segmentation_loss_poly: 0.8148 +2023/11/06 21:30:32 - mmengine - INFO - Saving checkpoint at 522000 iterations +2023/11/06 21:40:13 - mmengine - INFO - Iter(train) [522500/640000] base_lr: 1.8016e-05 lr: 3.4560e-06 eta: 1 day, 12:33:51 time: 1.1175 data_time: 0.0341 memory: 21519 grad_norm: 3.9776 loss: 1.1753 caption_loss_cls: 2.0084 grounding_loss_reg: 2.3491 detection_loss_cls: 0.0285 detection_loss_reg: 0.3170 semantic_segmentation_loss_cls: 0.0075 instance_segmentation_loss_cls: 0.0291 instance_segmentation_loss_reg: 0.3209 instance_segmentation_loss_poly: 0.8183 +2023/11/06 21:49:49 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231106_193813 +2023/11/06 21:49:49 - mmengine - INFO - Iter(train) [523000/640000] base_lr: 1.7884e-05 lr: 3.4440e-06 eta: 1 day, 12:29:39 time: 1.1289 data_time: 0.0343 memory: 21519 grad_norm: 3.9231 loss: 1.1594 caption_loss_cls: 2.0017 grounding_loss_reg: 2.3491 detection_loss_cls: 0.0287 detection_loss_reg: 0.3183 semantic_segmentation_loss_cls: 0.0075 instance_segmentation_loss_cls: 0.0292 instance_segmentation_loss_reg: 0.3219 instance_segmentation_loss_poly: 0.8204 +2023/11/06 21:49:49 - mmengine - INFO - Saving checkpoint at 523000 iterations +2023/11/06 21:59:32 - mmengine - INFO - Iter(train) [523500/640000] base_lr: 1.7752e-05 lr: 3.4320e-06 eta: 1 day, 12:26:40 time: 1.1319 data_time: 0.0342 memory: 21519 grad_norm: 3.9944 loss: 1.1639 caption_loss_cls: 2.0039 grounding_loss_reg: 2.3486 detection_loss_cls: 0.0287 detection_loss_reg: 0.3189 semantic_segmentation_loss_cls: 0.0075 instance_segmentation_loss_cls: 0.0292 instance_segmentation_loss_reg: 0.3216 instance_segmentation_loss_poly: 0.8201 +2023/11/06 22:08:44 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231106_193813 +2023/11/06 22:08:44 - mmengine - INFO - Iter(train) [524000/640000] base_lr: 1.7621e-05 lr: 3.4201e-06 eta: 1 day, 12:13:54 time: 1.1280 data_time: 0.0342 memory: 21519 grad_norm: 4.0097 loss: 1.1732 caption_loss_cls: 2.0029 grounding_loss_reg: 2.3469 detection_loss_cls: 0.0288 detection_loss_reg: 0.3199 semantic_segmentation_loss_cls: 0.0075 instance_segmentation_loss_cls: 0.0292 instance_segmentation_loss_reg: 0.3210 instance_segmentation_loss_poly: 0.8180 +2023/11/06 22:08:44 - mmengine - INFO - Saving checkpoint at 524000 iterations +2023/11/06 22:17:19 - mmengine - INFO - Iter(train) [524500/640000] base_lr: 1.7490e-05 lr: 3.4082e-06 eta: 1 day, 11:52:15 time: 1.1141 data_time: 0.0364 memory: 21519 grad_norm: 4.1142 loss: 1.1944 caption_loss_cls: 2.0046 grounding_loss_reg: 2.3487 detection_loss_cls: 0.0289 detection_loss_reg: 0.3197 semantic_segmentation_loss_cls: 0.0075 instance_segmentation_loss_cls: 0.0292 instance_segmentation_loss_reg: 0.3210 instance_segmentation_loss_poly: 0.8181 +2023/11/06 22:26:01 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231106_193813 +2023/11/06 22:26:01 - mmengine - INFO - Iter(train) [525000/640000] base_lr: 1.7360e-05 lr: 3.3963e-06 eta: 1 day, 11:34:03 time: 1.1048 data_time: 0.0360 memory: 21519 grad_norm: 4.1536 loss: 1.1970 caption_loss_cls: 2.0044 grounding_loss_reg: 2.3441 detection_loss_cls: 0.0288 detection_loss_reg: 0.3185 semantic_segmentation_loss_cls: 0.0075 instance_segmentation_loss_cls: 0.0291 instance_segmentation_loss_reg: 0.3201 instance_segmentation_loss_poly: 0.8161 +2023/11/06 22:26:01 - mmengine - INFO - Saving checkpoint at 525000 iterations +2023/11/06 22:34:54 - mmengine - INFO - Iter(train) [525500/640000] base_lr: 1.7230e-05 lr: 3.3845e-06 eta: 1 day, 11:19:21 time: 1.0924 data_time: 0.0358 memory: 21519 grad_norm: 4.1967 loss: 1.2047 caption_loss_cls: 2.0070 grounding_loss_reg: 2.3405 detection_loss_cls: 0.0289 detection_loss_reg: 0.3189 semantic_segmentation_loss_cls: 0.0075 instance_segmentation_loss_cls: 0.0292 instance_segmentation_loss_reg: 0.3202 instance_segmentation_loss_poly: 0.8172 +2023/11/06 22:44:08 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231106_193813 +2023/11/06 22:44:08 - mmengine - INFO - Iter(train) [526000/640000] base_lr: 1.7101e-05 lr: 3.3728e-06 eta: 1 day, 11:09:38 time: 1.1030 data_time: 0.0348 memory: 21519 grad_norm: 4.1189 loss: 1.1938 caption_loss_cls: 2.0067 grounding_loss_reg: 2.3373 detection_loss_cls: 0.0289 detection_loss_reg: 0.3183 semantic_segmentation_loss_cls: 0.0075 instance_segmentation_loss_cls: 0.0291 instance_segmentation_loss_reg: 0.3205 instance_segmentation_loss_poly: 0.8183 +2023/11/06 22:44:08 - mmengine - INFO - Saving checkpoint at 526000 iterations +2023/11/06 22:53:19 - mmengine - INFO - Iter(train) [526500/640000] base_lr: 1.6972e-05 lr: 3.3611e-06 eta: 1 day, 10:59:30 time: 1.0956 data_time: 0.0347 memory: 21519 grad_norm: 4.1373 loss: 1.1876 caption_loss_cls: 2.0024 grounding_loss_reg: 2.3332 detection_loss_cls: 0.0289 detection_loss_reg: 0.3190 semantic_segmentation_loss_cls: 0.0075 instance_segmentation_loss_cls: 0.0290 instance_segmentation_loss_reg: 0.3202 instance_segmentation_loss_poly: 0.8182 +2023/11/06 23:02:19 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231106_193813 +2023/11/06 23:02:19 - mmengine - INFO - Iter(train) [527000/640000] base_lr: 1.6844e-05 lr: 3.3494e-06 eta: 1 day, 10:47:22 time: 1.0865 data_time: 0.0348 memory: 21519 grad_norm: 4.2557 loss: 1.2100 caption_loss_cls: 1.9993 grounding_loss_reg: 2.3349 detection_loss_cls: 0.0290 detection_loss_reg: 0.3192 semantic_segmentation_loss_cls: 0.0075 instance_segmentation_loss_cls: 0.0290 instance_segmentation_loss_reg: 0.3198 instance_segmentation_loss_poly: 0.8177 +2023/11/06 23:02:19 - mmengine - INFO - Saving checkpoint at 527000 iterations +2023/11/06 23:11:48 - mmengine - INFO - Iter(train) [527500/640000] base_lr: 1.6716e-05 lr: 3.3378e-06 eta: 1 day, 10:40:42 time: 1.0830 data_time: 0.0348 memory: 21519 grad_norm: 4.2834 loss: 1.2140 caption_loss_cls: 1.9993 grounding_loss_reg: 2.3371 detection_loss_cls: 0.0290 detection_loss_reg: 0.3191 semantic_segmentation_loss_cls: 0.0075 instance_segmentation_loss_cls: 0.0290 instance_segmentation_loss_reg: 0.3200 instance_segmentation_loss_poly: 0.8178 +2023/11/06 23:20:29 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231106_193813 +2023/11/06 23:20:29 - mmengine - INFO - Iter(train) [528000/640000] base_lr: 1.6589e-05 lr: 3.3263e-06 eta: 1 day, 10:25:34 time: 1.0753 data_time: 0.0346 memory: 21519 grad_norm: 4.3001 loss: 1.2186 caption_loss_cls: 1.9989 grounding_loss_reg: 2.3378 detection_loss_cls: 0.0290 detection_loss_reg: 0.3194 semantic_segmentation_loss_cls: 0.0075 instance_segmentation_loss_cls: 0.0290 instance_segmentation_loss_reg: 0.3200 instance_segmentation_loss_poly: 0.8184 +2023/11/06 23:20:29 - mmengine - INFO - Saving checkpoint at 528000 iterations +2023/11/06 23:29:44 - mmengine - INFO - Iter(train) [528500/640000] base_lr: 1.6462e-05 lr: 3.3147e-06 eta: 1 day, 10:16:39 time: 1.0855 data_time: 0.0350 memory: 21519 grad_norm: 4.2874 loss: 1.2133 caption_loss_cls: 1.9970 grounding_loss_reg: 2.3406 detection_loss_cls: 0.0289 detection_loss_reg: 0.3192 semantic_segmentation_loss_cls: 0.0075 instance_segmentation_loss_cls: 0.0288 instance_segmentation_loss_reg: 0.3184 instance_segmentation_loss_poly: 0.8149 +2023/11/06 23:38:55 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231106_193813 +2023/11/06 23:38:55 - mmengine - INFO - Iter(train) [529000/640000] base_lr: 1.6336e-05 lr: 3.3033e-06 eta: 1 day, 10:06:54 time: 1.0925 data_time: 0.0352 memory: 21519 grad_norm: 4.2203 loss: 1.1996 caption_loss_cls: 1.9931 grounding_loss_reg: 2.3387 detection_loss_cls: 0.0289 detection_loss_reg: 0.3187 semantic_segmentation_loss_cls: 0.0075 instance_segmentation_loss_cls: 0.0288 instance_segmentation_loss_reg: 0.3189 instance_segmentation_loss_poly: 0.8155 +2023/11/06 23:38:55 - mmengine - INFO - Saving checkpoint at 529000 iterations +2023/11/06 23:48:42 - mmengine - INFO - Iter(train) [529500/640000] base_lr: 1.6210e-05 lr: 3.2918e-06 eta: 1 day, 10:02:41 time: 1.1061 data_time: 0.0353 memory: 21519 grad_norm: 4.1875 loss: 1.1854 caption_loss_cls: 1.9917 grounding_loss_reg: 2.3396 detection_loss_cls: 0.0287 detection_loss_reg: 0.3177 semantic_segmentation_loss_cls: 0.0075 instance_segmentation_loss_cls: 0.0289 instance_segmentation_loss_reg: 0.3196 instance_segmentation_loss_poly: 0.8180 +2023/11/06 23:57:59 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231106_193813 +2023/11/06 23:57:59 - mmengine - INFO - Iter(train) [530000/640000] base_lr: 1.6085e-05 lr: 3.2805e-06 eta: 1 day, 9:53:39 time: 1.1069 data_time: 0.0353 memory: 21519 grad_norm: 4.2010 loss: 1.1797 caption_loss_cls: 1.9911 grounding_loss_reg: 2.3366 detection_loss_cls: 0.0286 detection_loss_reg: 0.3176 semantic_segmentation_loss_cls: 0.0075 instance_segmentation_loss_cls: 0.0288 instance_segmentation_loss_reg: 0.3188 instance_segmentation_loss_poly: 0.8161 +2023/11/06 23:57:59 - mmengine - INFO - Saving checkpoint at 530000 iterations +2023/11/07 00:07:46 - mmengine - INFO - Iter(train) [530500/640000] base_lr: 1.5960e-05 lr: 3.2691e-06 eta: 1 day, 9:48:43 time: 1.1158 data_time: 0.0360 memory: 21519 grad_norm: 4.1794 loss: 1.1879 caption_loss_cls: 1.9929 grounding_loss_reg: 2.3354 detection_loss_cls: 0.0286 detection_loss_reg: 0.3177 semantic_segmentation_loss_cls: 0.0074 instance_segmentation_loss_cls: 0.0289 instance_segmentation_loss_reg: 0.3202 instance_segmentation_loss_poly: 0.8183 +2023/11/07 00:16:45 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231106_193813 +2023/11/07 00:16:45 - mmengine - INFO - Iter(train) [531000/640000] base_lr: 1.5836e-05 lr: 3.2578e-06 eta: 1 day, 9:37:14 time: 1.1156 data_time: 0.0358 memory: 21519 grad_norm: 4.1286 loss: 1.1749 caption_loss_cls: 1.9934 grounding_loss_reg: 2.3319 detection_loss_cls: 0.0287 detection_loss_reg: 0.3182 semantic_segmentation_loss_cls: 0.0074 instance_segmentation_loss_cls: 0.0288 instance_segmentation_loss_reg: 0.3200 instance_segmentation_loss_poly: 0.8177 +2023/11/07 00:16:45 - mmengine - INFO - Saving checkpoint at 531000 iterations +2023/11/07 00:26:18 - mmengine - INFO - Iter(train) [531500/640000] base_lr: 1.5713e-05 lr: 3.2466e-06 eta: 1 day, 9:30:10 time: 1.1166 data_time: 0.0356 memory: 21519 grad_norm: 4.0565 loss: 1.1611 caption_loss_cls: 1.9962 grounding_loss_reg: 2.3295 detection_loss_cls: 0.0287 detection_loss_reg: 0.3186 semantic_segmentation_loss_cls: 0.0074 instance_segmentation_loss_cls: 0.0289 instance_segmentation_loss_reg: 0.3206 instance_segmentation_loss_poly: 0.8190 +2023/11/07 00:35:17 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231106_193813 +2023/11/07 00:35:17 - mmengine - INFO - Iter(train) [532000/640000] base_lr: 1.5590e-05 lr: 3.2354e-06 eta: 1 day, 9:18:48 time: 1.1211 data_time: 0.0357 memory: 21519 grad_norm: 4.0606 loss: 1.1592 caption_loss_cls: 1.9942 grounding_loss_reg: 2.3305 detection_loss_cls: 0.0287 detection_loss_reg: 0.3183 semantic_segmentation_loss_cls: 0.0074 instance_segmentation_loss_cls: 0.0289 instance_segmentation_loss_reg: 0.3206 instance_segmentation_loss_poly: 0.8197 +2023/11/07 00:35:17 - mmengine - INFO - Saving checkpoint at 532000 iterations +2023/11/07 00:44:45 - mmengine - INFO - Iter(train) [532500/640000] base_lr: 1.5467e-05 lr: 3.2243e-06 eta: 1 day, 9:11:00 time: 1.1243 data_time: 0.0359 memory: 21519 grad_norm: 4.0702 loss: 1.1624 caption_loss_cls: 1.9939 grounding_loss_reg: 2.3276 detection_loss_cls: 0.0287 detection_loss_reg: 0.3185 semantic_segmentation_loss_cls: 0.0074 instance_segmentation_loss_cls: 0.0289 instance_segmentation_loss_reg: 0.3206 instance_segmentation_loss_poly: 0.8192 +2023/11/07 00:54:05 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231106_193813 +2023/11/07 00:54:05 - mmengine - INFO - Iter(train) [533000/640000] base_lr: 1.5345e-05 lr: 3.2132e-06 eta: 1 day, 9:02:04 time: 1.1265 data_time: 0.0359 memory: 21519 grad_norm: 4.0849 loss: 1.1636 caption_loss_cls: 1.9897 grounding_loss_reg: 2.3255 detection_loss_cls: 0.0287 detection_loss_reg: 0.3187 semantic_segmentation_loss_cls: 0.0074 instance_segmentation_loss_cls: 0.0290 instance_segmentation_loss_reg: 0.3208 instance_segmentation_loss_poly: 0.8195 +2023/11/07 00:54:05 - mmengine - INFO - Saving checkpoint at 533000 iterations +2023/11/07 01:03:06 - mmengine - INFO - Iter(train) [533500/640000] base_lr: 1.5223e-05 lr: 3.2021e-06 eta: 1 day, 8:51:13 time: 1.1149 data_time: 0.0357 memory: 21519 grad_norm: 4.1258 loss: 1.1708 caption_loss_cls: 1.9895 grounding_loss_reg: 2.3231 detection_loss_cls: 0.0287 detection_loss_reg: 0.3183 semantic_segmentation_loss_cls: 0.0074 instance_segmentation_loss_cls: 0.0290 instance_segmentation_loss_reg: 0.3214 instance_segmentation_loss_poly: 0.8208 +2023/11/07 01:11:55 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231106_193813 +2023/11/07 01:11:55 - mmengine - INFO - Iter(train) [534000/640000] base_lr: 1.5102e-05 lr: 3.1911e-06 eta: 1 day, 8:39:11 time: 1.1080 data_time: 0.0351 memory: 21519 grad_norm: 4.1298 loss: 1.1652 caption_loss_cls: 1.9876 grounding_loss_reg: 2.3215 detection_loss_cls: 0.0287 detection_loss_reg: 0.3180 semantic_segmentation_loss_cls: 0.0074 instance_segmentation_loss_cls: 0.0289 instance_segmentation_loss_reg: 0.3206 instance_segmentation_loss_poly: 0.8194 +2023/11/07 01:11:55 - mmengine - INFO - Saving checkpoint at 534000 iterations +2023/11/07 01:21:15 - mmengine - INFO - Iter(train) [534500/640000] base_lr: 1.4982e-05 lr: 3.1802e-06 eta: 1 day, 8:30:25 time: 1.1012 data_time: 0.0343 memory: 21519 grad_norm: 4.1140 loss: 1.1548 caption_loss_cls: 1.9855 grounding_loss_reg: 2.3192 detection_loss_cls: 0.0287 detection_loss_reg: 0.3186 semantic_segmentation_loss_cls: 0.0074 instance_segmentation_loss_cls: 0.0289 instance_segmentation_loss_reg: 0.3210 instance_segmentation_loss_poly: 0.8197 +2023/11/07 01:30:17 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231106_193813 +2023/11/07 01:30:17 - mmengine - INFO - Iter(train) [535000/640000] base_lr: 1.4862e-05 lr: 3.1692e-06 eta: 1 day, 8:19:55 time: 1.1020 data_time: 0.0344 memory: 21519 grad_norm: 4.1559 loss: 1.1674 caption_loss_cls: 1.9812 grounding_loss_reg: 2.3197 detection_loss_cls: 0.0287 detection_loss_reg: 0.3187 semantic_segmentation_loss_cls: 0.0074 instance_segmentation_loss_cls: 0.0289 instance_segmentation_loss_reg: 0.3217 instance_segmentation_loss_poly: 0.8216 +2023/11/07 01:30:17 - mmengine - INFO - Saving checkpoint at 535000 iterations +2023/11/07 01:39:46 - mmengine - INFO - Iter(train) [535500/640000] base_lr: 1.4742e-05 lr: 3.1584e-06 eta: 1 day, 8:12:04 time: 1.1010 data_time: 0.0344 memory: 21519 grad_norm: 4.1936 loss: 1.1680 caption_loss_cls: 1.9829 grounding_loss_reg: 2.3175 detection_loss_cls: 0.0286 detection_loss_reg: 0.3183 semantic_segmentation_loss_cls: 0.0074 instance_segmentation_loss_cls: 0.0289 instance_segmentation_loss_reg: 0.3216 instance_segmentation_loss_poly: 0.8216 +2023/11/07 01:49:03 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231106_193813 +2023/11/07 01:49:03 - mmengine - INFO - Iter(train) [536000/640000] base_lr: 1.4623e-05 lr: 3.1476e-06 eta: 1 day, 8:02:59 time: 1.1056 data_time: 0.0344 memory: 21519 grad_norm: 4.1978 loss: 1.1624 caption_loss_cls: 1.9811 grounding_loss_reg: 2.3162 detection_loss_cls: 0.0286 detection_loss_reg: 0.3185 semantic_segmentation_loss_cls: 0.0074 instance_segmentation_loss_cls: 0.0288 instance_segmentation_loss_reg: 0.3214 instance_segmentation_loss_poly: 0.8212 +2023/11/07 01:49:03 - mmengine - INFO - Saving checkpoint at 536000 iterations +2023/11/07 01:58:10 - mmengine - INFO - Iter(train) [536500/640000] base_lr: 1.4505e-05 lr: 3.1368e-06 eta: 1 day, 7:52:58 time: 1.1001 data_time: 0.0338 memory: 21519 grad_norm: 4.1691 loss: 1.1522 caption_loss_cls: 1.9804 grounding_loss_reg: 2.3143 detection_loss_cls: 0.0285 detection_loss_reg: 0.3188 semantic_segmentation_loss_cls: 0.0074 instance_segmentation_loss_cls: 0.0288 instance_segmentation_loss_reg: 0.3211 instance_segmentation_loss_poly: 0.8215 +2023/11/07 02:07:18 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231106_193813 +2023/11/07 02:07:18 - mmengine - INFO - Iter(train) [537000/640000] base_lr: 1.4387e-05 lr: 3.1261e-06 eta: 1 day, 7:43:08 time: 1.0974 data_time: 0.0336 memory: 21519 grad_norm: 4.1673 loss: 1.1550 caption_loss_cls: 1.9784 grounding_loss_reg: 2.3167 detection_loss_cls: 0.0285 detection_loss_reg: 0.3187 semantic_segmentation_loss_cls: 0.0074 instance_segmentation_loss_cls: 0.0287 instance_segmentation_loss_reg: 0.3202 instance_segmentation_loss_poly: 0.8193 +2023/11/07 02:07:18 - mmengine - INFO - Saving checkpoint at 537000 iterations +2023/11/07 02:17:00 - mmengine - INFO - Iter(train) [537500/640000] base_lr: 1.4269e-05 lr: 3.1154e-06 eta: 1 day, 7:36:10 time: 1.1075 data_time: 0.0338 memory: 21519 grad_norm: 4.1604 loss: 1.1494 caption_loss_cls: 1.9762 grounding_loss_reg: 2.3194 detection_loss_cls: 0.0285 detection_loss_reg: 0.3184 semantic_segmentation_loss_cls: 0.0074 instance_segmentation_loss_cls: 0.0286 instance_segmentation_loss_reg: 0.3199 instance_segmentation_loss_poly: 0.8183 +2023/11/07 02:26:15 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231106_193813 +2023/11/07 02:26:15 - mmengine - INFO - Iter(train) [538000/640000] base_lr: 1.4152e-05 lr: 3.1048e-06 eta: 1 day, 7:26:53 time: 1.1140 data_time: 0.0341 memory: 21519 grad_norm: 4.1251 loss: 1.1521 caption_loss_cls: 1.9762 grounding_loss_reg: 2.3168 detection_loss_cls: 0.0286 detection_loss_reg: 0.3191 semantic_segmentation_loss_cls: 0.0074 instance_segmentation_loss_cls: 0.0287 instance_segmentation_loss_reg: 0.3205 instance_segmentation_loss_poly: 0.8189 +2023/11/07 02:26:15 - mmengine - INFO - Saving checkpoint at 538000 iterations +2023/11/07 02:35:27 - mmengine - INFO - Iter(train) [538500/640000] base_lr: 1.4036e-05 lr: 3.0942e-06 eta: 1 day, 7:17:22 time: 1.1121 data_time: 0.0354 memory: 21519 grad_norm: 4.2078 loss: 1.1566 caption_loss_cls: 1.9725 grounding_loss_reg: 2.3140 detection_loss_cls: 0.0285 detection_loss_reg: 0.3172 semantic_segmentation_loss_cls: 0.0074 instance_segmentation_loss_cls: 0.0285 instance_segmentation_loss_reg: 0.3191 instance_segmentation_loss_poly: 0.8162 +2023/11/07 02:44:47 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231106_193813 +2023/11/07 02:44:47 - mmengine - INFO - Iter(train) [539000/640000] base_lr: 1.3920e-05 lr: 3.0837e-06 eta: 1 day, 7:08:30 time: 1.1167 data_time: 0.0357 memory: 21519 grad_norm: 4.1536 loss: 1.1531 caption_loss_cls: 1.9723 grounding_loss_reg: 2.3159 detection_loss_cls: 0.0285 detection_loss_reg: 0.3177 semantic_segmentation_loss_cls: 0.0074 instance_segmentation_loss_cls: 0.0285 instance_segmentation_loss_reg: 0.3199 instance_segmentation_loss_poly: 0.8171 +2023/11/07 02:44:47 - mmengine - INFO - Saving checkpoint at 539000 iterations +2023/11/07 02:54:14 - mmengine - INFO - Iter(train) [539500/640000] base_lr: 1.3805e-05 lr: 3.0732e-06 eta: 1 day, 7:00:04 time: 1.1159 data_time: 0.0357 memory: 21519 grad_norm: 4.1859 loss: 1.1592 caption_loss_cls: 1.9742 grounding_loss_reg: 2.3150 detection_loss_cls: 0.0285 detection_loss_reg: 0.3173 semantic_segmentation_loss_cls: 0.0074 instance_segmentation_loss_cls: 0.0285 instance_segmentation_loss_reg: 0.3190 instance_segmentation_loss_poly: 0.8148 +2023/11/07 03:03:40 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231106_193813 +2023/11/07 03:03:40 - mmengine - INFO - Iter(train) [540000/640000] base_lr: 1.3690e-05 lr: 3.0627e-06 eta: 1 day, 6:51:35 time: 1.1182 data_time: 0.0358 memory: 21519 grad_norm: 4.1447 loss: 1.1577 caption_loss_cls: 1.9735 grounding_loss_reg: 2.3140 detection_loss_cls: 0.0285 detection_loss_reg: 0.3174 semantic_segmentation_loss_cls: 0.0074 instance_segmentation_loss_cls: 0.0286 instance_segmentation_loss_reg: 0.3199 instance_segmentation_loss_poly: 0.8172 +2023/11/07 03:03:40 - mmengine - INFO - Saving checkpoint at 540000 iterations +2023/11/07 03:12:16 - mmengine - INFO - Evaluating bbox... +2023/11/07 03:13:12 - mmengine - INFO - bbox_mAP_copypaste: 0.462 0.637 0.503 0.290 0.511 0.609 +2023/11/07 03:13:12 - mmengine - INFO - Evaluating segm... +2023/11/07 03:14:22 - mmengine - INFO - segm_mAP_copypaste: 0.314 0.557 0.308 0.159 0.359 0.484 +2023/11/07 03:19:00 - mmengine - INFO - per class results: +2023/11/07 03:19:00 - mmengine - INFO - ++---------------------+-------+-------+ +| Class | IoU | Acc | ++---------------------+-------+-------+ +| wall | 76.02 | 87.35 | +| building | 79.8 | 89.66 | +| sky | 92.89 | 97.64 | +| floor | 79.74 | 90.1 | +| tree | 73.67 | 86.11 | +| ceiling | 82.95 | 94.96 | +| road | 81.85 | 88.61 | +| bed | 88.32 | 94.57 | +| windowpane | 60.56 | 79.0 | +| grass | 67.48 | 82.99 | +| cabinet | 60.46 | 72.95 | +| sidewalk | 66.39 | 82.31 | +| person | 79.95 | 91.21 | +| earth | 39.47 | 55.61 | +| door | 49.68 | 63.05 | +| table | 57.83 | 76.18 | +| mountain | 56.92 | 76.95 | +| plant | 52.97 | 65.15 | +| curtain | 67.26 | 81.27 | +| chair | 55.95 | 69.78 | +| car | 82.38 | 90.38 | +| water | 53.2 | 67.42 | +| painting | 71.73 | 85.6 | +| sofa | 65.86 | 76.84 | +| shelf | 42.7 | 64.84 | +| house | 45.23 | 77.01 | +| sea | 51.45 | 70.98 | +| mirror | 63.46 | 73.34 | +| rug | 61.35 | 70.26 | +| field | 30.6 | 42.98 | +| armchair | 44.66 | 68.49 | +| seat | 60.97 | 79.77 | +| fence | 41.71 | 59.87 | +| desk | 45.1 | 62.11 | +| rock | 31.54 | 46.74 | +| wardrobe | 48.07 | 62.66 | +| lamp | 60.45 | 73.43 | +| bathtub | 78.29 | 86.72 | +| railing | 28.02 | 42.26 | +| cushion | 56.24 | 68.48 | +| base | 26.68 | 35.43 | +| box | 24.52 | 30.98 | +| column | 48.8 | 59.16 | +| signboard | 36.9 | 48.32 | +| chest of drawers | 34.97 | 54.27 | +| counter | 27.78 | 37.29 | +| sand | 35.86 | 46.57 | +| sink | 72.13 | 77.6 | +| skyscraper | 36.18 | 43.54 | +| fireplace | 73.52 | 88.47 | +| refrigerator | 75.39 | 82.89 | +| grandstand | 33.83 | 64.53 | +| path | 28.05 | 38.43 | +| stairs | 27.83 | 34.65 | +| runway | 65.87 | 76.65 | +| case | 45.66 | 56.63 | +| pool table | 86.58 | 95.51 | +| pillow | 58.93 | 72.09 | +| screen door | 67.93 | 74.76 | +| stairway | 34.77 | 41.39 | +| river | 15.04 | 29.77 | +| bridge | 50.53 | 56.75 | +| bookcase | 34.09 | 58.19 | +| blind | 22.56 | 24.33 | +| coffee table | 58.17 | 83.98 | +| toilet | 83.19 | 89.54 | +| flower | 33.39 | 45.15 | +| book | 45.17 | 66.63 | +| hill | 10.05 | 19.71 | +| bench | 46.2 | 53.17 | +| countertop | 50.01 | 64.09 | +| stove | 76.19 | 84.3 | +| palm | 43.44 | 54.53 | +| kitchen island | 40.89 | 69.39 | +| computer | 69.08 | 79.42 | +| swivel chair | 41.64 | 50.83 | +| boat | 68.1 | 87.65 | +| bar | 27.58 | 33.91 | +| arcade machine | 36.09 | 37.95 | +| hovel | 8.16 | 9.5 | +| bus | 87.32 | 94.9 | +| towel | 60.65 | 74.28 | +| light | 47.94 | 55.46 | +| truck | 38.44 | 47.67 | +| tower | 12.31 | 15.61 | +| chandelier | 63.93 | 78.07 | +| awning | 24.0 | 28.27 | +| streetlight | 26.78 | 32.31 | +| booth | 46.31 | 47.57 | +| television receiver | 69.47 | 80.36 | +| airplane | 57.66 | 66.13 | +| dirt track | 0.39 | 1.7 | +| apparel | 32.47 | 47.99 | +| pole | 32.69 | 48.04 | +| land | 0.18 | 0.24 | +| bannister | 14.06 | 17.68 | +| escalator | 20.95 | 21.67 | +| ottoman | 46.38 | 66.33 | +| bottle | 26.12 | 32.12 | +| buffet | 42.74 | 52.85 | +| poster | 28.39 | 37.55 | +| stage | 14.85 | 27.28 | +| van | 44.56 | 62.51 | +| ship | 41.66 | 44.03 | +| fountain | 19.46 | 19.95 | +| conveyer belt | 76.13 | 79.23 | +| canopy | 27.62 | 32.78 | +| washer | 66.84 | 69.09 | +| plaything | 30.04 | 47.17 | +| swimming pool | 53.46 | 70.56 | +| stool | 43.42 | 57.24 | +| barrel | 19.3 | 24.79 | +| basket | 29.5 | 42.08 | +| waterfall | 51.11 | 64.18 | +| tent | 90.35 | 97.67 | +| bag | 12.38 | 14.0 | +| minibike | 74.0 | 84.9 | +| cradle | 67.69 | 84.08 | +| oven | 41.5 | 50.64 | +| ball | 43.02 | 47.21 | +| food | 57.9 | 65.81 | +| step | 15.66 | 18.15 | +| tank | 44.71 | 50.2 | +| trade name | 24.18 | 29.23 | +| microwave | 81.44 | 90.36 | +| pot | 48.58 | 55.04 | +| animal | 60.23 | 62.76 | +| bicycle | 55.9 | 72.23 | +| lake | 62.04 | 67.34 | +| dishwasher | 52.52 | 73.42 | +| screen | 62.01 | 87.53 | +| blanket | 15.06 | 19.24 | +| sculpture | 52.12 | 60.94 | +| hood | 58.49 | 63.62 | +| sconce | 35.33 | 44.31 | +| vase | 41.63 | 52.73 | +| traffic light | 34.77 | 53.19 | +| tray | 10.35 | 15.9 | +| ashcan | 41.56 | 54.92 | +| fan | 53.95 | 66.47 | +| pier | 51.44 | 68.8 | +| crt screen | 5.03 | 12.75 | +| plate | 55.38 | 72.8 | +| monitor | 18.87 | 23.42 | +| bulletin board | 32.99 | 42.11 | +| shower | 4.02 | 8.83 | +| radiator | 48.96 | 54.6 | +| glass | 16.58 | 18.29 | +| clock | 26.05 | 31.11 | +| flag | 29.73 | 35.65 | ++---------------------+-------+-------+ +2023/11/07 03:19:16 - mmengine - INFO - Iter(val) [209/209] coco/bbox_mAP: 0.4620 coco/bbox_mAP_50: 0.6370 coco/bbox_mAP_75: 0.5030 coco/bbox_mAP_s: 0.2900 coco/bbox_mAP_m: 0.5110 coco/bbox_mAP_l: 0.6090 coco/segm_mAP: 0.3140 coco/segm_mAP_50: 0.5570 coco/segm_mAP_75: 0.3080 coco/segm_mAP_s: 0.1590 coco/segm_mAP_m: 0.3590 coco/segm_mAP_l: 0.4840 Bleu_1: 0.7567 Bleu_2: 0.5946 Bleu_3: 0.4551 Bleu_4: 0.3451 METEOR: 0.2698 ROUGE_L: 0.5587 CIDEr: 1.1006 SPICE: 0.2011 aAcc: 82.0700 mIoU: 47.0600 mAcc: 57.9400 visual-grounding/miou: 0.7855 visual-grounding/acc: 0.8543 data_time: 0.0045 time: 0.5226 +2023/11/07 03:28:42 - mmengine - INFO - Iter(train) [540500/640000] base_lr: 1.3576e-05 lr: 3.0523e-06 eta: 1 day, 6:43:10 time: 1.1236 data_time: 0.0336 memory: 21519 grad_norm: 4.1358 loss: 1.1642 caption_loss_cls: 1.9733 grounding_loss_reg: 2.3135 detection_loss_cls: 0.0287 detection_loss_reg: 0.3187 semantic_segmentation_loss_cls: 0.0074 instance_segmentation_loss_cls: 0.0288 instance_segmentation_loss_reg: 0.3212 instance_segmentation_loss_poly: 0.8199 +2023/11/07 03:37:39 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231106_193813 +2023/11/07 03:37:39 - mmengine - INFO - Iter(train) [541000/640000] base_lr: 1.3462e-05 lr: 3.0420e-06 eta: 1 day, 6:32:37 time: 1.1210 data_time: 0.0340 memory: 21519 grad_norm: 4.1770 loss: 1.1744 caption_loss_cls: 1.9746 grounding_loss_reg: 2.3109 detection_loss_cls: 0.0287 detection_loss_reg: 0.3191 semantic_segmentation_loss_cls: 0.0074 instance_segmentation_loss_cls: 0.0289 instance_segmentation_loss_reg: 0.3216 instance_segmentation_loss_poly: 0.8208 +2023/11/07 03:37:39 - mmengine - INFO - Saving checkpoint at 541000 iterations +2023/11/07 03:47:34 - mmengine - INFO - Iter(train) [541500/640000] base_lr: 1.3349e-05 lr: 3.0317e-06 eta: 1 day, 6:26:00 time: 1.1242 data_time: 0.0341 memory: 21519 grad_norm: 4.0795 loss: 1.1676 caption_loss_cls: 1.9719 grounding_loss_reg: 2.3100 detection_loss_cls: 0.0288 detection_loss_reg: 0.3202 semantic_segmentation_loss_cls: 0.0074 instance_segmentation_loss_cls: 0.0288 instance_segmentation_loss_reg: 0.3210 instance_segmentation_loss_poly: 0.8201 +2023/11/07 03:57:27 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231106_193813 +2023/11/07 03:57:27 - mmengine - INFO - Iter(train) [542000/640000] base_lr: 1.3236e-05 lr: 3.0215e-06 eta: 1 day, 6:19:04 time: 1.1336 data_time: 0.0347 memory: 21519 grad_norm: 4.0639 loss: 1.1588 caption_loss_cls: 1.9688 grounding_loss_reg: 2.3079 detection_loss_cls: 0.0287 detection_loss_reg: 0.3190 semantic_segmentation_loss_cls: 0.0074 instance_segmentation_loss_cls: 0.0288 instance_segmentation_loss_reg: 0.3212 instance_segmentation_loss_poly: 0.8204 +2023/11/07 03:57:27 - mmengine - INFO - Saving checkpoint at 542000 iterations +2023/11/07 04:07:01 - mmengine - INFO - Iter(train) [542500/640000] base_lr: 1.3124e-05 lr: 3.0113e-06 eta: 1 day, 6:10:53 time: 1.1392 data_time: 0.0337 memory: 21519 grad_norm: 4.0262 loss: 1.1611 caption_loss_cls: 1.9700 grounding_loss_reg: 2.3077 detection_loss_cls: 0.0287 detection_loss_reg: 0.3193 semantic_segmentation_loss_cls: 0.0074 instance_segmentation_loss_cls: 0.0287 instance_segmentation_loss_reg: 0.3205 instance_segmentation_loss_poly: 0.8184 +2023/11/07 04:16:43 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231106_193813 +2023/11/07 04:16:43 - mmengine - INFO - Iter(train) [543000/640000] base_lr: 1.3012e-05 lr: 3.0011e-06 eta: 1 day, 6:03:06 time: 1.1445 data_time: 0.0335 memory: 21519 grad_norm: 3.9895 loss: 1.1442 caption_loss_cls: 1.9718 grounding_loss_reg: 2.3063 detection_loss_cls: 0.0286 detection_loss_reg: 0.3183 semantic_segmentation_loss_cls: 0.0074 instance_segmentation_loss_cls: 0.0286 instance_segmentation_loss_reg: 0.3191 instance_segmentation_loss_poly: 0.8156 +2023/11/07 04:16:43 - mmengine - INFO - Saving checkpoint at 543000 iterations +2023/11/07 04:25:59 - mmengine - INFO - Iter(train) [543500/640000] base_lr: 1.2901e-05 lr: 2.9910e-06 eta: 1 day, 5:53:38 time: 1.1418 data_time: 0.0335 memory: 21519 grad_norm: 3.9147 loss: 1.1362 caption_loss_cls: 1.9703 grounding_loss_reg: 2.3059 detection_loss_cls: 0.0286 detection_loss_reg: 0.3182 semantic_segmentation_loss_cls: 0.0074 instance_segmentation_loss_cls: 0.0285 instance_segmentation_loss_reg: 0.3192 instance_segmentation_loss_poly: 0.8163 +2023/11/07 04:35:10 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231106_193813 +2023/11/07 04:35:10 - mmengine - INFO - Iter(train) [544000/640000] base_lr: 1.2791e-05 lr: 2.9810e-06 eta: 1 day, 5:43:55 time: 1.1380 data_time: 0.0333 memory: 21519 grad_norm: 3.9723 loss: 1.1371 caption_loss_cls: 1.9711 grounding_loss_reg: 2.3016 detection_loss_cls: 0.0284 detection_loss_reg: 0.3176 semantic_segmentation_loss_cls: 0.0073 instance_segmentation_loss_cls: 0.0284 instance_segmentation_loss_reg: 0.3184 instance_segmentation_loss_poly: 0.8145 +2023/11/07 04:35:10 - mmengine - INFO - Saving checkpoint at 544000 iterations +2023/11/07 04:44:38 - mmengine - INFO - Iter(train) [544500/640000] base_lr: 1.2681e-05 lr: 2.9710e-06 eta: 1 day, 5:35:13 time: 1.1380 data_time: 0.0358 memory: 21519 grad_norm: 3.9701 loss: 1.1281 caption_loss_cls: 1.9669 grounding_loss_reg: 2.3036 detection_loss_cls: 0.0283 detection_loss_reg: 0.3169 semantic_segmentation_loss_cls: 0.0073 instance_segmentation_loss_cls: 0.0284 instance_segmentation_loss_reg: 0.3183 instance_segmentation_loss_poly: 0.8151 +2023/11/07 04:54:03 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231106_193813 +2023/11/07 04:54:03 - mmengine - INFO - Iter(train) [545000/640000] base_lr: 1.2571e-05 lr: 2.9610e-06 eta: 1 day, 5:26:20 time: 1.1450 data_time: 0.0357 memory: 21519 grad_norm: 3.9376 loss: 1.1168 caption_loss_cls: 1.9641 grounding_loss_reg: 2.3048 detection_loss_cls: 0.0282 detection_loss_reg: 0.3166 semantic_segmentation_loss_cls: 0.0073 instance_segmentation_loss_cls: 0.0284 instance_segmentation_loss_reg: 0.3184 instance_segmentation_loss_poly: 0.8156 +2023/11/07 04:54:03 - mmengine - INFO - Saving checkpoint at 545000 iterations +2023/11/07 05:03:22 - mmengine - INFO - Iter(train) [545500/640000] base_lr: 1.2462e-05 lr: 2.9511e-06 eta: 1 day, 5:17:03 time: 1.1358 data_time: 0.0353 memory: 21519 grad_norm: 4.0305 loss: 1.1213 caption_loss_cls: 1.9641 grounding_loss_reg: 2.3054 detection_loss_cls: 0.0282 detection_loss_reg: 0.3163 semantic_segmentation_loss_cls: 0.0073 instance_segmentation_loss_cls: 0.0282 instance_segmentation_loss_reg: 0.3170 instance_segmentation_loss_poly: 0.8121 +2023/11/07 05:12:17 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231106_193813 +2023/11/07 05:12:17 - mmengine - INFO - Iter(train) [546000/640000] base_lr: 1.2354e-05 lr: 2.9412e-06 eta: 1 day, 5:06:31 time: 1.1215 data_time: 0.0355 memory: 21519 grad_norm: 4.1278 loss: 1.1385 caption_loss_cls: 1.9611 grounding_loss_reg: 2.3069 detection_loss_cls: 0.0280 detection_loss_reg: 0.3151 semantic_segmentation_loss_cls: 0.0073 instance_segmentation_loss_cls: 0.0283 instance_segmentation_loss_reg: 0.3173 instance_segmentation_loss_poly: 0.8121 +2023/11/07 05:12:17 - mmengine - INFO - Saving checkpoint at 546000 iterations +2023/11/07 05:21:45 - mmengine - INFO - Iter(train) [546500/640000] base_lr: 1.2246e-05 lr: 2.9314e-06 eta: 1 day, 4:57:45 time: 1.1199 data_time: 0.0354 memory: 21519 grad_norm: 4.1585 loss: 1.1402 caption_loss_cls: 1.9612 grounding_loss_reg: 2.3039 detection_loss_cls: 0.0280 detection_loss_reg: 0.3150 semantic_segmentation_loss_cls: 0.0073 instance_segmentation_loss_cls: 0.0282 instance_segmentation_loss_reg: 0.3165 instance_segmentation_loss_poly: 0.8100 +2023/11/07 05:30:49 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231106_193813 +2023/11/07 05:30:49 - mmengine - INFO - Iter(train) [547000/640000] base_lr: 1.2138e-05 lr: 2.9217e-06 eta: 1 day, 4:47:43 time: 1.1104 data_time: 0.0355 memory: 21519 grad_norm: 4.2515 loss: 1.1526 caption_loss_cls: 1.9618 grounding_loss_reg: 2.3023 detection_loss_cls: 0.0279 detection_loss_reg: 0.3148 semantic_segmentation_loss_cls: 0.0073 instance_segmentation_loss_cls: 0.0282 instance_segmentation_loss_reg: 0.3163 instance_segmentation_loss_poly: 0.8101 +2023/11/07 05:30:49 - mmengine - INFO - Saving checkpoint at 547000 iterations +2023/11/07 05:40:20 - mmengine - INFO - Iter(train) [547500/640000] base_lr: 1.2031e-05 lr: 2.9119e-06 eta: 1 day, 4:39:07 time: 1.1144 data_time: 0.0355 memory: 21519 grad_norm: 4.2805 loss: 1.1582 caption_loss_cls: 1.9616 grounding_loss_reg: 2.3036 detection_loss_cls: 0.0279 detection_loss_reg: 0.3145 semantic_segmentation_loss_cls: 0.0073 instance_segmentation_loss_cls: 0.0281 instance_segmentation_loss_reg: 0.3152 instance_segmentation_loss_poly: 0.8084 +2023/11/07 05:49:56 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231106_193813 +2023/11/07 05:49:56 - mmengine - INFO - Iter(train) [548000/640000] base_lr: 1.1925e-05 lr: 2.9023e-06 eta: 1 day, 4:30:42 time: 1.1206 data_time: 0.0359 memory: 21519 grad_norm: 4.2498 loss: 1.1671 caption_loss_cls: 1.9637 grounding_loss_reg: 2.2992 detection_loss_cls: 0.0279 detection_loss_reg: 0.3136 semantic_segmentation_loss_cls: 0.0073 instance_segmentation_loss_cls: 0.0281 instance_segmentation_loss_reg: 0.3157 instance_segmentation_loss_poly: 0.8088 +2023/11/07 05:49:56 - mmengine - INFO - Saving checkpoint at 548000 iterations +2023/11/07 05:59:19 - mmengine - INFO - Iter(train) [548500/640000] base_lr: 1.1819e-05 lr: 2.8927e-06 eta: 1 day, 4:21:39 time: 1.1194 data_time: 0.0358 memory: 21519 grad_norm: 4.2229 loss: 1.1589 caption_loss_cls: 1.9663 grounding_loss_reg: 2.2982 detection_loss_cls: 0.0279 detection_loss_reg: 0.3133 semantic_segmentation_loss_cls: 0.0073 instance_segmentation_loss_cls: 0.0281 instance_segmentation_loss_reg: 0.3156 instance_segmentation_loss_poly: 0.8087 +2023/11/07 06:08:37 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231106_193813 +2023/11/07 06:08:37 - mmengine - INFO - Iter(train) [549000/640000] base_lr: 1.1714e-05 lr: 2.8831e-06 eta: 1 day, 4:12:19 time: 1.1175 data_time: 0.0358 memory: 21519 grad_norm: 4.2327 loss: 1.1646 caption_loss_cls: 1.9685 grounding_loss_reg: 2.2990 detection_loss_cls: 0.0278 detection_loss_reg: 0.3138 semantic_segmentation_loss_cls: 0.0073 instance_segmentation_loss_cls: 0.0281 instance_segmentation_loss_reg: 0.3151 instance_segmentation_loss_poly: 0.8072 +2023/11/07 06:08:37 - mmengine - INFO - Saving checkpoint at 549000 iterations +2023/11/07 06:18:25 - mmengine - INFO - Iter(train) [549500/640000] base_lr: 1.1609e-05 lr: 2.8736e-06 eta: 1 day, 4:04:22 time: 1.1247 data_time: 0.0361 memory: 21519 grad_norm: 4.1787 loss: 1.1620 caption_loss_cls: 1.9704 grounding_loss_reg: 2.2982 detection_loss_cls: 0.0278 detection_loss_reg: 0.3133 semantic_segmentation_loss_cls: 0.0073 instance_segmentation_loss_cls: 0.0280 instance_segmentation_loss_reg: 0.3154 instance_segmentation_loss_poly: 0.8068 +2023/11/07 06:27:32 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231106_193813 +2023/11/07 06:27:32 - mmengine - INFO - Iter(train) [550000/640000] base_lr: 1.1505e-05 lr: 2.8641e-06 eta: 1 day, 3:54:34 time: 1.1278 data_time: 0.0356 memory: 21519 grad_norm: 4.1310 loss: 1.1497 caption_loss_cls: 1.9699 grounding_loss_reg: 2.3006 detection_loss_cls: 0.0278 detection_loss_reg: 0.3128 semantic_segmentation_loss_cls: 0.0073 instance_segmentation_loss_cls: 0.0280 instance_segmentation_loss_reg: 0.3155 instance_segmentation_loss_poly: 0.8077 +2023/11/07 06:27:32 - mmengine - INFO - Saving checkpoint at 550000 iterations +2023/11/07 06:36:37 - mmengine - INFO - Iter(train) [550500/640000] base_lr: 1.1402e-05 lr: 2.8547e-06 eta: 1 day, 3:44:39 time: 1.1221 data_time: 0.0356 memory: 21519 grad_norm: 4.1432 loss: 1.1555 caption_loss_cls: 1.9724 grounding_loss_reg: 2.2985 detection_loss_cls: 0.0279 detection_loss_reg: 0.3135 semantic_segmentation_loss_cls: 0.0073 instance_segmentation_loss_cls: 0.0280 instance_segmentation_loss_reg: 0.3151 instance_segmentation_loss_poly: 0.8064 +2023/11/07 06:45:56 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231106_193813 +2023/11/07 06:45:56 - mmengine - INFO - Iter(train) [551000/640000] base_lr: 1.1299e-05 lr: 2.8453e-06 eta: 1 day, 3:35:22 time: 1.1259 data_time: 0.0358 memory: 21519 grad_norm: 4.1273 loss: 1.1573 caption_loss_cls: 1.9685 grounding_loss_reg: 2.3020 detection_loss_cls: 0.0278 detection_loss_reg: 0.3123 semantic_segmentation_loss_cls: 0.0073 instance_segmentation_loss_cls: 0.0279 instance_segmentation_loss_reg: 0.3154 instance_segmentation_loss_poly: 0.8063 +2023/11/07 06:45:57 - mmengine - INFO - Saving checkpoint at 551000 iterations +2023/11/07 06:55:31 - mmengine - INFO - Iter(train) [551500/640000] base_lr: 1.1196e-05 lr: 2.8360e-06 eta: 1 day, 3:26:45 time: 1.1267 data_time: 0.0362 memory: 21519 grad_norm: 4.1438 loss: 1.1667 caption_loss_cls: 1.9655 grounding_loss_reg: 2.3016 detection_loss_cls: 0.0279 detection_loss_reg: 0.3132 semantic_segmentation_loss_cls: 0.0073 instance_segmentation_loss_cls: 0.0279 instance_segmentation_loss_reg: 0.3154 instance_segmentation_loss_poly: 0.8060 +2023/11/07 07:04:42 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231106_193813 +2023/11/07 07:04:42 - mmengine - INFO - Iter(train) [552000/640000] base_lr: 1.1094e-05 lr: 2.8267e-06 eta: 1 day, 3:17:06 time: 1.1203 data_time: 0.0358 memory: 21519 grad_norm: 4.1445 loss: 1.1562 caption_loss_cls: 1.9639 grounding_loss_reg: 2.2989 detection_loss_cls: 0.0278 detection_loss_reg: 0.3135 semantic_segmentation_loss_cls: 0.0073 instance_segmentation_loss_cls: 0.0279 instance_segmentation_loss_reg: 0.3150 instance_segmentation_loss_poly: 0.8056 +2023/11/07 07:04:42 - mmengine - INFO - Saving checkpoint at 552000 iterations +2023/11/07 07:13:58 - mmengine - INFO - Iter(train) [552500/640000] base_lr: 1.0993e-05 lr: 2.8175e-06 eta: 1 day, 3:07:43 time: 1.1187 data_time: 0.0358 memory: 21519 grad_norm: 4.1889 loss: 1.1628 caption_loss_cls: 1.9652 grounding_loss_reg: 2.2993 detection_loss_cls: 0.0278 detection_loss_reg: 0.3131 semantic_segmentation_loss_cls: 0.0073 instance_segmentation_loss_cls: 0.0279 instance_segmentation_loss_reg: 0.3148 instance_segmentation_loss_poly: 0.8052 +2023/11/07 07:23:09 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231106_193813 +2023/11/07 07:23:09 - mmengine - INFO - Iter(train) [553000/640000] base_lr: 1.0892e-05 lr: 2.8083e-06 eta: 1 day, 2:58:08 time: 1.1170 data_time: 0.0357 memory: 21519 grad_norm: 4.1862 loss: 1.1525 caption_loss_cls: 1.9641 grounding_loss_reg: 2.3000 detection_loss_cls: 0.0278 detection_loss_reg: 0.3127 semantic_segmentation_loss_cls: 0.0073 instance_segmentation_loss_cls: 0.0278 instance_segmentation_loss_reg: 0.3147 instance_segmentation_loss_poly: 0.8050 +2023/11/07 07:23:09 - mmengine - INFO - Saving checkpoint at 553000 iterations +2023/11/07 07:32:53 - mmengine - INFO - Iter(train) [553500/640000] base_lr: 1.0791e-05 lr: 2.7992e-06 eta: 1 day, 2:49:49 time: 1.1161 data_time: 0.0358 memory: 21519 grad_norm: 4.2402 loss: 1.1619 caption_loss_cls: 1.9684 grounding_loss_reg: 2.2997 detection_loss_cls: 0.0277 detection_loss_reg: 0.3124 semantic_segmentation_loss_cls: 0.0072 instance_segmentation_loss_cls: 0.0276 instance_segmentation_loss_reg: 0.3138 instance_segmentation_loss_poly: 0.8030 +2023/11/07 07:42:41 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231106_193813 +2023/11/07 07:42:41 - mmengine - INFO - Iter(train) [554000/640000] base_lr: 1.0691e-05 lr: 2.7901e-06 eta: 1 day, 2:41:38 time: 1.1260 data_time: 0.0360 memory: 21519 grad_norm: 4.2668 loss: 1.1678 caption_loss_cls: 1.9678 grounding_loss_reg: 2.2983 detection_loss_cls: 0.0276 detection_loss_reg: 0.3119 semantic_segmentation_loss_cls: 0.0072 instance_segmentation_loss_cls: 0.0276 instance_segmentation_loss_reg: 0.3140 instance_segmentation_loss_poly: 0.8031 +2023/11/07 07:42:41 - mmengine - INFO - Saving checkpoint at 554000 iterations +2023/11/07 07:51:27 - mmengine - INFO - Iter(train) [554500/640000] base_lr: 1.0592e-05 lr: 2.7811e-06 eta: 1 day, 2:31:05 time: 1.1215 data_time: 0.0357 memory: 21519 grad_norm: 4.2773 loss: 1.1708 caption_loss_cls: 1.9694 grounding_loss_reg: 2.2974 detection_loss_cls: 0.0277 detection_loss_reg: 0.3122 semantic_segmentation_loss_cls: 0.0072 instance_segmentation_loss_cls: 0.0276 instance_segmentation_loss_reg: 0.3133 instance_segmentation_loss_poly: 0.8019 +2023/11/07 08:01:02 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231106_193813 +2023/11/07 08:01:02 - mmengine - INFO - Iter(train) [555000/640000] base_lr: 1.0493e-05 lr: 2.7721e-06 eta: 1 day, 2:22:23 time: 1.1254 data_time: 0.0358 memory: 21519 grad_norm: 4.2502 loss: 1.1686 caption_loss_cls: 1.9702 grounding_loss_reg: 2.2963 detection_loss_cls: 0.0276 detection_loss_reg: 0.3109 semantic_segmentation_loss_cls: 0.0072 instance_segmentation_loss_cls: 0.0277 instance_segmentation_loss_reg: 0.3134 instance_segmentation_loss_poly: 0.8024 +2023/11/07 08:01:02 - mmengine - INFO - Saving checkpoint at 555000 iterations +2023/11/07 08:11:00 - mmengine - INFO - Iter(train) [555500/640000] base_lr: 1.0395e-05 lr: 2.7632e-06 eta: 1 day, 2:14:29 time: 1.1312 data_time: 0.0359 memory: 21519 grad_norm: 4.2303 loss: 1.1582 caption_loss_cls: 1.9702 grounding_loss_reg: 2.2982 detection_loss_cls: 0.0276 detection_loss_reg: 0.3105 semantic_segmentation_loss_cls: 0.0072 instance_segmentation_loss_cls: 0.0277 instance_segmentation_loss_reg: 0.3135 instance_segmentation_loss_poly: 0.8027 +2023/11/07 08:20:06 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231106_193813 +2023/11/07 08:20:06 - mmengine - INFO - Iter(train) [556000/640000] base_lr: 1.0298e-05 lr: 2.7543e-06 eta: 1 day, 2:04:41 time: 1.1300 data_time: 0.0359 memory: 21519 grad_norm: 4.2474 loss: 1.1587 caption_loss_cls: 1.9661 grounding_loss_reg: 2.2985 detection_loss_cls: 0.0276 detection_loss_reg: 0.3106 semantic_segmentation_loss_cls: 0.0072 instance_segmentation_loss_cls: 0.0277 instance_segmentation_loss_reg: 0.3134 instance_segmentation_loss_poly: 0.8018 +2023/11/07 08:20:06 - mmengine - INFO - Saving checkpoint at 556000 iterations +2023/11/07 08:29:27 - mmengine - INFO - Iter(train) [556500/640000] base_lr: 1.0200e-05 lr: 2.7455e-06 eta: 1 day, 1:55:26 time: 1.1312 data_time: 0.0361 memory: 21519 grad_norm: 4.2411 loss: 1.1599 caption_loss_cls: 1.9669 grounding_loss_reg: 2.2963 detection_loss_cls: 0.0277 detection_loss_reg: 0.3109 semantic_segmentation_loss_cls: 0.0072 instance_segmentation_loss_cls: 0.0277 instance_segmentation_loss_reg: 0.3137 instance_segmentation_loss_poly: 0.8030 +2023/11/07 08:38:35 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231106_193813 +2023/11/07 08:38:35 - mmengine - INFO - Iter(train) [557000/640000] base_lr: 1.0104e-05 lr: 2.7367e-06 eta: 1 day, 1:45:43 time: 1.1303 data_time: 0.0360 memory: 21519 grad_norm: 4.2722 loss: 1.1669 caption_loss_cls: 1.9649 grounding_loss_reg: 2.2929 detection_loss_cls: 0.0276 detection_loss_reg: 0.3113 semantic_segmentation_loss_cls: 0.0072 instance_segmentation_loss_cls: 0.0277 instance_segmentation_loss_reg: 0.3137 instance_segmentation_loss_poly: 0.8025 +2023/11/07 08:38:35 - mmengine - INFO - Saving checkpoint at 557000 iterations +2023/11/07 08:47:26 - mmengine - INFO - Iter(train) [557500/640000] base_lr: 1.0008e-05 lr: 2.7280e-06 eta: 1 day, 1:35:27 time: 1.1171 data_time: 0.0356 memory: 21519 grad_norm: 4.2760 loss: 1.1615 caption_loss_cls: 1.9656 grounding_loss_reg: 2.2918 detection_loss_cls: 0.0276 detection_loss_reg: 0.3119 semantic_segmentation_loss_cls: 0.0072 instance_segmentation_loss_cls: 0.0276 instance_segmentation_loss_reg: 0.3133 instance_segmentation_loss_poly: 0.8021 +2023/11/07 08:56:33 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231106_193813 +2023/11/07 08:56:33 - mmengine - INFO - Iter(train) [558000/640000] base_lr: 9.9125e-06 lr: 2.7193e-06 eta: 1 day, 1:25:45 time: 1.1070 data_time: 0.0356 memory: 21519 grad_norm: 4.2191 loss: 1.1642 caption_loss_cls: 1.9654 grounding_loss_reg: 2.2920 detection_loss_cls: 0.0276 detection_loss_reg: 0.3117 semantic_segmentation_loss_cls: 0.0073 instance_segmentation_loss_cls: 0.0277 instance_segmentation_loss_reg: 0.3145 instance_segmentation_loss_poly: 0.8045 +2023/11/07 08:56:33 - mmengine - INFO - Saving checkpoint at 558000 iterations +2023/11/07 09:05:41 - mmengine - INFO - Iter(train) [558500/640000] base_lr: 9.8175e-06 lr: 2.7107e-06 eta: 1 day, 1:16:06 time: 1.1124 data_time: 0.0357 memory: 21519 grad_norm: 4.1978 loss: 1.1537 caption_loss_cls: 1.9685 grounding_loss_reg: 2.2927 detection_loss_cls: 0.0277 detection_loss_reg: 0.3134 semantic_segmentation_loss_cls: 0.0072 instance_segmentation_loss_cls: 0.0277 instance_segmentation_loss_reg: 0.3137 instance_segmentation_loss_poly: 0.8035 +2023/11/07 09:14:43 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231106_193813 +2023/11/07 09:14:43 - mmengine - INFO - Iter(train) [559000/640000] base_lr: 9.7232e-06 lr: 2.7021e-06 eta: 1 day, 1:06:17 time: 1.1043 data_time: 0.0354 memory: 21519 grad_norm: 4.2548 loss: 1.1576 caption_loss_cls: 1.9683 grounding_loss_reg: 2.2933 detection_loss_cls: 0.0277 detection_loss_reg: 0.3135 semantic_segmentation_loss_cls: 0.0072 instance_segmentation_loss_cls: 0.0277 instance_segmentation_loss_reg: 0.3135 instance_segmentation_loss_poly: 0.8035 +2023/11/07 09:14:43 - mmengine - INFO - Saving checkpoint at 559000 iterations +2023/11/07 09:24:01 - mmengine - INFO - Iter(train) [559500/640000] base_lr: 9.6294e-06 lr: 2.6936e-06 eta: 1 day, 0:56:57 time: 1.0942 data_time: 0.0348 memory: 21519 grad_norm: 4.3253 loss: 1.1622 caption_loss_cls: 1.9649 grounding_loss_reg: 2.2958 detection_loss_cls: 0.0276 detection_loss_reg: 0.3122 semantic_segmentation_loss_cls: 0.0073 instance_segmentation_loss_cls: 0.0276 instance_segmentation_loss_reg: 0.3123 instance_segmentation_loss_poly: 0.8004 +2023/11/07 09:33:38 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231106_193813 +2023/11/07 09:33:38 - mmengine - INFO - Iter(train) [560000/640000] base_lr: 9.5361e-06 lr: 2.6851e-06 eta: 1 day, 0:48:15 time: 1.1022 data_time: 0.0350 memory: 21519 grad_norm: 4.3067 loss: 1.1604 caption_loss_cls: 1.9680 grounding_loss_reg: 2.2952 detection_loss_cls: 0.0275 detection_loss_reg: 0.3114 semantic_segmentation_loss_cls: 0.0073 instance_segmentation_loss_cls: 0.0275 instance_segmentation_loss_reg: 0.3116 instance_segmentation_loss_poly: 0.7984 +2023/11/07 09:33:38 - mmengine - INFO - Saving checkpoint at 560000 iterations +2023/11/07 09:42:15 - mmengine - INFO - Evaluating bbox... +2023/11/07 09:43:11 - mmengine - INFO - bbox_mAP_copypaste: 0.464 0.639 0.502 0.290 0.513 0.612 +2023/11/07 09:43:11 - mmengine - INFO - Evaluating segm... +2023/11/07 09:44:23 - mmengine - INFO - segm_mAP_copypaste: 0.315 0.558 0.308 0.155 0.362 0.490 +2023/11/07 09:49:36 - mmengine - INFO - per class results: +2023/11/07 09:49:36 - mmengine - INFO - ++---------------------+-------+-------+ +| Class | IoU | Acc | ++---------------------+-------+-------+ +| wall | 75.56 | 88.86 | +| building | 80.36 | 90.55 | +| sky | 92.93 | 97.57 | +| floor | 80.37 | 89.94 | +| tree | 72.9 | 86.48 | +| ceiling | 82.97 | 94.24 | +| road | 82.26 | 89.23 | +| bed | 88.25 | 94.34 | +| windowpane | 60.08 | 76.66 | +| grass | 66.3 | 83.38 | +| cabinet | 59.76 | 71.89 | +| sidewalk | 66.31 | 80.43 | +| person | 79.07 | 90.96 | +| earth | 37.63 | 51.17 | +| door | 47.9 | 59.22 | +| table | 58.88 | 74.73 | +| mountain | 53.48 | 66.59 | +| plant | 51.63 | 62.11 | +| curtain | 68.0 | 84.23 | +| chair | 56.27 | 69.97 | +| car | 82.88 | 90.26 | +| water | 51.91 | 67.53 | +| painting | 71.9 | 84.83 | +| sofa | 66.51 | 80.22 | +| shelf | 41.91 | 61.49 | +| house | 43.15 | 61.47 | +| sea | 49.49 | 69.08 | +| mirror | 63.24 | 72.0 | +| rug | 61.65 | 70.32 | +| field | 29.81 | 45.16 | +| armchair | 42.52 | 64.13 | +| seat | 63.5 | 79.43 | +| fence | 41.87 | 60.9 | +| desk | 42.33 | 58.68 | +| rock | 36.53 | 54.09 | +| wardrobe | 43.26 | 58.71 | +| lamp | 60.49 | 72.89 | +| bathtub | 76.38 | 86.54 | +| railing | 26.27 | 37.99 | +| cushion | 56.75 | 69.34 | +| base | 22.85 | 29.26 | +| box | 25.04 | 32.83 | +| column | 46.94 | 57.72 | +| signboard | 36.74 | 49.05 | +| chest of drawers | 34.07 | 52.39 | +| counter | 29.56 | 41.25 | +| sand | 35.77 | 51.56 | +| sink | 71.57 | 78.32 | +| skyscraper | 48.87 | 59.22 | +| fireplace | 72.18 | 84.29 | +| refrigerator | 74.35 | 80.92 | +| grandstand | 35.48 | 69.58 | +| path | 30.11 | 41.75 | +| stairs | 25.78 | 34.41 | +| runway | 65.24 | 77.69 | +| case | 41.22 | 48.13 | +| pool table | 88.15 | 95.39 | +| pillow | 56.1 | 68.14 | +| screen door | 69.93 | 76.36 | +| stairway | 29.25 | 41.74 | +| river | 15.1 | 32.66 | +| bridge | 47.94 | 55.19 | +| bookcase | 35.52 | 56.1 | +| blind | 23.52 | 25.24 | +| coffee table | 64.21 | 81.54 | +| toilet | 83.83 | 89.01 | +| flower | 33.9 | 46.24 | +| book | 46.16 | 71.07 | +| hill | 8.97 | 18.5 | +| bench | 47.58 | 55.49 | +| countertop | 52.01 | 64.74 | +| stove | 76.66 | 84.36 | +| palm | 44.15 | 56.25 | +| kitchen island | 39.79 | 67.96 | +| computer | 69.65 | 80.69 | +| swivel chair | 40.56 | 50.07 | +| boat | 75.69 | 84.08 | +| bar | 45.12 | 55.12 | +| arcade machine | 24.74 | 25.75 | +| hovel | 15.9 | 19.58 | +| bus | 87.44 | 94.43 | +| towel | 60.34 | 72.33 | +| light | 45.97 | 53.65 | +| truck | 41.68 | 50.29 | +| tower | 39.5 | 50.08 | +| chandelier | 63.0 | 76.86 | +| awning | 24.96 | 29.36 | +| streetlight | 26.66 | 34.66 | +| booth | 45.11 | 46.21 | +| television receiver | 69.84 | 82.31 | +| airplane | 55.04 | 65.19 | +| dirt track | 0.47 | 2.07 | +| apparel | 38.13 | 54.44 | +| pole | 28.01 | 37.27 | +| land | 0.35 | 0.47 | +| bannister | 14.53 | 19.32 | +| escalator | 27.3 | 29.66 | +| ottoman | 47.49 | 68.36 | +| bottle | 26.36 | 33.46 | +| buffet | 37.19 | 41.47 | +| poster | 26.15 | 33.54 | +| stage | 10.35 | 16.87 | +| van | 42.61 | 57.63 | +| ship | 62.22 | 64.05 | +| fountain | 17.18 | 17.7 | +| conveyer belt | 77.14 | 84.65 | +| canopy | 22.03 | 29.54 | +| washer | 65.42 | 67.86 | +| plaything | 33.68 | 43.88 | +| swimming pool | 57.04 | 72.11 | +| stool | 42.37 | 52.81 | +| barrel | 32.96 | 49.55 | +| basket | 28.8 | 41.72 | +| waterfall | 50.29 | 61.71 | +| tent | 88.37 | 97.52 | +| bag | 14.79 | 17.06 | +| minibike | 72.77 | 82.02 | +| cradle | 75.51 | 93.08 | +| oven | 45.33 | 59.57 | +| ball | 39.1 | 42.51 | +| food | 57.71 | 66.23 | +| step | 15.31 | 17.67 | +| tank | 39.09 | 47.6 | +| trade name | 23.98 | 27.95 | +| microwave | 81.57 | 89.67 | +| pot | 45.82 | 52.19 | +| animal | 60.27 | 63.29 | +| bicycle | 54.46 | 70.05 | +| lake | 54.21 | 55.56 | +| dishwasher | 53.41 | 76.27 | +| screen | 60.1 | 79.05 | +| blanket | 13.03 | 15.94 | +| sculpture | 55.86 | 69.47 | +| hood | 56.68 | 64.18 | +| sconce | 35.1 | 43.08 | +| vase | 42.36 | 56.13 | +| traffic light | 35.01 | 51.71 | +| tray | 10.28 | 23.83 | +| ashcan | 39.89 | 56.51 | +| fan | 52.99 | 63.9 | +| pier | 40.08 | 57.38 | +| crt screen | 10.24 | 27.9 | +| plate | 54.68 | 68.47 | +| monitor | 16.61 | 21.04 | +| bulletin board | 31.49 | 42.46 | +| shower | 6.22 | 9.81 | +| radiator | 49.79 | 54.92 | +| glass | 16.19 | 17.74 | +| clock | 25.4 | 30.41 | +| flag | 28.82 | 32.81 | ++---------------------+-------+-------+ +2023/11/07 09:49:51 - mmengine - INFO - Iter(val) [209/209] coco/bbox_mAP: 0.4640 coco/bbox_mAP_50: 0.6390 coco/bbox_mAP_75: 0.5020 coco/bbox_mAP_s: 0.2900 coco/bbox_mAP_m: 0.5130 coco/bbox_mAP_l: 0.6120 coco/segm_mAP: 0.3150 coco/segm_mAP_50: 0.5580 coco/segm_mAP_75: 0.3080 coco/segm_mAP_s: 0.1550 coco/segm_mAP_m: 0.3620 coco/segm_mAP_l: 0.4900 Bleu_1: 0.7599 Bleu_2: 0.5978 Bleu_3: 0.4583 Bleu_4: 0.3477 METEOR: 0.2695 ROUGE_L: 0.5586 CIDEr: 1.1099 SPICE: 0.2021 aAcc: 81.9900 mIoU: 47.2900 mAcc: 58.1200 visual-grounding/miou: 0.7878 visual-grounding/acc: 0.8561 data_time: 0.0047 time: 0.5240 +2023/11/07 09:59:02 - mmengine - INFO - Iter(train) [560500/640000] base_lr: 9.4434e-06 lr: 2.6767e-06 eta: 1 day, 0:38:45 time: 1.0999 data_time: 0.0322 memory: 21519 grad_norm: 4.3358 loss: 1.1712 caption_loss_cls: 1.9686 grounding_loss_reg: 2.2967 detection_loss_cls: 0.0275 detection_loss_reg: 0.3108 semantic_segmentation_loss_cls: 0.0073 instance_segmentation_loss_cls: 0.0275 instance_segmentation_loss_reg: 0.3118 instance_segmentation_loss_poly: 0.7982 +2023/11/07 10:08:18 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231106_193813 +2023/11/07 10:08:18 - mmengine - INFO - Iter(train) [561000/640000] base_lr: 9.3512e-06 lr: 2.6683e-06 eta: 1 day, 0:29:23 time: 1.1020 data_time: 0.0322 memory: 21519 grad_norm: 4.3198 loss: 1.1726 caption_loss_cls: 1.9687 grounding_loss_reg: 2.2979 detection_loss_cls: 0.0275 detection_loss_reg: 0.3105 semantic_segmentation_loss_cls: 0.0073 instance_segmentation_loss_cls: 0.0274 instance_segmentation_loss_reg: 0.3108 instance_segmentation_loss_poly: 0.7962 +2023/11/07 10:08:18 - mmengine - INFO - Saving checkpoint at 561000 iterations +2023/11/07 10:18:14 - mmengine - INFO - Iter(train) [561500/640000] base_lr: 9.2596e-06 lr: 2.6600e-06 eta: 1 day, 0:21:11 time: 1.1183 data_time: 0.0324 memory: 21519 grad_norm: 4.3061 loss: 1.1737 caption_loss_cls: 1.9710 grounding_loss_reg: 2.2976 detection_loss_cls: 0.0273 detection_loss_reg: 0.3088 semantic_segmentation_loss_cls: 0.0073 instance_segmentation_loss_cls: 0.0273 instance_segmentation_loss_reg: 0.3102 instance_segmentation_loss_poly: 0.7957 +2023/11/07 10:27:29 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231106_193813 +2023/11/07 10:27:29 - mmengine - INFO - Iter(train) [562000/640000] base_lr: 9.1686e-06 lr: 2.6517e-06 eta: 1 day, 0:11:46 time: 1.1203 data_time: 0.0325 memory: 21519 grad_norm: 4.3608 loss: 1.1778 caption_loss_cls: 1.9725 grounding_loss_reg: 2.2969 detection_loss_cls: 0.0274 detection_loss_reg: 0.3087 semantic_segmentation_loss_cls: 0.0072 instance_segmentation_loss_cls: 0.0274 instance_segmentation_loss_reg: 0.3112 instance_segmentation_loss_poly: 0.7970 +2023/11/07 10:27:29 - mmengine - INFO - Saving checkpoint at 562000 iterations +2023/11/07 10:37:05 - mmengine - INFO - Iter(train) [562500/640000] base_lr: 9.0781e-06 lr: 2.6435e-06 eta: 1 day, 0:02:57 time: 1.1272 data_time: 0.0328 memory: 21519 grad_norm: 4.3077 loss: 1.1749 caption_loss_cls: 1.9719 grounding_loss_reg: 2.2964 detection_loss_cls: 0.0274 detection_loss_reg: 0.3092 semantic_segmentation_loss_cls: 0.0072 instance_segmentation_loss_cls: 0.0275 instance_segmentation_loss_reg: 0.3114 instance_segmentation_loss_poly: 0.7978 +2023/11/07 10:46:51 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231106_193813 +2023/11/07 10:46:51 - mmengine - INFO - Iter(train) [563000/640000] base_lr: 8.9881e-06 lr: 2.6353e-06 eta: 23:54:23 time: 1.1381 data_time: 0.0332 memory: 21519 grad_norm: 4.2483 loss: 1.1677 caption_loss_cls: 1.9698 grounding_loss_reg: 2.2949 detection_loss_cls: 0.0274 detection_loss_reg: 0.3105 semantic_segmentation_loss_cls: 0.0072 instance_segmentation_loss_cls: 0.0275 instance_segmentation_loss_reg: 0.3128 instance_segmentation_loss_poly: 0.7993 +2023/11/07 10:46:51 - mmengine - INFO - Saving checkpoint at 563000 iterations +2023/11/07 10:56:21 - mmengine - INFO - Iter(train) [563500/640000] base_lr: 8.8987e-06 lr: 2.6272e-06 eta: 23:45:22 time: 1.1413 data_time: 0.0333 memory: 21519 grad_norm: 4.2088 loss: 1.1603 caption_loss_cls: 1.9711 grounding_loss_reg: 2.2947 detection_loss_cls: 0.0274 detection_loss_reg: 0.3093 semantic_segmentation_loss_cls: 0.0073 instance_segmentation_loss_cls: 0.0275 instance_segmentation_loss_reg: 0.3130 instance_segmentation_loss_poly: 0.8000 +2023/11/07 11:06:03 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231106_193813 +2023/11/07 11:06:03 - mmengine - INFO - Iter(train) [564000/640000] base_lr: 8.8099e-06 lr: 2.6191e-06 eta: 23:36:40 time: 1.1424 data_time: 0.0332 memory: 21519 grad_norm: 4.1175 loss: 1.1477 caption_loss_cls: 1.9688 grounding_loss_reg: 2.2939 detection_loss_cls: 0.0275 detection_loss_reg: 0.3102 semantic_segmentation_loss_cls: 0.0073 instance_segmentation_loss_cls: 0.0274 instance_segmentation_loss_reg: 0.3125 instance_segmentation_loss_poly: 0.7991 +2023/11/07 11:06:03 - mmengine - INFO - Saving checkpoint at 564000 iterations +2023/11/07 11:15:29 - mmengine - INFO - Iter(train) [564500/640000] base_lr: 8.7216e-06 lr: 2.6111e-06 eta: 23:27:30 time: 1.1457 data_time: 0.0363 memory: 21519 grad_norm: 4.1059 loss: 1.1455 caption_loss_cls: 1.9676 grounding_loss_reg: 2.2918 detection_loss_cls: 0.0275 detection_loss_reg: 0.3104 semantic_segmentation_loss_cls: 0.0073 instance_segmentation_loss_cls: 0.0275 instance_segmentation_loss_reg: 0.3135 instance_segmentation_loss_poly: 0.8013 +2023/11/07 11:24:59 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231106_193813 +2023/11/07 11:24:59 - mmengine - INFO - Iter(train) [565000/640000] base_lr: 8.6339e-06 lr: 2.6031e-06 eta: 23:18:27 time: 1.1493 data_time: 0.0365 memory: 21519 grad_norm: 4.0794 loss: 1.1438 caption_loss_cls: 1.9714 grounding_loss_reg: 2.2922 detection_loss_cls: 0.0275 detection_loss_reg: 0.3112 semantic_segmentation_loss_cls: 0.0073 instance_segmentation_loss_cls: 0.0276 instance_segmentation_loss_reg: 0.3144 instance_segmentation_loss_poly: 0.8029 +2023/11/07 11:24:59 - mmengine - INFO - Saving checkpoint at 565000 iterations +2023/11/07 11:34:34 - mmengine - INFO - Iter(train) [565500/640000] base_lr: 8.5467e-06 lr: 2.5952e-06 eta: 23:09:31 time: 1.1440 data_time: 0.0365 memory: 21519 grad_norm: 4.0875 loss: 1.1452 caption_loss_cls: 1.9702 grounding_loss_reg: 2.2906 detection_loss_cls: 0.0275 detection_loss_reg: 0.3112 semantic_segmentation_loss_cls: 0.0073 instance_segmentation_loss_cls: 0.0275 instance_segmentation_loss_reg: 0.3140 instance_segmentation_loss_poly: 0.8029 +2023/11/07 11:44:03 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231106_193813 +2023/11/07 11:44:03 - mmengine - INFO - Iter(train) [566000/640000] base_lr: 8.4601e-06 lr: 2.5873e-06 eta: 23:00:24 time: 1.1474 data_time: 0.0363 memory: 21519 grad_norm: 4.0202 loss: 1.1278 caption_loss_cls: 1.9737 grounding_loss_reg: 2.2878 detection_loss_cls: 0.0276 detection_loss_reg: 0.3127 semantic_segmentation_loss_cls: 0.0073 instance_segmentation_loss_cls: 0.0276 instance_segmentation_loss_reg: 0.3147 instance_segmentation_loss_poly: 0.8046 +2023/11/07 11:44:03 - mmengine - INFO - Saving checkpoint at 566000 iterations +2023/11/07 11:53:30 - mmengine - INFO - Iter(train) [566500/640000] base_lr: 8.3740e-06 lr: 2.5795e-06 eta: 22:51:15 time: 1.1452 data_time: 0.0362 memory: 21519 grad_norm: 4.0570 loss: 1.1257 caption_loss_cls: 1.9700 grounding_loss_reg: 2.2887 detection_loss_cls: 0.0277 detection_loss_reg: 0.3132 semantic_segmentation_loss_cls: 0.0073 instance_segmentation_loss_cls: 0.0276 instance_segmentation_loss_reg: 0.3154 instance_segmentation_loss_poly: 0.8055 +2023/11/07 12:02:57 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231106_193813 +2023/11/07 12:02:57 - mmengine - INFO - Iter(train) [567000/640000] base_lr: 8.2885e-06 lr: 2.5717e-06 eta: 22:42:06 time: 1.1407 data_time: 0.0360 memory: 21519 grad_norm: 4.0853 loss: 1.1346 caption_loss_cls: 1.9732 grounding_loss_reg: 2.2890 detection_loss_cls: 0.0277 detection_loss_reg: 0.3135 semantic_segmentation_loss_cls: 0.0073 instance_segmentation_loss_cls: 0.0277 instance_segmentation_loss_reg: 0.3160 instance_segmentation_loss_poly: 0.8067 +2023/11/07 12:02:57 - mmengine - INFO - Saving checkpoint at 567000 iterations +2023/11/07 12:12:16 - mmengine - INFO - Iter(train) [567500/640000] base_lr: 8.2036e-06 lr: 2.5640e-06 eta: 22:32:44 time: 1.1377 data_time: 0.0358 memory: 21519 grad_norm: 4.0692 loss: 1.1370 caption_loss_cls: 1.9737 grounding_loss_reg: 2.2866 detection_loss_cls: 0.0277 detection_loss_reg: 0.3137 semantic_segmentation_loss_cls: 0.0073 instance_segmentation_loss_cls: 0.0275 instance_segmentation_loss_reg: 0.3153 instance_segmentation_loss_poly: 0.8050 +2023/11/07 12:21:14 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231106_193813 +2023/11/07 12:21:14 - mmengine - INFO - Iter(train) [568000/640000] base_lr: 8.1192e-06 lr: 2.5563e-06 eta: 22:22:53 time: 1.1268 data_time: 0.0356 memory: 21519 grad_norm: 4.1811 loss: 1.1502 caption_loss_cls: 1.9699 grounding_loss_reg: 2.2863 detection_loss_cls: 0.0278 detection_loss_reg: 0.3149 semantic_segmentation_loss_cls: 0.0072 instance_segmentation_loss_cls: 0.0276 instance_segmentation_loss_reg: 0.3152 instance_segmentation_loss_poly: 0.8052 +2023/11/07 12:21:14 - mmengine - INFO - Saving checkpoint at 568000 iterations +2023/11/07 12:30:44 - mmengine - INFO - Iter(train) [568500/640000] base_lr: 8.0354e-06 lr: 2.5487e-06 eta: 22:13:47 time: 1.1278 data_time: 0.0353 memory: 21519 grad_norm: 4.1688 loss: 1.1371 caption_loss_cls: 1.9706 grounding_loss_reg: 2.2822 detection_loss_cls: 0.0277 detection_loss_reg: 0.3142 semantic_segmentation_loss_cls: 0.0072 instance_segmentation_loss_cls: 0.0276 instance_segmentation_loss_reg: 0.3156 instance_segmentation_loss_poly: 0.8065 +2023/11/07 12:40:14 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231106_193813 +2023/11/07 12:40:14 - mmengine - INFO - Iter(train) [569000/640000] base_lr: 7.9521e-06 lr: 2.5411e-06 eta: 22:04:41 time: 1.1278 data_time: 0.0353 memory: 21519 grad_norm: 4.1980 loss: 1.1426 caption_loss_cls: 1.9705 grounding_loss_reg: 2.2806 detection_loss_cls: 0.0277 detection_loss_reg: 0.3144 semantic_segmentation_loss_cls: 0.0072 instance_segmentation_loss_cls: 0.0276 instance_segmentation_loss_reg: 0.3156 instance_segmentation_loss_poly: 0.8068 +2023/11/07 12:40:14 - mmengine - INFO - Saving checkpoint at 569000 iterations +2023/11/07 12:49:09 - mmengine - INFO - Iter(train) [569500/640000] base_lr: 7.8694e-06 lr: 2.5336e-06 eta: 21:54:47 time: 1.1177 data_time: 0.0351 memory: 21519 grad_norm: 4.2359 loss: 1.1505 caption_loss_cls: 1.9719 grounding_loss_reg: 2.2824 detection_loss_cls: 0.0278 detection_loss_reg: 0.3154 semantic_segmentation_loss_cls: 0.0072 instance_segmentation_loss_cls: 0.0276 instance_segmentation_loss_reg: 0.3160 instance_segmentation_loss_poly: 0.8079 +2023/11/07 12:59:01 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231106_193813 +2023/11/07 12:59:01 - mmengine - INFO - Iter(train) [570000/640000] base_lr: 7.7873e-06 lr: 2.5261e-06 eta: 21:46:10 time: 1.1234 data_time: 0.0353 memory: 21519 grad_norm: 4.2416 loss: 1.1590 caption_loss_cls: 1.9742 grounding_loss_reg: 2.2823 detection_loss_cls: 0.0278 detection_loss_reg: 0.3156 semantic_segmentation_loss_cls: 0.0072 instance_segmentation_loss_cls: 0.0276 instance_segmentation_loss_reg: 0.3155 instance_segmentation_loss_poly: 0.8076 +2023/11/07 12:59:01 - mmengine - INFO - Saving checkpoint at 570000 iterations +2023/11/07 13:08:24 - mmengine - INFO - Iter(train) [570500/640000] base_lr: 7.7057e-06 lr: 2.5187e-06 eta: 21:36:54 time: 1.1226 data_time: 0.0356 memory: 21519 grad_norm: 4.2394 loss: 1.1717 caption_loss_cls: 1.9725 grounding_loss_reg: 2.2843 detection_loss_cls: 0.0279 detection_loss_reg: 0.3163 semantic_segmentation_loss_cls: 0.0072 instance_segmentation_loss_cls: 0.0276 instance_segmentation_loss_reg: 0.3162 instance_segmentation_loss_poly: 0.8094 +2023/11/07 13:17:43 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231106_193813 +2023/11/07 13:17:43 - mmengine - INFO - Iter(train) [571000/640000] base_lr: 7.6247e-06 lr: 2.5113e-06 eta: 21:27:32 time: 1.1204 data_time: 0.0355 memory: 21519 grad_norm: 4.2457 loss: 1.1687 caption_loss_cls: 1.9719 grounding_loss_reg: 2.2842 detection_loss_cls: 0.0279 detection_loss_reg: 0.3165 semantic_segmentation_loss_cls: 0.0072 instance_segmentation_loss_cls: 0.0277 instance_segmentation_loss_reg: 0.3156 instance_segmentation_loss_poly: 0.8083 +2023/11/07 13:17:43 - mmengine - INFO - Saving checkpoint at 571000 iterations +2023/11/07 13:26:53 - mmengine - INFO - Iter(train) [571500/640000] base_lr: 7.5443e-06 lr: 2.5040e-06 eta: 21:17:59 time: 1.1181 data_time: 0.0354 memory: 21519 grad_norm: 4.2682 loss: 1.1685 caption_loss_cls: 1.9740 grounding_loss_reg: 2.2839 detection_loss_cls: 0.0279 detection_loss_reg: 0.3170 semantic_segmentation_loss_cls: 0.0072 instance_segmentation_loss_cls: 0.0277 instance_segmentation_loss_reg: 0.3153 instance_segmentation_loss_poly: 0.8072 +2023/11/07 13:36:09 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231106_193813 +2023/11/07 13:36:09 - mmengine - INFO - Iter(train) [572000/640000] base_lr: 7.4644e-06 lr: 2.4968e-06 eta: 21:08:34 time: 1.1226 data_time: 0.0357 memory: 21519 grad_norm: 4.2510 loss: 1.1757 caption_loss_cls: 1.9747 grounding_loss_reg: 2.2867 detection_loss_cls: 0.0279 detection_loss_reg: 0.3162 semantic_segmentation_loss_cls: 0.0072 instance_segmentation_loss_cls: 0.0277 instance_segmentation_loss_reg: 0.3156 instance_segmentation_loss_poly: 0.8085 +2023/11/07 13:36:09 - mmengine - INFO - Saving checkpoint at 572000 iterations +2023/11/07 13:45:23 - mmengine - INFO - Iter(train) [572500/640000] base_lr: 7.3850e-06 lr: 2.4895e-06 eta: 20:59:08 time: 1.1188 data_time: 0.0357 memory: 21519 grad_norm: 4.2660 loss: 1.1847 caption_loss_cls: 1.9735 grounding_loss_reg: 2.2860 detection_loss_cls: 0.0279 detection_loss_reg: 0.3162 semantic_segmentation_loss_cls: 0.0072 instance_segmentation_loss_cls: 0.0278 instance_segmentation_loss_reg: 0.3162 instance_segmentation_loss_poly: 0.8098 +2023/11/07 13:53:39 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231106_193813 +2023/11/07 13:53:39 - mmengine - INFO - Iter(train) [573000/640000] base_lr: 7.3063e-06 lr: 2.4824e-06 eta: 20:48:31 time: 1.1001 data_time: 0.0351 memory: 21519 grad_norm: 4.3355 loss: 1.1890 caption_loss_cls: 1.9736 grounding_loss_reg: 2.2877 detection_loss_cls: 0.0279 detection_loss_reg: 0.3163 semantic_segmentation_loss_cls: 0.0072 instance_segmentation_loss_cls: 0.0278 instance_segmentation_loss_reg: 0.3162 instance_segmentation_loss_poly: 0.8103 +2023/11/07 13:53:39 - mmengine - INFO - Saving checkpoint at 573000 iterations +2023/11/07 14:03:17 - mmengine - INFO - Iter(train) [573500/640000] base_lr: 7.2281e-06 lr: 2.4753e-06 eta: 20:39:34 time: 1.1110 data_time: 0.0353 memory: 21519 grad_norm: 4.2690 loss: 1.1757 caption_loss_cls: 1.9725 grounding_loss_reg: 2.2861 detection_loss_cls: 0.0280 detection_loss_reg: 0.3167 semantic_segmentation_loss_cls: 0.0072 instance_segmentation_loss_cls: 0.0278 instance_segmentation_loss_reg: 0.3167 instance_segmentation_loss_poly: 0.8112 +2023/11/07 14:12:27 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231106_193813 +2023/11/07 14:12:27 - mmengine - INFO - Iter(train) [574000/640000] base_lr: 7.1504e-06 lr: 2.4682e-06 eta: 20:30:03 time: 1.1006 data_time: 0.0351 memory: 21519 grad_norm: 4.3609 loss: 1.1814 caption_loss_cls: 1.9699 grounding_loss_reg: 2.2866 detection_loss_cls: 0.0279 detection_loss_reg: 0.3167 semantic_segmentation_loss_cls: 0.0072 instance_segmentation_loss_cls: 0.0278 instance_segmentation_loss_reg: 0.3167 instance_segmentation_loss_poly: 0.8118 +2023/11/07 14:12:27 - mmengine - INFO - Saving checkpoint at 574000 iterations +2023/11/07 14:21:43 - mmengine - INFO - Iter(train) [574500/640000] base_lr: 7.0734e-06 lr: 2.4612e-06 eta: 20:20:40 time: 1.0986 data_time: 0.0348 memory: 21519 grad_norm: 4.3598 loss: 1.1708 caption_loss_cls: 1.9710 grounding_loss_reg: 2.2863 detection_loss_cls: 0.0280 detection_loss_reg: 0.3172 semantic_segmentation_loss_cls: 0.0072 instance_segmentation_loss_cls: 0.0277 instance_segmentation_loss_reg: 0.3167 instance_segmentation_loss_poly: 0.8111 +2023/11/07 14:30:36 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231106_193813 +2023/11/07 14:30:36 - mmengine - INFO - Iter(train) [575000/640000] base_lr: 6.9969e-06 lr: 2.4543e-06 eta: 20:10:51 time: 1.0923 data_time: 0.0345 memory: 21519 grad_norm: 4.3950 loss: 1.1620 caption_loss_cls: 1.9659 grounding_loss_reg: 2.2838 detection_loss_cls: 0.0280 detection_loss_reg: 0.3179 semantic_segmentation_loss_cls: 0.0072 instance_segmentation_loss_cls: 0.0276 instance_segmentation_loss_reg: 0.3167 instance_segmentation_loss_poly: 0.8113 +2023/11/07 14:30:36 - mmengine - INFO - Saving checkpoint at 575000 iterations +2023/11/07 14:40:36 - mmengine - INFO - Iter(train) [575500/640000] base_lr: 6.9209e-06 lr: 2.4474e-06 eta: 20:02:17 time: 1.1048 data_time: 0.0351 memory: 21519 grad_norm: 4.3372 loss: 1.1543 caption_loss_cls: 1.9627 grounding_loss_reg: 2.2817 detection_loss_cls: 0.0279 detection_loss_reg: 0.3178 semantic_segmentation_loss_cls: 0.0072 instance_segmentation_loss_cls: 0.0276 instance_segmentation_loss_reg: 0.3163 instance_segmentation_loss_poly: 0.8111 +2023/11/07 14:49:57 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231106_193813 +2023/11/07 14:49:57 - mmengine - INFO - Iter(train) [576000/640000] base_lr: 6.8456e-06 lr: 2.4405e-06 eta: 19:52:59 time: 1.1059 data_time: 0.0350 memory: 21519 grad_norm: 4.3369 loss: 1.1509 caption_loss_cls: 1.9656 grounding_loss_reg: 2.2783 detection_loss_cls: 0.0279 detection_loss_reg: 0.3175 semantic_segmentation_loss_cls: 0.0072 instance_segmentation_loss_cls: 0.0276 instance_segmentation_loss_reg: 0.3165 instance_segmentation_loss_poly: 0.8114 +2023/11/07 14:49:57 - mmengine - INFO - Saving checkpoint at 576000 iterations +2023/11/07 14:59:31 - mmengine - INFO - Iter(train) [576500/640000] base_lr: 6.7708e-06 lr: 2.4337e-06 eta: 19:43:55 time: 1.1108 data_time: 0.0352 memory: 21519 grad_norm: 4.3220 loss: 1.1428 caption_loss_cls: 1.9619 grounding_loss_reg: 2.2778 detection_loss_cls: 0.0278 detection_loss_reg: 0.3172 semantic_segmentation_loss_cls: 0.0072 instance_segmentation_loss_cls: 0.0277 instance_segmentation_loss_reg: 0.3170 instance_segmentation_loss_poly: 0.8121 +2023/11/07 15:08:46 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231106_193813 +2023/11/07 15:08:46 - mmengine - INFO - Iter(train) [577000/640000] base_lr: 6.6965e-06 lr: 2.4270e-06 eta: 19:34:31 time: 1.1259 data_time: 0.0357 memory: 21519 grad_norm: 4.2496 loss: 1.1332 caption_loss_cls: 1.9636 grounding_loss_reg: 2.2768 detection_loss_cls: 0.0278 detection_loss_reg: 0.3175 semantic_segmentation_loss_cls: 0.0072 instance_segmentation_loss_cls: 0.0276 instance_segmentation_loss_reg: 0.3168 instance_segmentation_loss_poly: 0.8124 +2023/11/07 15:08:46 - mmengine - INFO - Saving checkpoint at 577000 iterations +2023/11/07 15:18:41 - mmengine - INFO - Iter(train) [577500/640000] base_lr: 6.6228e-06 lr: 2.4203e-06 eta: 19:25:48 time: 1.1301 data_time: 0.0375 memory: 21519 grad_norm: 4.2839 loss: 1.1411 caption_loss_cls: 1.9665 grounding_loss_reg: 2.2759 detection_loss_cls: 0.0278 detection_loss_reg: 0.3174 semantic_segmentation_loss_cls: 0.0072 instance_segmentation_loss_cls: 0.0276 instance_segmentation_loss_reg: 0.3170 instance_segmentation_loss_poly: 0.8125 +2023/11/07 15:28:17 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231106_193813 +2023/11/07 15:28:17 - mmengine - INFO - Iter(train) [578000/640000] base_lr: 6.5497e-06 lr: 2.4136e-06 eta: 19:16:44 time: 1.1363 data_time: 0.0377 memory: 21519 grad_norm: 4.2222 loss: 1.1334 caption_loss_cls: 1.9633 grounding_loss_reg: 2.2753 detection_loss_cls: 0.0279 detection_loss_reg: 0.3180 semantic_segmentation_loss_cls: 0.0072 instance_segmentation_loss_cls: 0.0277 instance_segmentation_loss_reg: 0.3168 instance_segmentation_loss_poly: 0.8118 +2023/11/07 15:28:17 - mmengine - INFO - Saving checkpoint at 578000 iterations +2023/11/07 15:38:04 - mmengine - INFO - Iter(train) [578500/640000] base_lr: 6.4772e-06 lr: 2.4070e-06 eta: 19:07:51 time: 1.1442 data_time: 0.0380 memory: 21519 grad_norm: 4.1902 loss: 1.1315 caption_loss_cls: 1.9632 grounding_loss_reg: 2.2743 detection_loss_cls: 0.0278 detection_loss_reg: 0.3177 semantic_segmentation_loss_cls: 0.0072 instance_segmentation_loss_cls: 0.0276 instance_segmentation_loss_reg: 0.3166 instance_segmentation_loss_poly: 0.8111 +2023/11/07 15:46:48 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231106_193813 +2023/11/07 15:46:48 - mmengine - INFO - Iter(train) [579000/640000] base_lr: 6.4053e-06 lr: 2.4005e-06 eta: 18:57:56 time: 1.1420 data_time: 0.0378 memory: 21519 grad_norm: 4.1358 loss: 1.1367 caption_loss_cls: 1.9662 grounding_loss_reg: 2.2717 detection_loss_cls: 0.0278 detection_loss_reg: 0.3170 semantic_segmentation_loss_cls: 0.0072 instance_segmentation_loss_cls: 0.0277 instance_segmentation_loss_reg: 0.3182 instance_segmentation_loss_poly: 0.8144 +2023/11/07 15:46:48 - mmengine - INFO - Saving checkpoint at 579000 iterations +2023/11/07 15:56:15 - mmengine - INFO - Iter(train) [579500/640000] base_lr: 6.3339e-06 lr: 2.3940e-06 eta: 18:48:42 time: 1.1335 data_time: 0.0374 memory: 21519 grad_norm: 4.1708 loss: 1.1448 caption_loss_cls: 1.9647 grounding_loss_reg: 2.2684 detection_loss_cls: 0.0278 detection_loss_reg: 0.3175 semantic_segmentation_loss_cls: 0.0072 instance_segmentation_loss_cls: 0.0277 instance_segmentation_loss_reg: 0.3182 instance_segmentation_loss_poly: 0.8145 +2023/11/07 16:05:16 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231106_193813 +2023/11/07 16:05:16 - mmengine - INFO - Iter(train) [580000/640000] base_lr: 6.2630e-06 lr: 2.3875e-06 eta: 18:39:05 time: 1.1289 data_time: 0.0373 memory: 21519 grad_norm: 4.1929 loss: 1.1452 caption_loss_cls: 1.9635 grounding_loss_reg: 2.2689 detection_loss_cls: 0.0278 detection_loss_reg: 0.3181 semantic_segmentation_loss_cls: 0.0072 instance_segmentation_loss_cls: 0.0277 instance_segmentation_loss_reg: 0.3183 instance_segmentation_loss_poly: 0.8144 +2023/11/07 16:05:16 - mmengine - INFO - Saving checkpoint at 580000 iterations +2023/11/07 16:14:16 - mmengine - INFO - Evaluating bbox... +2023/11/07 16:15:13 - mmengine - INFO - bbox_mAP_copypaste: 0.465 0.641 0.506 0.293 0.513 0.609 +2023/11/07 16:15:13 - mmengine - INFO - Evaluating segm... +2023/11/07 16:16:24 - mmengine - INFO - segm_mAP_copypaste: 0.315 0.559 0.308 0.162 0.361 0.488 +2023/11/07 16:21:30 - mmengine - INFO - per class results: +2023/11/07 16:21:30 - mmengine - INFO - ++---------------------+-------+-------+ +| Class | IoU | Acc | ++---------------------+-------+-------+ +| wall | 76.05 | 88.49 | +| building | 80.43 | 90.63 | +| sky | 92.9 | 97.51 | +| floor | 80.54 | 89.52 | +| tree | 73.2 | 86.24 | +| ceiling | 83.6 | 93.94 | +| road | 83.32 | 89.25 | +| bed | 88.17 | 94.99 | +| windowpane | 60.03 | 77.1 | +| grass | 66.99 | 86.36 | +| cabinet | 60.89 | 72.32 | +| sidewalk | 66.46 | 82.0 | +| person | 79.17 | 91.16 | +| earth | 37.42 | 48.93 | +| door | 49.92 | 65.06 | +| table | 59.29 | 75.52 | +| mountain | 53.64 | 68.53 | +| plant | 52.65 | 63.64 | +| curtain | 67.04 | 84.05 | +| chair | 57.26 | 70.84 | +| car | 82.81 | 90.65 | +| water | 52.82 | 67.88 | +| painting | 70.29 | 87.24 | +| sofa | 66.74 | 80.86 | +| shelf | 42.97 | 61.85 | +| house | 44.99 | 63.27 | +| sea | 50.47 | 70.89 | +| mirror | 64.67 | 73.2 | +| rug | 65.24 | 76.17 | +| field | 28.73 | 39.38 | +| armchair | 43.98 | 62.69 | +| seat | 62.93 | 79.73 | +| fence | 39.23 | 52.55 | +| desk | 45.14 | 64.6 | +| rock | 38.23 | 58.51 | +| wardrobe | 43.83 | 61.84 | +| lamp | 60.84 | 74.48 | +| bathtub | 77.16 | 84.98 | +| railing | 27.57 | 40.43 | +| cushion | 56.51 | 68.58 | +| base | 24.93 | 34.89 | +| box | 26.01 | 33.21 | +| column | 48.19 | 61.62 | +| signboard | 37.24 | 50.19 | +| chest of drawers | 37.93 | 53.91 | +| counter | 32.74 | 43.13 | +| sand | 39.4 | 62.68 | +| sink | 72.49 | 79.28 | +| skyscraper | 37.89 | 45.94 | +| fireplace | 74.31 | 89.53 | +| refrigerator | 75.9 | 84.76 | +| grandstand | 34.31 | 63.99 | +| path | 33.46 | 44.98 | +| stairs | 25.29 | 30.94 | +| runway | 68.59 | 88.4 | +| case | 44.42 | 57.88 | +| pool table | 87.36 | 95.82 | +| pillow | 58.17 | 71.57 | +| screen door | 67.47 | 72.95 | +| stairway | 29.96 | 42.4 | +| river | 15.7 | 31.82 | +| bridge | 61.92 | 73.57 | +| bookcase | 35.51 | 57.18 | +| blind | 24.04 | 26.29 | +| coffee table | 65.77 | 81.72 | +| toilet | 84.67 | 89.24 | +| flower | 34.35 | 45.38 | +| book | 45.9 | 67.57 | +| hill | 8.35 | 15.83 | +| bench | 44.22 | 49.6 | +| countertop | 49.51 | 63.43 | +| stove | 77.18 | 84.44 | +| palm | 45.37 | 57.61 | +| kitchen island | 38.53 | 70.35 | +| computer | 69.8 | 80.87 | +| swivel chair | 45.46 | 58.1 | +| boat | 73.99 | 88.38 | +| bar | 41.25 | 49.9 | +| arcade machine | 36.57 | 38.45 | +| hovel | 14.14 | 19.12 | +| bus | 86.37 | 95.25 | +| towel | 63.28 | 75.66 | +| light | 47.38 | 55.21 | +| truck | 40.12 | 47.39 | +| tower | 38.06 | 49.03 | +| chandelier | 63.45 | 77.88 | +| awning | 25.83 | 32.32 | +| streetlight | 28.72 | 36.66 | +| booth | 48.86 | 50.0 | +| television receiver | 71.69 | 82.87 | +| airplane | 56.3 | 66.97 | +| dirt track | 0.5 | 2.0 | +| apparel | 35.28 | 53.06 | +| pole | 28.92 | 38.8 | +| land | 2.32 | 3.25 | +| bannister | 12.84 | 17.25 | +| escalator | 26.31 | 27.33 | +| ottoman | 46.97 | 64.02 | +| bottle | 25.76 | 31.28 | +| buffet | 38.73 | 43.29 | +| poster | 28.58 | 37.39 | +| stage | 10.04 | 16.96 | +| van | 44.04 | 60.41 | +| ship | 77.84 | 86.89 | +| fountain | 17.35 | 17.7 | +| conveyer belt | 77.26 | 85.16 | +| canopy | 24.45 | 32.9 | +| washer | 64.21 | 66.55 | +| plaything | 34.97 | 52.54 | +| swimming pool | 59.38 | 76.58 | +| stool | 43.71 | 55.26 | +| barrel | 20.8 | 25.83 | +| basket | 26.72 | 37.78 | +| waterfall | 51.07 | 62.34 | +| tent | 86.02 | 97.89 | +| bag | 12.64 | 14.5 | +| minibike | 71.95 | 81.2 | +| cradle | 70.83 | 88.22 | +| oven | 44.14 | 57.33 | +| ball | 42.96 | 47.95 | +| food | 56.63 | 62.03 | +| step | 16.19 | 19.34 | +| tank | 40.99 | 46.83 | +| trade name | 23.42 | 26.8 | +| microwave | 79.77 | 86.5 | +| pot | 46.06 | 52.01 | +| animal | 60.9 | 63.98 | +| bicycle | 54.03 | 71.39 | +| lake | 61.61 | 65.54 | +| dishwasher | 54.58 | 75.54 | +| screen | 65.72 | 82.84 | +| blanket | 10.75 | 12.89 | +| sculpture | 55.96 | 61.13 | +| hood | 58.52 | 62.75 | +| sconce | 34.4 | 42.15 | +| vase | 42.19 | 55.15 | +| traffic light | 35.37 | 53.3 | +| tray | 10.07 | 16.64 | +| ashcan | 40.9 | 54.97 | +| fan | 55.68 | 67.6 | +| pier | 41.67 | 55.78 | +| crt screen | 5.87 | 16.3 | +| plate | 54.88 | 71.04 | +| monitor | 15.99 | 19.61 | +| bulletin board | 28.21 | 36.03 | +| shower | 6.1 | 10.58 | +| radiator | 52.13 | 57.84 | +| glass | 15.95 | 17.05 | +| clock | 25.94 | 30.32 | +| flag | 29.85 | 35.64 | ++---------------------+-------+-------+ +2023/11/07 16:21:45 - mmengine - INFO - Iter(val) [209/209] coco/bbox_mAP: 0.4650 coco/bbox_mAP_50: 0.6410 coco/bbox_mAP_75: 0.5060 coco/bbox_mAP_s: 0.2930 coco/bbox_mAP_m: 0.5130 coco/bbox_mAP_l: 0.6090 coco/segm_mAP: 0.3150 coco/segm_mAP_50: 0.5590 coco/segm_mAP_75: 0.3080 coco/segm_mAP_s: 0.1620 coco/segm_mAP_m: 0.3610 coco/segm_mAP_l: 0.4880 Bleu_1: 0.7602 Bleu_2: 0.5979 Bleu_3: 0.4590 Bleu_4: 0.3497 METEOR: 0.2715 ROUGE_L: 0.5583 CIDEr: 1.1107 SPICE: 0.2039 aAcc: 82.3000 mIoU: 47.8600 mAcc: 58.7600 visual-grounding/miou: 0.7873 visual-grounding/acc: 0.8545 data_time: 0.0049 time: 0.5246 +2023/11/07 16:30:58 - mmengine - INFO - Iter(train) [580500/640000] base_lr: 6.1928e-06 lr: 2.3812e-06 eta: 18:29:40 time: 1.1238 data_time: 0.0344 memory: 21519 grad_norm: 4.2247 loss: 1.1620 caption_loss_cls: 1.9663 grounding_loss_reg: 2.2672 detection_loss_cls: 0.0279 detection_loss_reg: 0.3191 semantic_segmentation_loss_cls: 0.0072 instance_segmentation_loss_cls: 0.0278 instance_segmentation_loss_reg: 0.3194 instance_segmentation_loss_poly: 0.8164 +2023/11/07 16:40:37 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231106_193813 +2023/11/07 16:40:37 - mmengine - INFO - Iter(train) [581000/640000] base_lr: 6.1231e-06 lr: 2.3748e-06 eta: 18:20:38 time: 1.1298 data_time: 0.0347 memory: 21519 grad_norm: 4.2275 loss: 1.1668 caption_loss_cls: 1.9657 grounding_loss_reg: 2.2666 detection_loss_cls: 0.0278 detection_loss_reg: 0.3195 semantic_segmentation_loss_cls: 0.0072 instance_segmentation_loss_cls: 0.0277 instance_segmentation_loss_reg: 0.3199 instance_segmentation_loss_poly: 0.8166 +2023/11/07 16:40:37 - mmengine - INFO - Saving checkpoint at 581000 iterations +2023/11/07 16:50:07 - mmengine - INFO - Iter(train) [581500/640000] base_lr: 6.0540e-06 lr: 2.3685e-06 eta: 18:11:27 time: 1.1236 data_time: 0.0328 memory: 21519 grad_norm: 4.1894 loss: 1.1499 caption_loss_cls: 1.9639 grounding_loss_reg: 2.2667 detection_loss_cls: 0.0279 detection_loss_reg: 0.3200 semantic_segmentation_loss_cls: 0.0071 instance_segmentation_loss_cls: 0.0277 instance_segmentation_loss_reg: 0.3187 instance_segmentation_loss_poly: 0.8151 +2023/11/07 16:59:30 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231106_193813 +2023/11/07 16:59:30 - mmengine - INFO - Iter(train) [582000/640000] base_lr: 5.9855e-06 lr: 2.3623e-06 eta: 18:02:10 time: 1.1204 data_time: 0.0328 memory: 21519 grad_norm: 4.2242 loss: 1.1551 caption_loss_cls: 1.9632 grounding_loss_reg: 2.2668 detection_loss_cls: 0.0279 detection_loss_reg: 0.3206 semantic_segmentation_loss_cls: 0.0072 instance_segmentation_loss_cls: 0.0276 instance_segmentation_loss_reg: 0.3189 instance_segmentation_loss_poly: 0.8148 +2023/11/07 16:59:30 - mmengine - INFO - Saving checkpoint at 582000 iterations +2023/11/07 17:09:08 - mmengine - INFO - Iter(train) [582500/640000] base_lr: 5.9175e-06 lr: 2.3561e-06 eta: 17:53:06 time: 1.1182 data_time: 0.0328 memory: 21519 grad_norm: 4.2250 loss: 1.1571 caption_loss_cls: 1.9642 grounding_loss_reg: 2.2666 detection_loss_cls: 0.0278 detection_loss_reg: 0.3200 semantic_segmentation_loss_cls: 0.0072 instance_segmentation_loss_cls: 0.0277 instance_segmentation_loss_reg: 0.3189 instance_segmentation_loss_poly: 0.8151 +2023/11/07 17:18:18 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231106_193813 +2023/11/07 17:18:18 - mmengine - INFO - Iter(train) [583000/640000] base_lr: 5.8501e-06 lr: 2.3500e-06 eta: 17:43:37 time: 1.1245 data_time: 0.0330 memory: 21519 grad_norm: 4.2122 loss: 1.1506 caption_loss_cls: 1.9637 grounding_loss_reg: 2.2656 detection_loss_cls: 0.0277 detection_loss_reg: 0.3188 semantic_segmentation_loss_cls: 0.0072 instance_segmentation_loss_cls: 0.0277 instance_segmentation_loss_reg: 0.3197 instance_segmentation_loss_poly: 0.8163 +2023/11/07 17:18:18 - mmengine - INFO - Saving checkpoint at 583000 iterations +2023/11/07 17:27:27 - mmengine - INFO - Iter(train) [583500/640000] base_lr: 5.7833e-06 lr: 2.3439e-06 eta: 17:34:08 time: 1.1203 data_time: 0.0330 memory: 21519 grad_norm: 4.2074 loss: 1.1486 caption_loss_cls: 1.9670 grounding_loss_reg: 2.2642 detection_loss_cls: 0.0278 detection_loss_reg: 0.3195 semantic_segmentation_loss_cls: 0.0072 instance_segmentation_loss_cls: 0.0277 instance_segmentation_loss_reg: 0.3195 instance_segmentation_loss_poly: 0.8162 +2023/11/07 17:36:42 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231106_193813 +2023/11/07 17:36:42 - mmengine - INFO - Iter(train) [584000/640000] base_lr: 5.7171e-06 lr: 2.3379e-06 eta: 17:24:43 time: 1.1235 data_time: 0.0330 memory: 21519 grad_norm: 4.1672 loss: 1.1435 caption_loss_cls: 1.9662 grounding_loss_reg: 2.2649 detection_loss_cls: 0.0277 detection_loss_reg: 0.3197 semantic_segmentation_loss_cls: 0.0072 instance_segmentation_loss_cls: 0.0278 instance_segmentation_loss_reg: 0.3202 instance_segmentation_loss_poly: 0.8174 +2023/11/07 17:36:42 - mmengine - INFO - Saving checkpoint at 584000 iterations +2023/11/07 17:45:55 - mmengine - INFO - Iter(train) [584500/640000] base_lr: 5.6514e-06 lr: 2.3319e-06 eta: 17:15:18 time: 1.1233 data_time: 0.0358 memory: 21519 grad_norm: 4.1597 loss: 1.1318 caption_loss_cls: 1.9633 grounding_loss_reg: 2.2630 detection_loss_cls: 0.0278 detection_loss_reg: 0.3194 semantic_segmentation_loss_cls: 0.0072 instance_segmentation_loss_cls: 0.0277 instance_segmentation_loss_reg: 0.3199 instance_segmentation_loss_poly: 0.8170 +2023/11/07 17:55:22 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231106_193813 +2023/11/07 17:55:22 - mmengine - INFO - Iter(train) [585000/640000] base_lr: 5.5863e-06 lr: 2.3260e-06 eta: 17:06:04 time: 1.1203 data_time: 0.0358 memory: 21519 grad_norm: 4.1377 loss: 1.1226 caption_loss_cls: 1.9633 grounding_loss_reg: 2.2615 detection_loss_cls: 0.0278 detection_loss_reg: 0.3195 semantic_segmentation_loss_cls: 0.0072 instance_segmentation_loss_cls: 0.0278 instance_segmentation_loss_reg: 0.3200 instance_segmentation_loss_poly: 0.8170 +2023/11/07 17:55:22 - mmengine - INFO - Saving checkpoint at 585000 iterations +2023/11/07 18:04:52 - mmengine - INFO - Iter(train) [585500/640000] base_lr: 5.5218e-06 lr: 2.3202e-06 eta: 16:56:52 time: 1.1203 data_time: 0.0358 memory: 21519 grad_norm: 4.1999 loss: 1.1365 caption_loss_cls: 1.9623 grounding_loss_reg: 2.2598 detection_loss_cls: 0.0279 detection_loss_reg: 0.3202 semantic_segmentation_loss_cls: 0.0072 instance_segmentation_loss_cls: 0.0278 instance_segmentation_loss_reg: 0.3201 instance_segmentation_loss_poly: 0.8163 +2023/11/07 18:14:22 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231106_193813 +2023/11/07 18:14:22 - mmengine - INFO - Iter(train) [586000/640000] base_lr: 5.4578e-06 lr: 2.3143e-06 eta: 16:47:40 time: 1.1221 data_time: 0.0358 memory: 21519 grad_norm: 4.1463 loss: 1.1336 caption_loss_cls: 1.9635 grounding_loss_reg: 2.2603 detection_loss_cls: 0.0279 detection_loss_reg: 0.3205 semantic_segmentation_loss_cls: 0.0072 instance_segmentation_loss_cls: 0.0277 instance_segmentation_loss_reg: 0.3196 instance_segmentation_loss_poly: 0.8153 +2023/11/07 18:14:22 - mmengine - INFO - Saving checkpoint at 586000 iterations +2023/11/07 18:23:51 - mmengine - INFO - Iter(train) [586500/640000] base_lr: 5.3945e-06 lr: 2.3086e-06 eta: 16:38:26 time: 1.1196 data_time: 0.0359 memory: 21519 grad_norm: 4.1817 loss: 1.1313 caption_loss_cls: 1.9630 grounding_loss_reg: 2.2624 detection_loss_cls: 0.0278 detection_loss_reg: 0.3202 semantic_segmentation_loss_cls: 0.0071 instance_segmentation_loss_cls: 0.0278 instance_segmentation_loss_reg: 0.3195 instance_segmentation_loss_poly: 0.8149 +2023/11/07 18:33:25 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231106_193813 +2023/11/07 18:33:25 - mmengine - INFO - Iter(train) [587000/640000] base_lr: 5.3317e-06 lr: 2.3029e-06 eta: 16:29:17 time: 1.1257 data_time: 0.0361 memory: 21519 grad_norm: 4.1920 loss: 1.1365 caption_loss_cls: 1.9623 grounding_loss_reg: 2.2618 detection_loss_cls: 0.0278 detection_loss_reg: 0.3199 semantic_segmentation_loss_cls: 0.0072 instance_segmentation_loss_cls: 0.0278 instance_segmentation_loss_reg: 0.3194 instance_segmentation_loss_poly: 0.8147 +2023/11/07 18:33:25 - mmengine - INFO - Saving checkpoint at 587000 iterations +2023/11/07 18:42:30 - mmengine - INFO - Iter(train) [587500/640000] base_lr: 5.2695e-06 lr: 2.2972e-06 eta: 16:19:45 time: 1.1245 data_time: 0.0361 memory: 21519 grad_norm: 4.2280 loss: 1.1351 caption_loss_cls: 1.9604 grounding_loss_reg: 2.2605 detection_loss_cls: 0.0278 detection_loss_reg: 0.3198 semantic_segmentation_loss_cls: 0.0072 instance_segmentation_loss_cls: 0.0278 instance_segmentation_loss_reg: 0.3195 instance_segmentation_loss_poly: 0.8144 +2023/11/07 18:51:57 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231106_193813 +2023/11/07 18:51:57 - mmengine - INFO - Iter(train) [588000/640000] base_lr: 5.2078e-06 lr: 2.2916e-06 eta: 16:10:31 time: 1.1278 data_time: 0.0361 memory: 21519 grad_norm: 4.2716 loss: 1.1392 caption_loss_cls: 1.9602 grounding_loss_reg: 2.2608 detection_loss_cls: 0.0278 detection_loss_reg: 0.3194 semantic_segmentation_loss_cls: 0.0072 instance_segmentation_loss_cls: 0.0277 instance_segmentation_loss_reg: 0.3191 instance_segmentation_loss_poly: 0.8136 +2023/11/07 18:51:57 - mmengine - INFO - Saving checkpoint at 588000 iterations +2023/11/07 19:01:12 - mmengine - INFO - Iter(train) [588500/640000] base_lr: 5.1467e-06 lr: 2.2861e-06 eta: 16:01:07 time: 1.1282 data_time: 0.0362 memory: 21519 grad_norm: 4.2611 loss: 1.1367 caption_loss_cls: 1.9579 grounding_loss_reg: 2.2621 detection_loss_cls: 0.0278 detection_loss_reg: 0.3198 semantic_segmentation_loss_cls: 0.0072 instance_segmentation_loss_cls: 0.0276 instance_segmentation_loss_reg: 0.3186 instance_segmentation_loss_poly: 0.8120 +2023/11/07 19:10:14 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231106_193813 +2023/11/07 19:10:14 - mmengine - INFO - Iter(train) [589000/640000] base_lr: 5.0863e-06 lr: 2.2806e-06 eta: 15:51:34 time: 1.1218 data_time: 0.0357 memory: 21519 grad_norm: 4.2921 loss: 1.1399 caption_loss_cls: 1.9583 grounding_loss_reg: 2.2639 detection_loss_cls: 0.0277 detection_loss_reg: 0.3190 semantic_segmentation_loss_cls: 0.0072 instance_segmentation_loss_cls: 0.0277 instance_segmentation_loss_reg: 0.3185 instance_segmentation_loss_poly: 0.8121 +2023/11/07 19:10:14 - mmengine - INFO - Saving checkpoint at 589000 iterations +2023/11/07 19:19:47 - mmengine - INFO - Iter(train) [589500/640000] base_lr: 5.0264e-06 lr: 2.2751e-06 eta: 15:42:23 time: 1.1227 data_time: 0.0360 memory: 21519 grad_norm: 4.2746 loss: 1.1404 caption_loss_cls: 1.9580 grounding_loss_reg: 2.2643 detection_loss_cls: 0.0276 detection_loss_reg: 0.3181 semantic_segmentation_loss_cls: 0.0072 instance_segmentation_loss_cls: 0.0277 instance_segmentation_loss_reg: 0.3187 instance_segmentation_loss_poly: 0.8125 +2023/11/07 19:29:14 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231106_193813 +2023/11/07 19:29:14 - mmengine - INFO - Iter(train) [590000/640000] base_lr: 4.9670e-06 lr: 2.2697e-06 eta: 15:33:08 time: 1.1219 data_time: 0.0359 memory: 21519 grad_norm: 4.2917 loss: 1.1414 caption_loss_cls: 1.9598 grounding_loss_reg: 2.2615 detection_loss_cls: 0.0276 detection_loss_reg: 0.3181 semantic_segmentation_loss_cls: 0.0072 instance_segmentation_loss_cls: 0.0277 instance_segmentation_loss_reg: 0.3184 instance_segmentation_loss_poly: 0.8121 +2023/11/07 19:29:14 - mmengine - INFO - Saving checkpoint at 590000 iterations +2023/11/08 02:53:08 - mmengine - INFO - Iter(train) [590500/640000] base_lr: 4.9083e-06 lr: 2.2644e-06 eta: 15:11:26 time: 1.1180 data_time: 0.0324 memory: 21524 grad_norm: 4.2677 loss: 1.1385 caption_loss_cls: 1.9570 grounding_loss_reg: 2.2583 detection_loss_cls: 0.0276 detection_loss_reg: 0.3185 semantic_segmentation_loss_cls: 0.0072 instance_segmentation_loss_cls: 0.0276 instance_segmentation_loss_reg: 0.3184 instance_segmentation_loss_poly: 0.8119 +2023/11/08 03:02:07 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231108_024040 +2023/11/08 03:02:07 - mmengine - INFO - Iter(train) [591000/640000] base_lr: 4.8501e-06 lr: 2.2591e-06 eta: 14:50:59 time: 1.1093 data_time: 0.0321 memory: 21523 grad_norm: 4.3133 loss: 1.1266 caption_loss_cls: 1.9521 grounding_loss_reg: 2.2526 detection_loss_cls: 0.0275 detection_loss_reg: 0.3178 semantic_segmentation_loss_cls: 0.0072 instance_segmentation_loss_cls: 0.0275 instance_segmentation_loss_reg: 0.3180 instance_segmentation_loss_poly: 0.8106 +2023/11/08 03:02:07 - mmengine - INFO - Saving checkpoint at 591000 iterations +2023/11/08 03:11:23 - mmengine - INFO - Iter(train) [591500/640000] base_lr: 4.7925e-06 lr: 2.2539e-06 eta: 14:47:13 time: 1.1121 data_time: 0.0319 memory: 21523 grad_norm: 4.2846 loss: 1.1203 caption_loss_cls: 1.9515 grounding_loss_reg: 2.2507 detection_loss_cls: 0.0274 detection_loss_reg: 0.3170 semantic_segmentation_loss_cls: 0.0072 instance_segmentation_loss_cls: 0.0274 instance_segmentation_loss_reg: 0.3172 instance_segmentation_loss_poly: 0.8092 +2023/11/08 03:20:00 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231108_024040 +2023/11/08 03:20:00 - mmengine - INFO - Iter(train) [592000/640000] base_lr: 4.7355e-06 lr: 2.2487e-06 eta: 14:24:51 time: 1.0992 data_time: 0.0314 memory: 21523 grad_norm: 4.2851 loss: 1.1177 caption_loss_cls: 1.9512 grounding_loss_reg: 2.2506 detection_loss_cls: 0.0273 detection_loss_reg: 0.3159 semantic_segmentation_loss_cls: 0.0071 instance_segmentation_loss_cls: 0.0274 instance_segmentation_loss_reg: 0.3170 instance_segmentation_loss_poly: 0.8090 +2023/11/08 03:20:00 - mmengine - INFO - Saving checkpoint at 592000 iterations +2023/11/08 03:29:16 - mmengine - INFO - Iter(train) [592500/640000] base_lr: 4.6791e-06 lr: 2.2436e-06 eta: 14:20:41 time: 1.0997 data_time: 0.0314 memory: 21523 grad_norm: 4.2404 loss: 1.1145 caption_loss_cls: 1.9501 grounding_loss_reg: 2.2479 detection_loss_cls: 0.0272 detection_loss_reg: 0.3153 semantic_segmentation_loss_cls: 0.0071 instance_segmentation_loss_cls: 0.0274 instance_segmentation_loss_reg: 0.3165 instance_segmentation_loss_poly: 0.8080 +2023/11/08 03:38:30 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231108_024040 +2023/11/08 03:38:30 - mmengine - INFO - Iter(train) [593000/640000] base_lr: 4.6232e-06 lr: 2.2385e-06 eta: 14:14:20 time: 1.1028 data_time: 0.0315 memory: 21523 grad_norm: 4.2352 loss: 1.1134 caption_loss_cls: 1.9514 grounding_loss_reg: 2.2464 detection_loss_cls: 0.0272 detection_loss_reg: 0.3156 semantic_segmentation_loss_cls: 0.0071 instance_segmentation_loss_cls: 0.0274 instance_segmentation_loss_reg: 0.3164 instance_segmentation_loss_poly: 0.8087 +2023/11/08 03:38:30 - mmengine - INFO - Saving checkpoint at 593000 iterations +2023/11/08 03:48:01 - mmengine - INFO - Iter(train) [593500/640000] base_lr: 4.5679e-06 lr: 2.2334e-06 eta: 14:10:48 time: 1.1022 data_time: 0.0314 memory: 21523 grad_norm: 4.1794 loss: 1.1027 caption_loss_cls: 1.9508 grounding_loss_reg: 2.2429 detection_loss_cls: 0.0273 detection_loss_reg: 0.3162 semantic_segmentation_loss_cls: 0.0071 instance_segmentation_loss_cls: 0.0275 instance_segmentation_loss_reg: 0.3173 instance_segmentation_loss_poly: 0.8104 +2023/11/08 03:57:03 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231108_024040 +2023/11/08 03:57:03 - mmengine - INFO - Iter(train) [594000/640000] base_lr: 4.5132e-06 lr: 2.2285e-06 eta: 14:00:14 time: 1.0960 data_time: 0.0313 memory: 21523 grad_norm: 4.2377 loss: 1.1079 caption_loss_cls: 1.9499 grounding_loss_reg: 2.2419 detection_loss_cls: 0.0273 detection_loss_reg: 0.3166 semantic_segmentation_loss_cls: 0.0071 instance_segmentation_loss_cls: 0.0276 instance_segmentation_loss_reg: 0.3167 instance_segmentation_loss_poly: 0.8105 +2023/11/08 03:57:03 - mmengine - INFO - Saving checkpoint at 594000 iterations +2023/11/08 04:06:28 - mmengine - INFO - Iter(train) [594500/640000] base_lr: 4.4591e-06 lr: 2.2236e-06 eta: 13:53:50 time: 1.0989 data_time: 0.0347 memory: 21523 grad_norm: 4.2641 loss: 1.1118 caption_loss_cls: 1.9496 grounding_loss_reg: 2.2393 detection_loss_cls: 0.0273 detection_loss_reg: 0.3173 semantic_segmentation_loss_cls: 0.0071 instance_segmentation_loss_cls: 0.0277 instance_segmentation_loss_reg: 0.3170 instance_segmentation_loss_poly: 0.8108 +2023/11/08 04:14:21 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231108_024040 +2023/11/08 04:14:21 - mmengine - INFO - Iter(train) [595000/640000] base_lr: 4.4056e-06 lr: 2.2187e-06 eta: 13:33:06 time: 1.0824 data_time: 0.0344 memory: 21523 grad_norm: 4.3317 loss: 1.1360 caption_loss_cls: 1.9555 grounding_loss_reg: 2.2366 detection_loss_cls: 0.0273 detection_loss_reg: 0.3169 semantic_segmentation_loss_cls: 0.0071 instance_segmentation_loss_cls: 0.0277 instance_segmentation_loss_reg: 0.3174 instance_segmentation_loss_poly: 0.8119 +2023/11/08 04:14:21 - mmengine - INFO - Saving checkpoint at 595000 iterations +2023/11/08 04:23:51 - mmengine - INFO - Iter(train) [595500/640000] base_lr: 4.3526e-06 lr: 2.2139e-06 eta: 13:27:44 time: 1.0859 data_time: 0.0346 memory: 21523 grad_norm: 4.3531 loss: 1.1417 caption_loss_cls: 1.9550 grounding_loss_reg: 2.2368 detection_loss_cls: 0.0272 detection_loss_reg: 0.3170 semantic_segmentation_loss_cls: 0.0071 instance_segmentation_loss_cls: 0.0276 instance_segmentation_loss_reg: 0.3168 instance_segmentation_loss_poly: 0.8104 +2023/11/08 04:33:15 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231108_024040 +2023/11/08 04:33:15 - mmengine - INFO - Iter(train) [596000/640000] base_lr: 4.3003e-06 lr: 2.2091e-06 eta: 13:20:58 time: 1.0978 data_time: 0.0348 memory: 21523 grad_norm: 4.2846 loss: 1.1233 caption_loss_cls: 1.9527 grounding_loss_reg: 2.2369 detection_loss_cls: 0.0273 detection_loss_reg: 0.3169 semantic_segmentation_loss_cls: 0.0071 instance_segmentation_loss_cls: 0.0276 instance_segmentation_loss_reg: 0.3166 instance_segmentation_loss_poly: 0.8096 +2023/11/08 04:33:15 - mmengine - INFO - Saving checkpoint at 596000 iterations +2023/11/08 04:42:46 - mmengine - INFO - Iter(train) [596500/640000] base_lr: 4.2485e-06 lr: 2.2044e-06 eta: 13:14:34 time: 1.1014 data_time: 0.0351 memory: 21523 grad_norm: 4.3560 loss: 1.1271 caption_loss_cls: 1.9538 grounding_loss_reg: 2.2339 detection_loss_cls: 0.0273 detection_loss_reg: 0.3162 semantic_segmentation_loss_cls: 0.0071 instance_segmentation_loss_cls: 0.0276 instance_segmentation_loss_reg: 0.3163 instance_segmentation_loss_poly: 0.8092 +2023/11/08 04:51:45 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231108_024040 +2023/11/08 04:51:45 - mmengine - INFO - Iter(train) [597000/640000] base_lr: 4.1973e-06 lr: 2.1998e-06 eta: 13:04:28 time: 1.0976 data_time: 0.0350 memory: 21523 grad_norm: 4.3626 loss: 1.1283 caption_loss_cls: 1.9533 grounding_loss_reg: 2.2342 detection_loss_cls: 0.0273 detection_loss_reg: 0.3166 semantic_segmentation_loss_cls: 0.0071 instance_segmentation_loss_cls: 0.0276 instance_segmentation_loss_reg: 0.3162 instance_segmentation_loss_poly: 0.8092 +2023/11/08 04:51:45 - mmengine - INFO - Saving checkpoint at 597000 iterations +2023/11/08 05:00:07 - mmengine - INFO - Iter(train) [597500/640000] base_lr: 4.1467e-06 lr: 2.1952e-06 eta: 12:50:59 time: 1.0803 data_time: 0.0346 memory: 21523 grad_norm: 4.4853 loss: 1.1391 caption_loss_cls: 1.9499 grounding_loss_reg: 2.2347 detection_loss_cls: 0.0273 detection_loss_reg: 0.3169 semantic_segmentation_loss_cls: 0.0071 instance_segmentation_loss_cls: 0.0276 instance_segmentation_loss_reg: 0.3165 instance_segmentation_loss_poly: 0.8094 +2023/11/08 05:08:39 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231108_024040 +2023/11/08 05:08:39 - mmengine - INFO - Iter(train) [598000/640000] base_lr: 4.0966e-06 lr: 2.1906e-06 eta: 12:39:04 time: 1.0728 data_time: 0.0345 memory: 21523 grad_norm: 4.5257 loss: 1.1506 caption_loss_cls: 1.9513 grounding_loss_reg: 2.2362 detection_loss_cls: 0.0274 detection_loss_reg: 0.3177 semantic_segmentation_loss_cls: 0.0071 instance_segmentation_loss_cls: 0.0276 instance_segmentation_loss_reg: 0.3173 instance_segmentation_loss_poly: 0.8115 +2023/11/08 05:08:39 - mmengine - INFO - Saving checkpoint at 598000 iterations +2023/11/08 05:17:27 - mmengine - INFO - Iter(train) [598500/640000] base_lr: 4.0472e-06 lr: 2.1861e-06 eta: 12:28:52 time: 1.0637 data_time: 0.0341 memory: 21523 grad_norm: 4.5719 loss: 1.1579 caption_loss_cls: 1.9481 grounding_loss_reg: 2.2351 detection_loss_cls: 0.0274 detection_loss_reg: 0.3174 semantic_segmentation_loss_cls: 0.0071 instance_segmentation_loss_cls: 0.0276 instance_segmentation_loss_reg: 0.3168 instance_segmentation_loss_poly: 0.8105 +2023/11/08 05:26:29 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231108_024040 +2023/11/08 05:26:29 - mmengine - INFO - Iter(train) [599000/640000] base_lr: 3.9983e-06 lr: 2.1817e-06 eta: 12:19:48 time: 1.0808 data_time: 0.0347 memory: 21523 grad_norm: 4.4854 loss: 1.1470 caption_loss_cls: 1.9463 grounding_loss_reg: 2.2350 detection_loss_cls: 0.0273 detection_loss_reg: 0.3172 semantic_segmentation_loss_cls: 0.0071 instance_segmentation_loss_cls: 0.0275 instance_segmentation_loss_reg: 0.3165 instance_segmentation_loss_poly: 0.8100 +2023/11/08 05:26:29 - mmengine - INFO - Saving checkpoint at 599000 iterations +2023/11/08 05:35:25 - mmengine - INFO - Iter(train) [599500/640000] base_lr: 3.9500e-06 lr: 2.1773e-06 eta: 12:10:24 time: 1.0724 data_time: 0.0345 memory: 21523 grad_norm: 4.5039 loss: 1.1499 caption_loss_cls: 1.9487 grounding_loss_reg: 2.2345 detection_loss_cls: 0.0273 detection_loss_reg: 0.3167 semantic_segmentation_loss_cls: 0.0071 instance_segmentation_loss_cls: 0.0275 instance_segmentation_loss_reg: 0.3160 instance_segmentation_loss_poly: 0.8095 +2023/11/08 05:44:09 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231108_024040 +2023/11/08 05:44:09 - mmengine - INFO - Iter(train) [600000/640000] base_lr: 3.9024e-06 lr: 2.1729e-06 eta: 12:00:12 time: 1.0624 data_time: 0.0346 memory: 21523 grad_norm: 4.6164 loss: 1.1715 caption_loss_cls: 1.9419 grounding_loss_reg: 2.2362 detection_loss_cls: 0.0273 detection_loss_reg: 0.3161 semantic_segmentation_loss_cls: 0.0071 instance_segmentation_loss_cls: 0.0275 instance_segmentation_loss_reg: 0.3152 instance_segmentation_loss_poly: 0.8085 +2023/11/08 05:44:09 - mmengine - INFO - Saving checkpoint at 600000 iterations +2023/11/08 05:52:49 - mmengine - INFO - Evaluating bbox... +2023/11/08 05:53:46 - mmengine - INFO - bbox_mAP_copypaste: 0.467 0.643 0.506 0.292 0.515 0.614 +2023/11/08 05:53:46 - mmengine - INFO - Evaluating segm... +2023/11/08 05:54:59 - mmengine - INFO - segm_mAP_copypaste: 0.318 0.561 0.313 0.161 0.363 0.489 +2023/11/08 06:00:09 - mmengine - INFO - per class results: +2023/11/08 06:00:09 - mmengine - INFO - ++---------------------+-------+-------+ +| Class | IoU | Acc | ++---------------------+-------+-------+ +| wall | 75.98 | 88.09 | +| building | 80.27 | 90.35 | +| sky | 92.88 | 97.7 | +| floor | 80.65 | 90.24 | +| tree | 73.33 | 85.25 | +| ceiling | 83.4 | 94.2 | +| road | 82.83 | 91.53 | +| bed | 87.96 | 94.45 | +| windowpane | 60.25 | 77.71 | +| grass | 66.6 | 83.26 | +| cabinet | 60.89 | 72.76 | +| sidewalk | 66.47 | 77.06 | +| person | 79.51 | 91.09 | +| earth | 38.15 | 51.65 | +| door | 49.69 | 63.97 | +| table | 58.97 | 74.06 | +| mountain | 58.03 | 75.17 | +| plant | 52.78 | 65.22 | +| curtain | 67.4 | 83.27 | +| chair | 57.38 | 71.67 | +| car | 82.25 | 89.95 | +| water | 51.93 | 65.21 | +| painting | 71.52 | 86.78 | +| sofa | 66.88 | 80.66 | +| shelf | 43.03 | 63.27 | +| house | 43.8 | 67.44 | +| sea | 50.72 | 73.77 | +| mirror | 64.46 | 73.51 | +| rug | 63.5 | 72.49 | +| field | 30.06 | 43.21 | +| armchair | 43.99 | 63.28 | +| seat | 63.36 | 81.18 | +| fence | 42.52 | 57.1 | +| desk | 44.83 | 66.26 | +| rock | 35.48 | 51.85 | +| wardrobe | 46.03 | 60.34 | +| lamp | 60.67 | 73.75 | +| bathtub | 78.45 | 87.06 | +| railing | 27.0 | 40.73 | +| cushion | 57.44 | 69.16 | +| base | 25.16 | 35.32 | +| box | 25.42 | 32.52 | +| column | 48.14 | 59.74 | +| signboard | 37.28 | 50.39 | +| chest of drawers | 34.3 | 53.79 | +| counter | 31.68 | 44.38 | +| sand | 36.07 | 49.84 | +| sink | 72.48 | 79.1 | +| skyscraper | 37.99 | 45.74 | +| fireplace | 74.27 | 86.35 | +| refrigerator | 75.02 | 82.18 | +| grandstand | 35.21 | 67.38 | +| path | 25.31 | 35.02 | +| stairs | 26.17 | 33.82 | +| runway | 64.29 | 81.13 | +| case | 41.84 | 54.71 | +| pool table | 88.52 | 95.44 | +| pillow | 57.97 | 72.32 | +| screen door | 69.13 | 75.61 | +| stairway | 31.5 | 39.36 | +| river | 14.31 | 30.96 | +| bridge | 66.26 | 78.92 | +| bookcase | 35.1 | 57.99 | +| blind | 21.42 | 22.85 | +| coffee table | 65.96 | 81.52 | +| toilet | 84.27 | 88.93 | +| flower | 34.76 | 46.84 | +| book | 45.4 | 66.79 | +| hill | 10.88 | 19.99 | +| bench | 43.64 | 48.83 | +| countertop | 47.97 | 62.67 | +| stove | 77.23 | 83.75 | +| palm | 44.22 | 57.31 | +| kitchen island | 39.44 | 70.22 | +| computer | 72.04 | 82.68 | +| swivel chair | 45.02 | 56.93 | +| boat | 72.84 | 86.84 | +| bar | 48.01 | 58.26 | +| arcade machine | 38.26 | 40.27 | +| hovel | 12.85 | 14.64 | +| bus | 86.36 | 95.03 | +| towel | 61.81 | 73.38 | +| light | 48.34 | 57.18 | +| truck | 40.14 | 46.02 | +| tower | 31.5 | 40.94 | +| chandelier | 62.54 | 76.79 | +| awning | 21.44 | 25.12 | +| streetlight | 28.55 | 35.99 | +| booth | 51.51 | 52.82 | +| television receiver | 70.12 | 80.56 | +| airplane | 55.28 | 65.93 | +| dirt track | 0.79 | 3.52 | +| apparel | 37.17 | 56.08 | +| pole | 31.24 | 44.36 | +| land | 2.31 | 3.27 | +| bannister | 13.72 | 18.45 | +| escalator | 32.24 | 35.69 | +| ottoman | 45.54 | 65.98 | +| bottle | 27.46 | 34.01 | +| buffet | 43.3 | 48.68 | +| poster | 28.14 | 38.34 | +| stage | 12.7 | 20.65 | +| van | 34.47 | 46.02 | +| ship | 73.98 | 81.19 | +| fountain | 12.56 | 12.89 | +| conveyer belt | 79.73 | 87.71 | +| canopy | 26.88 | 31.57 | +| washer | 67.71 | 71.88 | +| plaything | 36.23 | 51.67 | +| swimming pool | 56.37 | 71.92 | +| stool | 42.52 | 54.38 | +| barrel | 16.83 | 31.55 | +| basket | 28.16 | 40.94 | +| waterfall | 55.54 | 74.28 | +| tent | 93.0 | 97.53 | +| bag | 13.95 | 15.97 | +| minibike | 72.53 | 81.02 | +| cradle | 75.04 | 92.41 | +| oven | 45.07 | 58.68 | +| ball | 40.07 | 44.2 | +| food | 58.46 | 65.19 | +| step | 15.27 | 17.65 | +| tank | 41.82 | 45.91 | +| trade name | 23.57 | 27.37 | +| microwave | 83.15 | 90.19 | +| pot | 46.04 | 51.6 | +| animal | 62.17 | 66.13 | +| bicycle | 55.24 | 71.41 | +| lake | 62.02 | 67.32 | +| dishwasher | 54.66 | 75.6 | +| screen | 58.83 | 86.12 | +| blanket | 13.52 | 16.51 | +| sculpture | 54.36 | 63.49 | +| hood | 59.43 | 64.64 | +| sconce | 34.82 | 43.23 | +| vase | 42.66 | 54.88 | +| traffic light | 36.23 | 54.22 | +| tray | 10.55 | 17.82 | +| ashcan | 39.22 | 55.1 | +| fan | 57.22 | 70.94 | +| pier | 39.83 | 56.61 | +| crt screen | 5.31 | 14.23 | +| plate | 55.36 | 72.15 | +| monitor | 18.94 | 22.47 | +| bulletin board | 31.91 | 40.18 | +| shower | 4.26 | 11.91 | +| radiator | 50.81 | 56.46 | +| glass | 16.38 | 17.73 | +| clock | 26.29 | 31.89 | +| flag | 29.61 | 34.44 | ++---------------------+-------+-------+ +2023/11/08 06:00:26 - mmengine - INFO - Iter(val) [209/209] coco/bbox_mAP: 0.4670 coco/bbox_mAP_50: 0.6430 coco/bbox_mAP_75: 0.5060 coco/bbox_mAP_s: 0.2920 coco/bbox_mAP_m: 0.5150 coco/bbox_mAP_l: 0.6140 coco/segm_mAP: 0.3180 coco/segm_mAP_50: 0.5610 coco/segm_mAP_75: 0.3130 coco/segm_mAP_s: 0.1610 coco/segm_mAP_m: 0.3630 coco/segm_mAP_l: 0.4890 Bleu_1: 0.7562 Bleu_2: 0.5955 Bleu_3: 0.4569 Bleu_4: 0.3478 METEOR: 0.2713 ROUGE_L: 0.5584 CIDEr: 1.1073 SPICE: 0.2025 aAcc: 82.2800 mIoU: 47.9300 mAcc: 58.9700 visual-grounding/miou: 0.7889 visual-grounding/acc: 0.8565 data_time: 0.0104 time: 0.5277 +2023/11/08 06:09:24 - mmengine - INFO - Iter(train) [600500/640000] base_lr: 3.8552e-06 lr: 2.1687e-06 eta: 11:51:07 time: 1.0545 data_time: 0.0316 memory: 21524 grad_norm: 4.6403 loss: 1.1757 caption_loss_cls: 1.9389 grounding_loss_reg: 2.2338 detection_loss_cls: 0.0273 detection_loss_reg: 0.3152 semantic_segmentation_loss_cls: 0.0071 instance_segmentation_loss_cls: 0.0274 instance_segmentation_loss_reg: 0.3146 instance_segmentation_loss_poly: 0.8074 +2023/11/08 06:17:49 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231108_024040 +2023/11/08 06:17:49 - mmengine - INFO - Iter(train) [601000/640000] base_lr: 3.8087e-06 lr: 2.1644e-06 eta: 11:40:01 time: 1.0461 data_time: 0.0316 memory: 21523 grad_norm: 4.6715 loss: 1.1839 caption_loss_cls: 1.9414 grounding_loss_reg: 2.2339 detection_loss_cls: 0.0273 detection_loss_reg: 0.3148 semantic_segmentation_loss_cls: 0.0071 instance_segmentation_loss_cls: 0.0274 instance_segmentation_loss_reg: 0.3140 instance_segmentation_loss_poly: 0.8065 +2023/11/08 06:17:49 - mmengine - INFO - Saving checkpoint at 601000 iterations +2023/11/08 06:26:51 - mmengine - INFO - Iter(train) [601500/640000] base_lr: 3.7628e-06 lr: 2.1603e-06 eta: 11:31:15 time: 1.0564 data_time: 0.0322 memory: 21523 grad_norm: 4.6487 loss: 1.1854 caption_loss_cls: 1.9416 grounding_loss_reg: 2.2324 detection_loss_cls: 0.0272 detection_loss_reg: 0.3147 semantic_segmentation_loss_cls: 0.0071 instance_segmentation_loss_cls: 0.0274 instance_segmentation_loss_reg: 0.3139 instance_segmentation_loss_poly: 0.8065 +2023/11/08 06:35:50 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231108_024040 +2023/11/08 06:35:50 - mmengine - INFO - Iter(train) [602000/640000] base_lr: 3.7174e-06 lr: 2.1561e-06 eta: 11:22:15 time: 1.0630 data_time: 0.0324 memory: 21523 grad_norm: 4.5758 loss: 1.1611 caption_loss_cls: 1.9404 grounding_loss_reg: 2.2305 detection_loss_cls: 0.0272 detection_loss_reg: 0.3146 semantic_segmentation_loss_cls: 0.0071 instance_segmentation_loss_cls: 0.0275 instance_segmentation_loss_reg: 0.3142 instance_segmentation_loss_poly: 0.8065 +2023/11/08 06:35:50 - mmengine - INFO - Saving checkpoint at 602000 iterations +2023/11/08 06:45:21 - mmengine - INFO - Iter(train) [602500/640000] base_lr: 3.6726e-06 lr: 2.1521e-06 eta: 11:14:51 time: 1.0736 data_time: 0.0328 memory: 21523 grad_norm: 4.5417 loss: 1.1493 caption_loss_cls: 1.9373 grounding_loss_reg: 2.2294 detection_loss_cls: 0.0271 detection_loss_reg: 0.3144 semantic_segmentation_loss_cls: 0.0071 instance_segmentation_loss_cls: 0.0274 instance_segmentation_loss_reg: 0.3137 instance_segmentation_loss_poly: 0.8050 +2023/11/08 06:54:21 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231108_024040 +2023/11/08 06:54:21 - mmengine - INFO - Iter(train) [603000/640000] base_lr: 3.6285e-06 lr: 2.1480e-06 eta: 11:05:51 time: 1.0733 data_time: 0.0330 memory: 21523 grad_norm: 4.5453 loss: 1.1484 caption_loss_cls: 1.9366 grounding_loss_reg: 2.2275 detection_loss_cls: 0.0272 detection_loss_reg: 0.3148 semantic_segmentation_loss_cls: 0.0071 instance_segmentation_loss_cls: 0.0274 instance_segmentation_loss_reg: 0.3131 instance_segmentation_loss_poly: 0.8043 +2023/11/08 06:54:21 - mmengine - INFO - Saving checkpoint at 603000 iterations +2023/11/08 07:03:43 - mmengine - INFO - Iter(train) [603500/640000] base_lr: 3.5849e-06 lr: 2.1441e-06 eta: 10:57:49 time: 1.0797 data_time: 0.0336 memory: 21523 grad_norm: 4.5025 loss: 1.1457 caption_loss_cls: 1.9356 grounding_loss_reg: 2.2275 detection_loss_cls: 0.0272 detection_loss_reg: 0.3147 semantic_segmentation_loss_cls: 0.0071 instance_segmentation_loss_cls: 0.0274 instance_segmentation_loss_reg: 0.3131 instance_segmentation_loss_poly: 0.8046 +2023/11/08 07:12:33 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231108_024040 +2023/11/08 07:12:33 - mmengine - INFO - Iter(train) [604000/640000] base_lr: 3.5419e-06 lr: 2.1402e-06 eta: 10:48:20 time: 1.0812 data_time: 0.0338 memory: 21523 grad_norm: 4.4661 loss: 1.1348 caption_loss_cls: 1.9363 grounding_loss_reg: 2.2259 detection_loss_cls: 0.0271 detection_loss_reg: 0.3144 semantic_segmentation_loss_cls: 0.0071 instance_segmentation_loss_cls: 0.0274 instance_segmentation_loss_reg: 0.3127 instance_segmentation_loss_poly: 0.8029 +2023/11/08 07:12:33 - mmengine - INFO - Saving checkpoint at 604000 iterations +2023/11/08 07:21:54 - mmengine - INFO - Iter(train) [604500/640000] base_lr: 3.4994e-06 lr: 2.1363e-06 eta: 10:40:09 time: 1.0866 data_time: 0.0367 memory: 21523 grad_norm: 4.3868 loss: 1.1206 caption_loss_cls: 1.9361 grounding_loss_reg: 2.2266 detection_loss_cls: 0.0270 detection_loss_reg: 0.3133 semantic_segmentation_loss_cls: 0.0071 instance_segmentation_loss_cls: 0.0273 instance_segmentation_loss_reg: 0.3117 instance_segmentation_loss_poly: 0.8012 +2023/11/08 07:31:05 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231108_024040 +2023/11/08 07:31:05 - mmengine - INFO - Iter(train) [605000/640000] base_lr: 3.4576e-06 lr: 2.1325e-06 eta: 10:31:30 time: 1.0980 data_time: 0.0370 memory: 21523 grad_norm: 4.3794 loss: 1.1194 caption_loss_cls: 1.9346 grounding_loss_reg: 2.2255 detection_loss_cls: 0.0271 detection_loss_reg: 0.3141 semantic_segmentation_loss_cls: 0.0071 instance_segmentation_loss_cls: 0.0273 instance_segmentation_loss_reg: 0.3123 instance_segmentation_loss_poly: 0.8018 +2023/11/08 07:31:05 - mmengine - INFO - Saving checkpoint at 605000 iterations +2023/11/08 07:40:18 - mmengine - INFO - Iter(train) [605500/640000] base_lr: 3.4163e-06 lr: 2.1288e-06 eta: 10:22:54 time: 1.1006 data_time: 0.0370 memory: 21523 grad_norm: 4.4036 loss: 1.1224 caption_loss_cls: 1.9342 grounding_loss_reg: 2.2252 detection_loss_cls: 0.0272 detection_loss_reg: 0.3141 semantic_segmentation_loss_cls: 0.0071 instance_segmentation_loss_cls: 0.0274 instance_segmentation_loss_reg: 0.3127 instance_segmentation_loss_poly: 0.8034 +2023/11/08 07:49:36 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231108_024040 +2023/11/08 07:49:36 - mmengine - INFO - Iter(train) [606000/640000] base_lr: 3.3757e-06 lr: 2.1251e-06 eta: 10:14:25 time: 1.1053 data_time: 0.0371 memory: 21523 grad_norm: 4.4208 loss: 1.1252 caption_loss_cls: 1.9302 grounding_loss_reg: 2.2246 detection_loss_cls: 0.0271 detection_loss_reg: 0.3137 semantic_segmentation_loss_cls: 0.0071 instance_segmentation_loss_cls: 0.0273 instance_segmentation_loss_reg: 0.3124 instance_segmentation_loss_poly: 0.8028 +2023/11/08 07:49:36 - mmengine - INFO - Saving checkpoint at 606000 iterations +2023/11/08 07:58:22 - mmengine - INFO - Iter(train) [606500/640000] base_lr: 3.3356e-06 lr: 2.1214e-06 eta: 10:04:49 time: 1.0941 data_time: 0.0371 memory: 21523 grad_norm: 4.4746 loss: 1.1369 caption_loss_cls: 1.9304 grounding_loss_reg: 2.2242 detection_loss_cls: 0.0271 detection_loss_reg: 0.3132 semantic_segmentation_loss_cls: 0.0071 instance_segmentation_loss_cls: 0.0272 instance_segmentation_loss_reg: 0.3129 instance_segmentation_loss_poly: 0.8037 +2023/11/08 08:06:55 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231108_024040 +2023/11/08 08:06:55 - mmengine - INFO - Iter(train) [607000/640000] base_lr: 3.2961e-06 lr: 2.1178e-06 eta: 9:54:51 time: 1.0873 data_time: 0.0366 memory: 21523 grad_norm: 4.4868 loss: 1.1274 caption_loss_cls: 1.9300 grounding_loss_reg: 2.2224 detection_loss_cls: 0.0270 detection_loss_reg: 0.3131 semantic_segmentation_loss_cls: 0.0070 instance_segmentation_loss_cls: 0.0272 instance_segmentation_loss_reg: 0.3125 instance_segmentation_loss_poly: 0.8027 +2023/11/08 08:06:55 - mmengine - INFO - Saving checkpoint at 607000 iterations +2023/11/08 08:16:06 - mmengine - INFO - Iter(train) [607500/640000] base_lr: 3.2572e-06 lr: 2.1143e-06 eta: 9:46:08 time: 1.0847 data_time: 0.0364 memory: 21523 grad_norm: 4.4794 loss: 1.1252 caption_loss_cls: 1.9284 grounding_loss_reg: 2.2218 detection_loss_cls: 0.0271 detection_loss_reg: 0.3141 semantic_segmentation_loss_cls: 0.0071 instance_segmentation_loss_cls: 0.0272 instance_segmentation_loss_reg: 0.3125 instance_segmentation_loss_poly: 0.8027 +2023/11/08 08:24:55 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231108_024040 +2023/11/08 08:24:55 - mmengine - INFO - Iter(train) [608000/640000] base_lr: 3.2189e-06 lr: 2.1108e-06 eta: 9:36:44 time: 1.0843 data_time: 0.0364 memory: 21523 grad_norm: 4.5071 loss: 1.1338 caption_loss_cls: 1.9283 grounding_loss_reg: 2.2206 detection_loss_cls: 0.0270 detection_loss_reg: 0.3133 semantic_segmentation_loss_cls: 0.0071 instance_segmentation_loss_cls: 0.0272 instance_segmentation_loss_reg: 0.3126 instance_segmentation_loss_poly: 0.8030 +2023/11/08 08:24:55 - mmengine - INFO - Saving checkpoint at 608000 iterations +2023/11/08 08:34:11 - mmengine - INFO - Iter(train) [608500/640000] base_lr: 3.1812e-06 lr: 2.1074e-06 eta: 9:28:08 time: 1.0831 data_time: 0.0364 memory: 21523 grad_norm: 4.5433 loss: 1.1426 caption_loss_cls: 1.9289 grounding_loss_reg: 2.2207 detection_loss_cls: 0.0270 detection_loss_reg: 0.3130 semantic_segmentation_loss_cls: 0.0071 instance_segmentation_loss_cls: 0.0272 instance_segmentation_loss_reg: 0.3125 instance_segmentation_loss_poly: 0.8019 +2023/11/08 08:43:12 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231108_024040 +2023/11/08 08:43:12 - mmengine - INFO - Iter(train) [609000/640000] base_lr: 3.1441e-06 lr: 2.1040e-06 eta: 9:19:07 time: 1.0806 data_time: 0.0363 memory: 21523 grad_norm: 4.5413 loss: 1.1360 caption_loss_cls: 1.9296 grounding_loss_reg: 2.2190 detection_loss_cls: 0.0270 detection_loss_reg: 0.3128 semantic_segmentation_loss_cls: 0.0070 instance_segmentation_loss_cls: 0.0272 instance_segmentation_loss_reg: 0.3121 instance_segmentation_loss_poly: 0.8016 +2023/11/08 08:43:12 - mmengine - INFO - Saving checkpoint at 609000 iterations +2023/11/08 08:52:05 - mmengine - INFO - Iter(train) [609500/640000] base_lr: 3.1075e-06 lr: 2.1007e-06 eta: 9:09:52 time: 1.0755 data_time: 0.0358 memory: 21523 grad_norm: 4.5169 loss: 1.1242 caption_loss_cls: 1.9275 grounding_loss_reg: 2.2193 detection_loss_cls: 0.0270 detection_loss_reg: 0.3127 semantic_segmentation_loss_cls: 0.0070 instance_segmentation_loss_cls: 0.0272 instance_segmentation_loss_reg: 0.3125 instance_segmentation_loss_poly: 0.8022 +2023/11/08 09:00:59 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231108_024040 +2023/11/08 09:00:59 - mmengine - INFO - Iter(train) [610000/640000] base_lr: 3.0716e-06 lr: 2.0974e-06 eta: 9:00:40 time: 1.0697 data_time: 0.0357 memory: 21523 grad_norm: 4.5155 loss: 1.1266 caption_loss_cls: 1.9249 grounding_loss_reg: 2.2193 detection_loss_cls: 0.0271 detection_loss_reg: 0.3130 semantic_segmentation_loss_cls: 0.0071 instance_segmentation_loss_cls: 0.0271 instance_segmentation_loss_reg: 0.3115 instance_segmentation_loss_poly: 0.8002 +2023/11/08 09:00:59 - mmengine - INFO - Saving checkpoint at 610000 iterations +2023/11/08 09:10:31 - mmengine - INFO - Iter(train) [610500/640000] base_lr: 3.0362e-06 lr: 2.0942e-06 eta: 8:52:24 time: 1.0812 data_time: 0.0359 memory: 21523 grad_norm: 4.5071 loss: 1.1217 caption_loss_cls: 1.9271 grounding_loss_reg: 2.2226 detection_loss_cls: 0.0271 detection_loss_reg: 0.3127 semantic_segmentation_loss_cls: 0.0071 instance_segmentation_loss_cls: 0.0270 instance_segmentation_loss_reg: 0.3114 instance_segmentation_loss_poly: 0.7999 +2023/11/08 09:19:30 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231108_024040 +2023/11/08 09:19:30 - mmengine - INFO - Iter(train) [611000/640000] base_lr: 3.0015e-06 lr: 2.0910e-06 eta: 8:43:18 time: 1.0877 data_time: 0.0363 memory: 21523 grad_norm: 4.4752 loss: 1.1222 caption_loss_cls: 1.9284 grounding_loss_reg: 2.2218 detection_loss_cls: 0.0270 detection_loss_reg: 0.3124 semantic_segmentation_loss_cls: 0.0070 instance_segmentation_loss_cls: 0.0270 instance_segmentation_loss_reg: 0.3112 instance_segmentation_loss_poly: 0.7993 +2023/11/08 09:19:30 - mmengine - INFO - Saving checkpoint at 611000 iterations +2023/11/08 09:28:12 - mmengine - INFO - Iter(train) [611500/640000] base_lr: 2.9673e-06 lr: 2.0879e-06 eta: 8:33:50 time: 1.0803 data_time: 0.0360 memory: 21523 grad_norm: 4.5765 loss: 1.1276 caption_loss_cls: 1.9307 grounding_loss_reg: 2.2197 detection_loss_cls: 0.0269 detection_loss_reg: 0.3115 semantic_segmentation_loss_cls: 0.0071 instance_segmentation_loss_cls: 0.0269 instance_segmentation_loss_reg: 0.3101 instance_segmentation_loss_poly: 0.7974 +2023/11/08 09:37:20 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231108_024040 +2023/11/08 09:37:20 - mmengine - INFO - Iter(train) [612000/640000] base_lr: 2.9337e-06 lr: 2.0849e-06 eta: 8:24:57 time: 1.0852 data_time: 0.0363 memory: 21523 grad_norm: 4.5320 loss: 1.1281 caption_loss_cls: 1.9319 grounding_loss_reg: 2.2184 detection_loss_cls: 0.0269 detection_loss_reg: 0.3115 semantic_segmentation_loss_cls: 0.0071 instance_segmentation_loss_cls: 0.0269 instance_segmentation_loss_reg: 0.3114 instance_segmentation_loss_poly: 0.8002 +2023/11/08 09:37:20 - mmengine - INFO - Saving checkpoint at 612000 iterations +2023/11/08 09:46:36 - mmengine - INFO - Iter(train) [612500/640000] base_lr: 2.9007e-06 lr: 2.0819e-06 eta: 8:16:14 time: 1.0851 data_time: 0.0365 memory: 21523 grad_norm: 4.5779 loss: 1.1308 caption_loss_cls: 1.9332 grounding_loss_reg: 2.2176 detection_loss_cls: 0.0270 detection_loss_reg: 0.3124 semantic_segmentation_loss_cls: 0.0071 instance_segmentation_loss_cls: 0.0270 instance_segmentation_loss_reg: 0.3115 instance_segmentation_loss_poly: 0.7996 +2023/11/08 09:55:51 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231108_024040 +2023/11/08 09:55:51 - mmengine - INFO - Iter(train) [613000/640000] base_lr: 2.8683e-06 lr: 2.0789e-06 eta: 8:07:28 time: 1.0886 data_time: 0.0366 memory: 21523 grad_norm: 4.5366 loss: 1.1268 caption_loss_cls: 1.9325 grounding_loss_reg: 2.2182 detection_loss_cls: 0.0271 detection_loss_reg: 0.3122 semantic_segmentation_loss_cls: 0.0071 instance_segmentation_loss_cls: 0.0270 instance_segmentation_loss_reg: 0.3121 instance_segmentation_loss_poly: 0.7997 +2023/11/08 09:55:51 - mmengine - INFO - Saving checkpoint at 613000 iterations +2023/11/08 10:05:19 - mmengine - INFO - Iter(train) [613500/640000] base_lr: 2.8365e-06 lr: 2.0760e-06 eta: 7:58:56 time: 1.0976 data_time: 0.0372 memory: 21523 grad_norm: 4.5079 loss: 1.1330 caption_loss_cls: 1.9316 grounding_loss_reg: 2.2197 detection_loss_cls: 0.0270 detection_loss_reg: 0.3125 semantic_segmentation_loss_cls: 0.0071 instance_segmentation_loss_cls: 0.0269 instance_segmentation_loss_reg: 0.3115 instance_segmentation_loss_poly: 0.7981 +2023/11/08 10:14:04 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231108_024040 +2023/11/08 10:14:04 - mmengine - INFO - Iter(train) [614000/640000] base_lr: 2.8053e-06 lr: 2.0732e-06 eta: 7:49:34 time: 1.0950 data_time: 0.0374 memory: 21523 grad_norm: 4.5438 loss: 1.1396 caption_loss_cls: 1.9314 grounding_loss_reg: 2.2188 detection_loss_cls: 0.0270 detection_loss_reg: 0.3117 semantic_segmentation_loss_cls: 0.0071 instance_segmentation_loss_cls: 0.0268 instance_segmentation_loss_reg: 0.3111 instance_segmentation_loss_poly: 0.7969 +2023/11/08 10:14:04 - mmengine - INFO - Saving checkpoint at 614000 iterations +2023/11/08 10:23:47 - mmengine - INFO - Iter(train) [614500/640000] base_lr: 2.7746e-06 lr: 2.0704e-06 eta: 7:41:14 time: 1.0978 data_time: 0.0372 memory: 21523 grad_norm: 4.4300 loss: 1.1272 caption_loss_cls: 1.9300 grounding_loss_reg: 2.2209 detection_loss_cls: 0.0269 detection_loss_reg: 0.3115 semantic_segmentation_loss_cls: 0.0071 instance_segmentation_loss_cls: 0.0266 instance_segmentation_loss_reg: 0.3102 instance_segmentation_loss_poly: 0.7946 +2023/11/08 10:33:25 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231108_024040 +2023/11/08 10:33:25 - mmengine - INFO - Iter(train) [615000/640000] base_lr: 2.7446e-06 lr: 2.0677e-06 eta: 7:32:47 time: 1.1076 data_time: 0.0376 memory: 21523 grad_norm: 4.3975 loss: 1.1260 caption_loss_cls: 1.9310 grounding_loss_reg: 2.2206 detection_loss_cls: 0.0269 detection_loss_reg: 0.3108 semantic_segmentation_loss_cls: 0.0071 instance_segmentation_loss_cls: 0.0267 instance_segmentation_loss_reg: 0.3108 instance_segmentation_loss_poly: 0.7951 +2023/11/08 10:33:25 - mmengine - INFO - Saving checkpoint at 615000 iterations +2023/11/08 10:42:43 - mmengine - INFO - Iter(train) [615500/640000] base_lr: 2.7151e-06 lr: 2.0650e-06 eta: 7:23:57 time: 1.1165 data_time: 0.0381 memory: 21523 grad_norm: 4.3413 loss: 1.1255 caption_loss_cls: 1.9301 grounding_loss_reg: 2.2183 detection_loss_cls: 0.0269 detection_loss_reg: 0.3105 semantic_segmentation_loss_cls: 0.0071 instance_segmentation_loss_cls: 0.0268 instance_segmentation_loss_reg: 0.3119 instance_segmentation_loss_poly: 0.7976 +2023/11/08 10:52:14 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231108_024040 +2023/11/08 10:52:14 - mmengine - INFO - Iter(train) [616000/640000] base_lr: 2.6863e-06 lr: 2.0624e-06 eta: 7:15:18 time: 1.1224 data_time: 0.0379 memory: 21523 grad_norm: 4.2951 loss: 1.1112 caption_loss_cls: 1.9270 grounding_loss_reg: 2.2201 detection_loss_cls: 0.0270 detection_loss_reg: 0.3115 semantic_segmentation_loss_cls: 0.0071 instance_segmentation_loss_cls: 0.0269 instance_segmentation_loss_reg: 0.3122 instance_segmentation_loss_poly: 0.7993 +2023/11/08 10:52:14 - mmengine - INFO - Saving checkpoint at 616000 iterations +2023/11/08 11:01:18 - mmengine - INFO - Iter(train) [616500/640000] base_lr: 2.6580e-06 lr: 2.0598e-06 eta: 7:06:13 time: 1.1195 data_time: 0.0377 memory: 21523 grad_norm: 4.2078 loss: 1.1018 caption_loss_cls: 1.9262 grounding_loss_reg: 2.2187 detection_loss_cls: 0.0270 detection_loss_reg: 0.3124 semantic_segmentation_loss_cls: 0.0071 instance_segmentation_loss_cls: 0.0269 instance_segmentation_loss_reg: 0.3121 instance_segmentation_loss_poly: 0.7991 +2023/11/08 11:10:21 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231108_024040 +2023/11/08 11:10:21 - mmengine - INFO - Iter(train) [617000/640000] base_lr: 2.6303e-06 lr: 2.0573e-06 eta: 6:57:08 time: 1.1165 data_time: 0.0375 memory: 21523 grad_norm: 4.2674 loss: 1.1061 caption_loss_cls: 1.9270 grounding_loss_reg: 2.2183 detection_loss_cls: 0.0270 detection_loss_reg: 0.3127 semantic_segmentation_loss_cls: 0.0071 instance_segmentation_loss_cls: 0.0268 instance_segmentation_loss_reg: 0.3121 instance_segmentation_loss_poly: 0.7983 +2023/11/08 11:10:21 - mmengine - INFO - Saving checkpoint at 617000 iterations +2023/11/08 11:19:34 - mmengine - INFO - Iter(train) [617500/640000] base_lr: 2.6033e-06 lr: 2.0548e-06 eta: 6:48:10 time: 1.1125 data_time: 0.0372 memory: 21523 grad_norm: 4.2646 loss: 1.0985 caption_loss_cls: 1.9270 grounding_loss_reg: 2.2162 detection_loss_cls: 0.0271 detection_loss_reg: 0.3123 semantic_segmentation_loss_cls: 0.0071 instance_segmentation_loss_cls: 0.0268 instance_segmentation_loss_reg: 0.3120 instance_segmentation_loss_poly: 0.7978 +2023/11/08 11:28:41 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231108_024040 +2023/11/08 11:28:41 - mmengine - INFO - Iter(train) [618000/640000] base_lr: 2.5768e-06 lr: 2.0524e-06 eta: 6:39:08 time: 1.1182 data_time: 0.0372 memory: 21523 grad_norm: 4.2285 loss: 1.0907 caption_loss_cls: 1.9244 grounding_loss_reg: 2.2156 detection_loss_cls: 0.0270 detection_loss_reg: 0.3113 semantic_segmentation_loss_cls: 0.0071 instance_segmentation_loss_cls: 0.0268 instance_segmentation_loss_reg: 0.3113 instance_segmentation_loss_poly: 0.7967 +2023/11/08 11:28:41 - mmengine - INFO - Saving checkpoint at 618000 iterations +2023/11/08 11:37:45 - mmengine - INFO - Iter(train) [618500/640000] base_lr: 2.5509e-06 lr: 2.0501e-06 eta: 6:30:03 time: 1.1084 data_time: 0.0371 memory: 21523 grad_norm: 4.3194 loss: 1.1058 caption_loss_cls: 1.9278 grounding_loss_reg: 2.2156 detection_loss_cls: 0.0270 detection_loss_reg: 0.3111 semantic_segmentation_loss_cls: 0.0071 instance_segmentation_loss_cls: 0.0269 instance_segmentation_loss_reg: 0.3122 instance_segmentation_loss_poly: 0.7979 +2023/11/08 11:46:08 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231108_024040 +2023/11/08 11:46:08 - mmengine - INFO - Iter(train) [619000/640000] base_lr: 2.5256e-06 lr: 2.0478e-06 eta: 6:20:28 time: 1.0895 data_time: 0.0365 memory: 21523 grad_norm: 4.4228 loss: 1.1223 caption_loss_cls: 1.9295 grounding_loss_reg: 2.2137 detection_loss_cls: 0.0271 detection_loss_reg: 0.3118 semantic_segmentation_loss_cls: 0.0071 instance_segmentation_loss_cls: 0.0269 instance_segmentation_loss_reg: 0.3121 instance_segmentation_loss_poly: 0.7978 +2023/11/08 11:46:08 - mmengine - INFO - Saving checkpoint at 619000 iterations +2023/11/08 11:55:17 - mmengine - INFO - Iter(train) [619500/640000] base_lr: 2.5009e-06 lr: 2.0455e-06 eta: 6:11:28 time: 1.0874 data_time: 0.0364 memory: 21523 grad_norm: 4.4540 loss: 1.1207 caption_loss_cls: 1.9266 grounding_loss_reg: 2.2132 detection_loss_cls: 0.0271 detection_loss_reg: 0.3121 semantic_segmentation_loss_cls: 0.0071 instance_segmentation_loss_cls: 0.0269 instance_segmentation_loss_reg: 0.3118 instance_segmentation_loss_poly: 0.7966 +2023/11/08 12:04:03 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231108_024040 +2023/11/08 12:04:03 - mmengine - INFO - Iter(train) [620000/640000] base_lr: 2.4768e-06 lr: 2.0433e-06 eta: 6:02:13 time: 1.0761 data_time: 0.0363 memory: 21523 grad_norm: 4.5512 loss: 1.1349 caption_loss_cls: 1.9233 grounding_loss_reg: 2.2127 detection_loss_cls: 0.0271 detection_loss_reg: 0.3124 semantic_segmentation_loss_cls: 0.0071 instance_segmentation_loss_cls: 0.0269 instance_segmentation_loss_reg: 0.3119 instance_segmentation_loss_poly: 0.7966 +2023/11/08 12:04:03 - mmengine - INFO - Saving checkpoint at 620000 iterations +2023/11/08 12:13:21 - mmengine - INFO - Evaluating bbox... +2023/11/08 12:14:17 - mmengine - INFO - bbox_mAP_copypaste: 0.466 0.641 0.508 0.288 0.516 0.612 +2023/11/08 12:14:17 - mmengine - INFO - Evaluating segm... +2023/11/08 12:15:30 - mmengine - INFO - segm_mAP_copypaste: 0.316 0.559 0.310 0.157 0.362 0.488 +2023/11/08 12:21:23 - mmengine - INFO - per class results: +2023/11/08 12:21:23 - mmengine - INFO - ++---------------------+-------+-------+ +| Class | IoU | Acc | ++---------------------+-------+-------+ +| wall | 76.13 | 88.31 | +| building | 80.25 | 90.45 | +| sky | 92.86 | 97.62 | +| floor | 80.67 | 89.68 | +| tree | 72.59 | 87.25 | +| ceiling | 83.65 | 93.76 | +| road | 83.21 | 89.55 | +| bed | 87.56 | 94.74 | +| windowpane | 60.31 | 78.01 | +| grass | 66.28 | 83.25 | +| cabinet | 60.88 | 74.06 | +| sidewalk | 67.72 | 81.63 | +| person | 79.26 | 91.83 | +| earth | 37.46 | 51.78 | +| door | 47.55 | 60.32 | +| table | 59.72 | 76.0 | +| mountain | 54.17 | 68.51 | +| plant | 49.49 | 57.94 | +| curtain | 67.76 | 82.63 | +| chair | 57.02 | 70.68 | +| car | 83.06 | 90.89 | +| water | 52.69 | 67.15 | +| painting | 70.41 | 86.02 | +| sofa | 66.4 | 80.21 | +| shelf | 43.22 | 62.52 | +| house | 41.14 | 59.14 | +| sea | 49.87 | 69.81 | +| mirror | 62.76 | 71.53 | +| rug | 64.52 | 73.17 | +| field | 29.77 | 42.47 | +| armchair | 43.26 | 63.93 | +| seat | 64.16 | 81.82 | +| fence | 42.26 | 60.5 | +| desk | 48.02 | 68.33 | +| rock | 36.94 | 58.24 | +| wardrobe | 44.29 | 60.09 | +| lamp | 60.52 | 73.75 | +| bathtub | 81.32 | 88.19 | +| railing | 27.71 | 41.77 | +| cushion | 57.61 | 69.51 | +| base | 24.86 | 34.95 | +| box | 25.27 | 31.5 | +| column | 47.34 | 59.21 | +| signboard | 37.38 | 51.48 | +| chest of drawers | 36.26 | 54.69 | +| counter | 30.97 | 42.68 | +| sand | 34.79 | 50.79 | +| sink | 72.41 | 78.48 | +| skyscraper | 42.59 | 51.65 | +| fireplace | 74.03 | 88.68 | +| refrigerator | 73.85 | 79.66 | +| grandstand | 34.97 | 66.46 | +| path | 28.87 | 39.74 | +| stairs | 25.03 | 32.01 | +| runway | 70.61 | 86.89 | +| case | 44.26 | 57.59 | +| pool table | 87.99 | 95.66 | +| pillow | 55.9 | 68.62 | +| screen door | 69.86 | 77.68 | +| stairway | 31.5 | 37.47 | +| river | 14.81 | 31.91 | +| bridge | 62.6 | 73.25 | +| bookcase | 34.64 | 55.96 | +| blind | 23.3 | 25.32 | +| coffee table | 64.9 | 80.94 | +| toilet | 84.29 | 89.23 | +| flower | 35.35 | 49.17 | +| book | 45.55 | 67.49 | +| hill | 11.34 | 19.01 | +| bench | 45.69 | 52.52 | +| countertop | 50.37 | 64.96 | +| stove | 76.21 | 84.55 | +| palm | 44.08 | 56.0 | +| kitchen island | 38.92 | 69.97 | +| computer | 68.63 | 79.65 | +| swivel chair | 43.66 | 55.86 | +| boat | 74.46 | 86.1 | +| bar | 44.54 | 54.86 | +| arcade machine | 53.69 | 57.09 | +| hovel | 13.61 | 16.14 | +| bus | 85.54 | 95.28 | +| towel | 62.25 | 76.33 | +| light | 47.49 | 55.63 | +| truck | 40.17 | 49.14 | +| tower | 33.28 | 42.63 | +| chandelier | 64.47 | 79.75 | +| awning | 22.45 | 26.81 | +| streetlight | 29.65 | 37.53 | +| booth | 45.86 | 47.3 | +| television receiver | 67.49 | 79.27 | +| airplane | 56.48 | 66.8 | +| dirt track | 0.44 | 1.77 | +| apparel | 37.25 | 55.57 | +| pole | 30.26 | 42.31 | +| land | 2.3 | 3.11 | +| bannister | 12.87 | 16.76 | +| escalator | 27.31 | 28.88 | +| ottoman | 43.21 | 66.66 | +| bottle | 28.17 | 35.34 | +| buffet | 43.37 | 48.51 | +| poster | 27.28 | 39.75 | +| stage | 9.63 | 16.13 | +| van | 42.2 | 57.08 | +| ship | 73.44 | 79.85 | +| fountain | 11.51 | 11.81 | +| conveyer belt | 79.91 | 85.77 | +| canopy | 26.98 | 31.93 | +| washer | 69.14 | 71.59 | +| plaything | 36.4 | 52.09 | +| swimming pool | 57.45 | 73.64 | +| stool | 42.39 | 59.59 | +| barrel | 40.87 | 55.34 | +| basket | 29.68 | 42.47 | +| waterfall | 53.91 | 70.56 | +| tent | 92.97 | 97.68 | +| bag | 14.48 | 16.79 | +| minibike | 73.2 | 83.35 | +| cradle | 77.12 | 92.1 | +| oven | 42.45 | 53.45 | +| ball | 42.26 | 47.3 | +| food | 56.36 | 64.8 | +| step | 16.11 | 19.26 | +| tank | 38.16 | 44.79 | +| trade name | 25.22 | 30.8 | +| microwave | 82.6 | 90.05 | +| pot | 45.22 | 50.75 | +| animal | 62.64 | 66.79 | +| bicycle | 54.91 | 71.58 | +| lake | 60.98 | 64.76 | +| dishwasher | 52.06 | 70.7 | +| screen | 64.82 | 83.53 | +| blanket | 14.63 | 19.03 | +| sculpture | 59.6 | 71.03 | +| hood | 57.98 | 62.57 | +| sconce | 35.13 | 44.77 | +| vase | 42.7 | 54.83 | +| traffic light | 36.98 | 54.7 | +| tray | 10.38 | 17.09 | +| ashcan | 35.47 | 49.23 | +| fan | 56.77 | 70.02 | +| pier | 42.42 | 59.82 | +| crt screen | 6.19 | 16.7 | +| plate | 55.46 | 71.63 | +| monitor | 15.5 | 19.92 | +| bulletin board | 36.31 | 46.95 | +| shower | 8.01 | 11.23 | +| radiator | 51.5 | 56.86 | +| glass | 16.54 | 18.03 | +| clock | 26.42 | 32.46 | +| flag | 29.25 | 34.89 | ++---------------------+-------+-------+ +2023/11/08 12:21:38 - mmengine - INFO - Iter(val) [209/209] coco/bbox_mAP: 0.4660 coco/bbox_mAP_50: 0.6410 coco/bbox_mAP_75: 0.5080 coco/bbox_mAP_s: 0.2880 coco/bbox_mAP_m: 0.5160 coco/bbox_mAP_l: 0.6120 coco/segm_mAP: 0.3160 coco/segm_mAP_50: 0.5590 coco/segm_mAP_75: 0.3100 coco/segm_mAP_s: 0.1570 coco/segm_mAP_m: 0.3620 coco/segm_mAP_l: 0.4880 Bleu_1: 0.7599 Bleu_2: 0.5970 Bleu_3: 0.4571 Bleu_4: 0.3477 METEOR: 0.2710 ROUGE_L: 0.5596 CIDEr: 1.1226 SPICE: 0.2031 aAcc: 82.2100 mIoU: 48.2200 mAcc: 59.3100 visual-grounding/miou: 0.7892 visual-grounding/acc: 0.8555 data_time: 0.0053 time: 0.5236 +2023/11/08 12:30:40 - mmengine - INFO - Iter(train) [620500/640000] base_lr: 2.4532e-06 lr: 2.0412e-06 eta: 5:53:09 time: 1.0760 data_time: 0.0333 memory: 21523 grad_norm: 4.5787 loss: 1.1465 caption_loss_cls: 1.9283 grounding_loss_reg: 2.2116 detection_loss_cls: 0.0271 detection_loss_reg: 0.3133 semantic_segmentation_loss_cls: 0.0071 instance_segmentation_loss_cls: 0.0268 instance_segmentation_loss_reg: 0.3122 instance_segmentation_loss_poly: 0.7978 +2023/11/08 12:39:56 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231108_024040 +2023/11/08 12:39:56 - mmengine - INFO - Iter(train) [621000/640000] base_lr: 2.4303e-06 lr: 2.0391e-06 eta: 5:44:13 time: 1.0793 data_time: 0.0336 memory: 21523 grad_norm: 4.5573 loss: 1.1455 caption_loss_cls: 1.9272 grounding_loss_reg: 2.2083 detection_loss_cls: 0.0270 detection_loss_reg: 0.3130 semantic_segmentation_loss_cls: 0.0071 instance_segmentation_loss_cls: 0.0268 instance_segmentation_loss_reg: 0.3117 instance_segmentation_loss_poly: 0.7966 +2023/11/08 12:39:56 - mmengine - INFO - Saving checkpoint at 621000 iterations +2023/11/08 12:49:09 - mmengine - INFO - Iter(train) [621500/640000] base_lr: 2.4080e-06 lr: 2.0371e-06 eta: 5:35:15 time: 1.0793 data_time: 0.0333 memory: 21523 grad_norm: 4.5176 loss: 1.1369 caption_loss_cls: 1.9285 grounding_loss_reg: 2.2073 detection_loss_cls: 0.0270 detection_loss_reg: 0.3128 semantic_segmentation_loss_cls: 0.0071 instance_segmentation_loss_cls: 0.0269 instance_segmentation_loss_reg: 0.3119 instance_segmentation_loss_poly: 0.7978 +2023/11/08 12:58:12 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231108_024040 +2023/11/08 12:58:12 - mmengine - INFO - Iter(train) [622000/640000] base_lr: 2.3862e-06 lr: 2.0351e-06 eta: 5:26:10 time: 1.0781 data_time: 0.0333 memory: 21523 grad_norm: 4.5532 loss: 1.1436 caption_loss_cls: 1.9250 grounding_loss_reg: 2.2089 detection_loss_cls: 0.0271 detection_loss_reg: 0.3127 semantic_segmentation_loss_cls: 0.0071 instance_segmentation_loss_cls: 0.0269 instance_segmentation_loss_reg: 0.3123 instance_segmentation_loss_poly: 0.7996 +2023/11/08 12:58:12 - mmengine - INFO - Saving checkpoint at 622000 iterations +2023/11/08 13:07:44 - mmengine - INFO - Iter(train) [622500/640000] base_lr: 2.3651e-06 lr: 2.0332e-06 eta: 5:17:22 time: 1.0854 data_time: 0.0333 memory: 21523 grad_norm: 4.5056 loss: 1.1362 caption_loss_cls: 1.9285 grounding_loss_reg: 2.2093 detection_loss_cls: 0.0271 detection_loss_reg: 0.3130 semantic_segmentation_loss_cls: 0.0071 instance_segmentation_loss_cls: 0.0268 instance_segmentation_loss_reg: 0.3123 instance_segmentation_loss_poly: 0.7996 +2023/11/08 13:16:41 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231108_024040 +2023/11/08 13:16:41 - mmengine - INFO - Iter(train) [623000/640000] base_lr: 2.3445e-06 lr: 2.0313e-06 eta: 5:08:14 time: 1.0937 data_time: 0.0334 memory: 21523 grad_norm: 4.4697 loss: 1.1171 caption_loss_cls: 1.9269 grounding_loss_reg: 2.2080 detection_loss_cls: 0.0270 detection_loss_reg: 0.3124 semantic_segmentation_loss_cls: 0.0071 instance_segmentation_loss_cls: 0.0268 instance_segmentation_loss_reg: 0.3117 instance_segmentation_loss_poly: 0.7983 +2023/11/08 13:16:41 - mmengine - INFO - Saving checkpoint at 623000 iterations +2023/11/08 13:25:31 - mmengine - INFO - Iter(train) [623500/640000] base_lr: 2.3246e-06 lr: 2.0295e-06 eta: 4:59:03 time: 1.0890 data_time: 0.0331 memory: 21523 grad_norm: 4.4817 loss: 1.1225 caption_loss_cls: 1.9278 grounding_loss_reg: 2.2084 detection_loss_cls: 0.0270 detection_loss_reg: 0.3122 semantic_segmentation_loss_cls: 0.0071 instance_segmentation_loss_cls: 0.0268 instance_segmentation_loss_reg: 0.3116 instance_segmentation_loss_poly: 0.7977 +2023/11/08 13:34:36 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231108_024040 +2023/11/08 13:34:36 - mmengine - INFO - Iter(train) [624000/640000] base_lr: 2.3052e-06 lr: 2.0277e-06 eta: 4:50:00 time: 1.0939 data_time: 0.0333 memory: 21523 grad_norm: 4.4489 loss: 1.1225 caption_loss_cls: 1.9305 grounding_loss_reg: 2.2057 detection_loss_cls: 0.0270 detection_loss_reg: 0.3119 semantic_segmentation_loss_cls: 0.0071 instance_segmentation_loss_cls: 0.0268 instance_segmentation_loss_reg: 0.3124 instance_segmentation_loss_poly: 0.7995 +2023/11/08 13:34:36 - mmengine - INFO - Saving checkpoint at 624000 iterations +2023/11/08 13:43:59 - mmengine - INFO - Iter(train) [624500/640000] base_lr: 2.2865e-06 lr: 2.0260e-06 eta: 4:41:04 time: 1.0985 data_time: 0.0367 memory: 21523 grad_norm: 4.4640 loss: 1.1247 caption_loss_cls: 1.9293 grounding_loss_reg: 2.2064 detection_loss_cls: 0.0270 detection_loss_reg: 0.3127 semantic_segmentation_loss_cls: 0.0071 instance_segmentation_loss_cls: 0.0269 instance_segmentation_loss_reg: 0.3123 instance_segmentation_loss_poly: 0.7993 +2023/11/08 13:52:56 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231108_024040 +2023/11/08 13:52:56 - mmengine - INFO - Iter(train) [625000/640000] base_lr: 2.2683e-06 lr: 2.0244e-06 eta: 4:31:57 time: 1.0938 data_time: 0.0366 memory: 21523 grad_norm: 4.4545 loss: 1.1293 caption_loss_cls: 1.9300 grounding_loss_reg: 2.2079 detection_loss_cls: 0.0271 detection_loss_reg: 0.3127 semantic_segmentation_loss_cls: 0.0071 instance_segmentation_loss_cls: 0.0268 instance_segmentation_loss_reg: 0.3126 instance_segmentation_loss_poly: 0.8000 +2023/11/08 13:52:56 - mmengine - INFO - Saving checkpoint at 625000 iterations +2023/11/08 14:01:57 - mmengine - INFO - Iter(train) [625500/640000] base_lr: 2.2507e-06 lr: 2.0228e-06 eta: 4:22:52 time: 1.0909 data_time: 0.0366 memory: 21523 grad_norm: 4.4967 loss: 1.1329 caption_loss_cls: 1.9274 grounding_loss_reg: 2.2064 detection_loss_cls: 0.0270 detection_loss_reg: 0.3131 semantic_segmentation_loss_cls: 0.0071 instance_segmentation_loss_cls: 0.0268 instance_segmentation_loss_reg: 0.3129 instance_segmentation_loss_poly: 0.8000 +2023/11/08 14:10:52 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231108_024040 +2023/11/08 14:10:52 - mmengine - INFO - Iter(train) [626000/640000] base_lr: 2.2337e-06 lr: 2.0212e-06 eta: 4:13:44 time: 1.0889 data_time: 0.0366 memory: 21523 grad_norm: 4.4738 loss: 1.1290 caption_loss_cls: 1.9256 grounding_loss_reg: 2.2049 detection_loss_cls: 0.0269 detection_loss_reg: 0.3133 semantic_segmentation_loss_cls: 0.0071 instance_segmentation_loss_cls: 0.0270 instance_segmentation_loss_reg: 0.3141 instance_segmentation_loss_poly: 0.8027 +2023/11/08 14:10:52 - mmengine - INFO - Saving checkpoint at 626000 iterations +2023/11/08 14:20:19 - mmengine - INFO - Iter(train) [626500/640000] base_lr: 2.2173e-06 lr: 2.0198e-06 eta: 4:04:49 time: 1.0875 data_time: 0.0369 memory: 21523 grad_norm: 4.5071 loss: 1.1353 caption_loss_cls: 1.9293 grounding_loss_reg: 2.2028 detection_loss_cls: 0.0269 detection_loss_reg: 0.3133 semantic_segmentation_loss_cls: 0.0071 instance_segmentation_loss_cls: 0.0270 instance_segmentation_loss_reg: 0.3143 instance_segmentation_loss_poly: 0.8028 +2023/11/08 14:29:38 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231108_024040 +2023/11/08 14:29:38 - mmengine - INFO - Iter(train) [627000/640000] base_lr: 2.2015e-06 lr: 2.0183e-06 eta: 3:55:50 time: 1.0933 data_time: 0.0373 memory: 21523 grad_norm: 4.5215 loss: 1.1476 caption_loss_cls: 1.9292 grounding_loss_reg: 2.2031 detection_loss_cls: 0.0269 detection_loss_reg: 0.3137 semantic_segmentation_loss_cls: 0.0071 instance_segmentation_loss_cls: 0.0270 instance_segmentation_loss_reg: 0.3139 instance_segmentation_loss_poly: 0.8027 +2023/11/08 14:29:38 - mmengine - INFO - Saving checkpoint at 627000 iterations +2023/11/08 14:38:09 - mmengine - INFO - Iter(train) [627500/640000] base_lr: 2.1863e-06 lr: 2.0169e-06 eta: 3:46:34 time: 1.0885 data_time: 0.0373 memory: 21523 grad_norm: 4.5562 loss: 1.1538 caption_loss_cls: 1.9313 grounding_loss_reg: 2.2005 detection_loss_cls: 0.0269 detection_loss_reg: 0.3134 semantic_segmentation_loss_cls: 0.0071 instance_segmentation_loss_cls: 0.0271 instance_segmentation_loss_reg: 0.3149 instance_segmentation_loss_poly: 0.8047 +2023/11/08 14:47:31 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231108_024040 +2023/11/08 14:47:31 - mmengine - INFO - Iter(train) [628000/640000] base_lr: 2.1717e-06 lr: 2.0156e-06 eta: 3:37:36 time: 1.0924 data_time: 0.0374 memory: 21523 grad_norm: 4.5332 loss: 1.1519 caption_loss_cls: 1.9308 grounding_loss_reg: 2.2012 detection_loss_cls: 0.0270 detection_loss_reg: 0.3146 semantic_segmentation_loss_cls: 0.0071 instance_segmentation_loss_cls: 0.0271 instance_segmentation_loss_reg: 0.3147 instance_segmentation_loss_poly: 0.8052 +2023/11/08 14:47:31 - mmengine - INFO - Saving checkpoint at 628000 iterations +2023/11/08 14:57:15 - mmengine - INFO - Iter(train) [628500/640000] base_lr: 2.1577e-06 lr: 2.0143e-06 eta: 3:28:44 time: 1.0978 data_time: 0.0374 memory: 21523 grad_norm: 4.4997 loss: 1.1467 caption_loss_cls: 1.9296 grounding_loss_reg: 2.2027 detection_loss_cls: 0.0268 detection_loss_reg: 0.3141 semantic_segmentation_loss_cls: 0.0071 instance_segmentation_loss_cls: 0.0272 instance_segmentation_loss_reg: 0.3160 instance_segmentation_loss_poly: 0.8077 +2023/11/08 15:06:04 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231108_024040 +2023/11/08 15:06:04 - mmengine - INFO - Iter(train) [629000/640000] base_lr: 2.1443e-06 lr: 2.0131e-06 eta: 3:19:35 time: 1.0959 data_time: 0.0373 memory: 21523 grad_norm: 4.5347 loss: 1.1437 caption_loss_cls: 1.9265 grounding_loss_reg: 2.2040 detection_loss_cls: 0.0268 detection_loss_reg: 0.3140 semantic_segmentation_loss_cls: 0.0071 instance_segmentation_loss_cls: 0.0272 instance_segmentation_loss_reg: 0.3157 instance_segmentation_loss_poly: 0.8081 +2023/11/08 15:06:04 - mmengine - INFO - Saving checkpoint at 629000 iterations +2023/11/08 15:15:09 - mmengine - INFO - Iter(train) [629500/640000] base_lr: 2.1315e-06 lr: 2.0120e-06 eta: 3:10:30 time: 1.0969 data_time: 0.0375 memory: 21523 grad_norm: 4.5489 loss: 1.1547 caption_loss_cls: 1.9275 grounding_loss_reg: 2.2030 detection_loss_cls: 0.0269 detection_loss_reg: 0.3152 semantic_segmentation_loss_cls: 0.0071 instance_segmentation_loss_cls: 0.0272 instance_segmentation_loss_reg: 0.3160 instance_segmentation_loss_poly: 0.8088 +2023/11/08 15:24:05 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231108_024040 +2023/11/08 15:24:05 - mmengine - INFO - Iter(train) [630000/640000] base_lr: 2.1193e-06 lr: 2.0108e-06 eta: 3:01:24 time: 1.0971 data_time: 0.0373 memory: 21523 grad_norm: 4.5897 loss: 1.1558 caption_loss_cls: 1.9279 grounding_loss_reg: 2.2033 detection_loss_cls: 0.0269 detection_loss_reg: 0.3152 semantic_segmentation_loss_cls: 0.0071 instance_segmentation_loss_cls: 0.0272 instance_segmentation_loss_reg: 0.3163 instance_segmentation_loss_poly: 0.8095 +2023/11/08 15:24:05 - mmengine - INFO - Saving checkpoint at 630000 iterations +2023/11/08 15:32:42 - mmengine - INFO - Iter(train) [630500/640000] base_lr: 2.1076e-06 lr: 2.0098e-06 eta: 2:52:13 time: 1.0845 data_time: 0.0367 memory: 21523 grad_norm: 4.6013 loss: 1.1500 caption_loss_cls: 1.9247 grounding_loss_reg: 2.2012 detection_loss_cls: 0.0270 detection_loss_reg: 0.3161 semantic_segmentation_loss_cls: 0.0071 instance_segmentation_loss_cls: 0.0273 instance_segmentation_loss_reg: 0.3164 instance_segmentation_loss_poly: 0.8098 +2023/11/08 15:41:34 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231108_024040 +2023/11/08 15:41:34 - mmengine - INFO - Iter(train) [631000/640000] base_lr: 2.0966e-06 lr: 2.0088e-06 eta: 2:43:06 time: 1.0779 data_time: 0.0364 memory: 21523 grad_norm: 4.5514 loss: 1.1500 caption_loss_cls: 1.9261 grounding_loss_reg: 2.2012 detection_loss_cls: 0.0271 detection_loss_reg: 0.3163 semantic_segmentation_loss_cls: 0.0071 instance_segmentation_loss_cls: 0.0274 instance_segmentation_loss_reg: 0.3181 instance_segmentation_loss_poly: 0.8131 +2023/11/08 15:41:34 - mmengine - INFO - Saving checkpoint at 631000 iterations +2023/11/08 15:50:28 - mmengine - INFO - Iter(train) [631500/640000] base_lr: 2.0862e-06 lr: 2.0078e-06 eta: 2:34:01 time: 1.0835 data_time: 0.0363 memory: 21523 grad_norm: 4.5114 loss: 1.1392 caption_loss_cls: 1.9241 grounding_loss_reg: 2.2028 detection_loss_cls: 0.0273 detection_loss_reg: 0.3177 semantic_segmentation_loss_cls: 0.0071 instance_segmentation_loss_cls: 0.0274 instance_segmentation_loss_reg: 0.3181 instance_segmentation_loss_poly: 0.8130 +2023/11/08 15:59:15 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231108_024040 +2023/11/08 15:59:15 - mmengine - INFO - Iter(train) [632000/640000] base_lr: 2.0763e-06 lr: 2.0069e-06 eta: 2:24:54 time: 1.0749 data_time: 0.0361 memory: 21523 grad_norm: 4.5596 loss: 1.1455 caption_loss_cls: 1.9225 grounding_loss_reg: 2.2034 detection_loss_cls: 0.0273 detection_loss_reg: 0.3188 semantic_segmentation_loss_cls: 0.0071 instance_segmentation_loss_cls: 0.0274 instance_segmentation_loss_reg: 0.3186 instance_segmentation_loss_poly: 0.8137 +2023/11/08 15:59:15 - mmengine - INFO - Saving checkpoint at 632000 iterations +2023/11/08 16:08:14 - mmengine - INFO - Iter(train) [632500/640000] base_lr: 2.0671e-06 lr: 2.0061e-06 eta: 2:15:50 time: 1.0638 data_time: 0.0358 memory: 21523 grad_norm: 4.6441 loss: 1.1531 caption_loss_cls: 1.9227 grounding_loss_reg: 2.2044 detection_loss_cls: 0.0273 detection_loss_reg: 0.3185 semantic_segmentation_loss_cls: 0.0071 instance_segmentation_loss_cls: 0.0275 instance_segmentation_loss_reg: 0.3189 instance_segmentation_loss_poly: 0.8147 +2023/11/08 16:17:38 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231108_024040 +2023/11/08 16:17:38 - mmengine - INFO - Iter(train) [633000/640000] base_lr: 2.0585e-06 lr: 2.0053e-06 eta: 2:06:49 time: 1.0723 data_time: 0.0362 memory: 21523 grad_norm: 4.6229 loss: 1.1496 caption_loss_cls: 1.9226 grounding_loss_reg: 2.2033 detection_loss_cls: 0.0273 detection_loss_reg: 0.3196 semantic_segmentation_loss_cls: 0.0071 instance_segmentation_loss_cls: 0.0276 instance_segmentation_loss_reg: 0.3201 instance_segmentation_loss_poly: 0.8171 +2023/11/08 16:17:38 - mmengine - INFO - Saving checkpoint at 633000 iterations +2023/11/08 16:26:49 - mmengine - INFO - Iter(train) [633500/640000] base_lr: 2.0504e-06 lr: 2.0046e-06 eta: 1:57:47 time: 1.0737 data_time: 0.0362 memory: 21523 grad_norm: 4.6456 loss: 1.1536 caption_loss_cls: 1.9243 grounding_loss_reg: 2.2021 detection_loss_cls: 0.0273 detection_loss_reg: 0.3194 semantic_segmentation_loss_cls: 0.0071 instance_segmentation_loss_cls: 0.0276 instance_segmentation_loss_reg: 0.3206 instance_segmentation_loss_poly: 0.8172 +2023/11/08 16:35:49 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231108_024040 +2023/11/08 16:35:49 - mmengine - INFO - Iter(train) [634000/640000] base_lr: 2.0429e-06 lr: 2.0039e-06 eta: 1:48:43 time: 1.0748 data_time: 0.0363 memory: 21523 grad_norm: 4.6159 loss: 1.1550 caption_loss_cls: 1.9255 grounding_loss_reg: 2.2021 detection_loss_cls: 0.0275 detection_loss_reg: 0.3208 semantic_segmentation_loss_cls: 0.0071 instance_segmentation_loss_cls: 0.0276 instance_segmentation_loss_reg: 0.3207 instance_segmentation_loss_poly: 0.8172 +2023/11/08 16:35:49 - mmengine - INFO - Saving checkpoint at 634000 iterations +2023/11/08 16:45:10 - mmengine - INFO - Iter(train) [634500/640000] base_lr: 2.0361e-06 lr: 2.0033e-06 eta: 1:39:41 time: 1.0858 data_time: 0.0368 memory: 21523 grad_norm: 4.6052 loss: 1.1546 caption_loss_cls: 1.9260 grounding_loss_reg: 2.1998 detection_loss_cls: 0.0274 detection_loss_reg: 0.3209 semantic_segmentation_loss_cls: 0.0071 instance_segmentation_loss_cls: 0.0277 instance_segmentation_loss_reg: 0.3208 instance_segmentation_loss_poly: 0.8173 +2023/11/08 16:54:09 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231108_024040 +2023/11/08 16:54:09 - mmengine - INFO - Iter(train) [635000/640000] base_lr: 2.0298e-06 lr: 2.0027e-06 eta: 1:30:37 time: 1.0874 data_time: 0.0369 memory: 21523 grad_norm: 4.6548 loss: 1.1552 caption_loss_cls: 1.9254 grounding_loss_reg: 2.1993 detection_loss_cls: 0.0274 detection_loss_reg: 0.3214 semantic_segmentation_loss_cls: 0.0071 instance_segmentation_loss_cls: 0.0276 instance_segmentation_loss_reg: 0.3204 instance_segmentation_loss_poly: 0.8164 +2023/11/08 16:54:09 - mmengine - INFO - Saving checkpoint at 635000 iterations +2023/11/08 17:03:31 - mmengine - INFO - Iter(train) [635500/640000] base_lr: 2.0242e-06 lr: 2.0022e-06 eta: 1:21:35 time: 1.0947 data_time: 0.0374 memory: 21523 grad_norm: 4.5940 loss: 1.1536 caption_loss_cls: 1.9242 grounding_loss_reg: 2.2008 detection_loss_cls: 0.0274 detection_loss_reg: 0.3214 semantic_segmentation_loss_cls: 0.0071 instance_segmentation_loss_cls: 0.0276 instance_segmentation_loss_reg: 0.3203 instance_segmentation_loss_poly: 0.8157 +2023/11/08 17:13:04 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231108_024040 +2023/11/08 17:13:04 - mmengine - INFO - Iter(train) [636000/640000] base_lr: 2.0191e-06 lr: 2.0017e-06 eta: 1:12:33 time: 1.1060 data_time: 0.0376 memory: 21523 grad_norm: 4.5404 loss: 1.1441 caption_loss_cls: 1.9269 grounding_loss_reg: 2.2030 detection_loss_cls: 0.0274 detection_loss_reg: 0.3217 semantic_segmentation_loss_cls: 0.0071 instance_segmentation_loss_cls: 0.0276 instance_segmentation_loss_reg: 0.3199 instance_segmentation_loss_poly: 0.8149 +2023/11/08 17:13:04 - mmengine - INFO - Saving checkpoint at 636000 iterations +2023/11/08 17:22:20 - mmengine - INFO - Iter(train) [636500/640000] base_lr: 2.0146e-06 lr: 2.0013e-06 eta: 1:03:30 time: 1.1102 data_time: 0.0376 memory: 21523 grad_norm: 4.5087 loss: 1.1314 caption_loss_cls: 1.9286 grounding_loss_reg: 2.2023 detection_loss_cls: 0.0274 detection_loss_reg: 0.3211 semantic_segmentation_loss_cls: 0.0071 instance_segmentation_loss_cls: 0.0276 instance_segmentation_loss_reg: 0.3198 instance_segmentation_loss_poly: 0.8145 +2023/11/08 17:31:52 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231108_024040 +2023/11/08 17:31:52 - mmengine - INFO - Iter(train) [637000/640000] base_lr: 2.0107e-06 lr: 2.0010e-06 eta: 0:54:27 time: 1.1124 data_time: 0.0375 memory: 21523 grad_norm: 4.3925 loss: 1.1220 caption_loss_cls: 1.9315 grounding_loss_reg: 2.2011 detection_loss_cls: 0.0274 detection_loss_reg: 0.3202 semantic_segmentation_loss_cls: 0.0071 instance_segmentation_loss_cls: 0.0276 instance_segmentation_loss_reg: 0.3193 instance_segmentation_loss_poly: 0.8140 +2023/11/08 17:31:52 - mmengine - INFO - Saving checkpoint at 637000 iterations +2023/11/08 17:41:08 - mmengine - INFO - Iter(train) [637500/640000] base_lr: 2.0075e-06 lr: 2.0007e-06 eta: 0:45:23 time: 1.1138 data_time: 0.0377 memory: 21523 grad_norm: 4.3739 loss: 1.1241 caption_loss_cls: 1.9374 grounding_loss_reg: 2.2003 detection_loss_cls: 0.0273 detection_loss_reg: 0.3200 semantic_segmentation_loss_cls: 0.0071 instance_segmentation_loss_cls: 0.0276 instance_segmentation_loss_reg: 0.3196 instance_segmentation_loss_poly: 0.8143 +2023/11/08 17:50:22 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231108_024040 +2023/11/08 17:50:22 - mmengine - INFO - Iter(train) [638000/640000] base_lr: 2.0048e-06 lr: 2.0004e-06 eta: 0:36:19 time: 1.1171 data_time: 0.0379 memory: 21523 grad_norm: 4.3404 loss: 1.1231 caption_loss_cls: 1.9377 grounding_loss_reg: 2.2007 detection_loss_cls: 0.0274 detection_loss_reg: 0.3212 semantic_segmentation_loss_cls: 0.0071 instance_segmentation_loss_cls: 0.0276 instance_segmentation_loss_reg: 0.3197 instance_segmentation_loss_poly: 0.8151 +2023/11/08 17:50:22 - mmengine - INFO - Saving checkpoint at 638000 iterations +2023/11/08 17:59:39 - mmengine - INFO - Iter(train) [638500/640000] base_lr: 2.0027e-06 lr: 2.0002e-06 eta: 0:27:14 time: 1.1162 data_time: 0.0378 memory: 21523 grad_norm: 4.3490 loss: 1.1313 caption_loss_cls: 1.9379 grounding_loss_reg: 2.2024 detection_loss_cls: 0.0274 detection_loss_reg: 0.3213 semantic_segmentation_loss_cls: 0.0071 instance_segmentation_loss_cls: 0.0276 instance_segmentation_loss_reg: 0.3196 instance_segmentation_loss_poly: 0.8143 +2023/11/08 18:08:51 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231108_024040 +2023/11/08 18:08:51 - mmengine - INFO - Iter(train) [639000/640000] base_lr: 2.0012e-06 lr: 2.0001e-06 eta: 0:18:10 time: 1.1194 data_time: 0.0376 memory: 21523 grad_norm: 4.2790 loss: 1.1133 caption_loss_cls: 1.9339 grounding_loss_reg: 2.2003 detection_loss_cls: 0.0274 detection_loss_reg: 0.3210 semantic_segmentation_loss_cls: 0.0071 instance_segmentation_loss_cls: 0.0275 instance_segmentation_loss_reg: 0.3196 instance_segmentation_loss_poly: 0.8144 +2023/11/08 18:08:51 - mmengine - INFO - Saving checkpoint at 639000 iterations +2023/11/08 18:18:03 - mmengine - INFO - Iter(train) [639500/640000] base_lr: 2.0003e-06 lr: 2.0000e-06 eta: 0:09:05 time: 1.1168 data_time: 0.0373 memory: 21523 grad_norm: 4.3165 loss: 1.1126 caption_loss_cls: 1.9363 grounding_loss_reg: 2.2031 detection_loss_cls: 0.0273 detection_loss_reg: 0.3205 semantic_segmentation_loss_cls: 0.0071 instance_segmentation_loss_cls: 0.0276 instance_segmentation_loss_reg: 0.3197 instance_segmentation_loss_poly: 0.8150 +2023/11/08 18:27:17 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_20231108_024040 +2023/11/08 18:27:17 - mmengine - INFO - Iter(train) [640000/640000] base_lr: 2.0000e-06 lr: 2.0000e-06 eta: 0:00:00 time: 1.1121 data_time: 0.0372 memory: 21523 grad_norm: 4.3695 loss: 1.1146 caption_loss_cls: 1.9340 grounding_loss_reg: 2.2009 detection_loss_cls: 0.0273 detection_loss_reg: 0.3206 semantic_segmentation_loss_cls: 0.0070 instance_segmentation_loss_cls: 0.0276 instance_segmentation_loss_reg: 0.3198 instance_segmentation_loss_poly: 0.8150 +2023/11/08 18:27:17 - mmengine - INFO - Saving checkpoint at 640000 iterations +2023/11/08 18:36:08 - mmengine - INFO - Evaluating bbox... +2023/11/08 18:37:05 - mmengine - INFO - bbox_mAP_copypaste: 0.467 0.642 0.507 0.293 0.516 0.614 +2023/11/08 18:37:05 - mmengine - INFO - Evaluating segm... +2023/11/08 18:38:17 - mmengine - INFO - segm_mAP_copypaste: 0.319 0.564 0.314 0.164 0.363 0.491 +2023/11/08 18:42:58 - mmengine - INFO - per class results: +2023/11/08 18:42:58 - mmengine - INFO - ++---------------------+-------+-------+ +| Class | IoU | Acc | ++---------------------+-------+-------+ +| wall | 76.13 | 88.46 | +| building | 80.57 | 90.44 | +| sky | 92.88 | 97.64 | +| floor | 80.05 | 90.12 | +| tree | 73.05 | 86.42 | +| ceiling | 83.67 | 93.6 | +| road | 83.06 | 89.35 | +| bed | 88.1 | 94.62 | +| windowpane | 60.31 | 76.59 | +| grass | 66.96 | 85.01 | +| cabinet | 60.53 | 72.41 | +| sidewalk | 67.99 | 82.45 | +| person | 79.43 | 91.66 | +| earth | 38.6 | 51.9 | +| door | 50.36 | 64.9 | +| table | 59.6 | 75.9 | +| mountain | 53.66 | 68.44 | +| plant | 51.58 | 63.28 | +| curtain | 67.4 | 81.98 | +| chair | 57.19 | 71.32 | +| car | 82.84 | 90.36 | +| water | 50.88 | 66.08 | +| painting | 70.79 | 86.82 | +| sofa | 67.89 | 82.09 | +| shelf | 43.48 | 64.68 | +| house | 43.69 | 62.82 | +| sea | 47.27 | 69.33 | +| mirror | 63.04 | 72.47 | +| rug | 64.11 | 74.35 | +| field | 28.87 | 41.1 | +| armchair | 44.22 | 62.93 | +| seat | 62.05 | 79.78 | +| fence | 42.5 | 61.31 | +| desk | 45.98 | 66.34 | +| rock | 36.05 | 54.41 | +| wardrobe | 44.26 | 59.93 | +| lamp | 60.67 | 74.88 | +| bathtub | 78.45 | 86.26 | +| railing | 28.29 | 43.21 | +| cushion | 57.86 | 70.29 | +| base | 25.02 | 34.61 | +| box | 25.93 | 33.31 | +| column | 47.25 | 58.71 | +| signboard | 37.32 | 50.17 | +| chest of drawers | 34.45 | 52.1 | +| counter | 30.31 | 40.75 | +| sand | 33.69 | 50.18 | +| sink | 72.79 | 78.9 | +| skyscraper | 46.97 | 56.86 | +| fireplace | 73.64 | 85.99 | +| refrigerator | 75.04 | 83.06 | +| grandstand | 35.47 | 64.91 | +| path | 31.14 | 39.63 | +| stairs | 27.34 | 35.28 | +| runway | 68.69 | 83.38 | +| case | 45.68 | 58.35 | +| pool table | 87.61 | 95.48 | +| pillow | 55.79 | 67.89 | +| screen door | 67.9 | 75.71 | +| stairway | 31.19 | 37.82 | +| river | 15.93 | 31.37 | +| bridge | 69.06 | 79.59 | +| bookcase | 34.95 | 57.77 | +| blind | 23.97 | 26.01 | +| coffee table | 64.23 | 79.57 | +| toilet | 84.57 | 89.15 | +| flower | 35.23 | 49.06 | +| book | 45.58 | 66.89 | +| hill | 10.9 | 18.91 | +| bench | 47.05 | 53.05 | +| countertop | 51.78 | 64.23 | +| stove | 77.3 | 84.29 | +| palm | 44.17 | 56.7 | +| kitchen island | 40.33 | 71.61 | +| computer | 70.61 | 82.66 | +| swivel chair | 42.43 | 52.71 | +| boat | 75.81 | 85.37 | +| bar | 34.54 | 41.53 | +| arcade machine | 40.31 | 42.27 | +| hovel | 12.57 | 14.85 | +| bus | 85.66 | 95.17 | +| towel | 61.42 | 74.48 | +| light | 47.96 | 55.23 | +| truck | 41.16 | 49.05 | +| tower | 29.97 | 38.56 | +| chandelier | 62.64 | 77.93 | +| awning | 23.02 | 27.7 | +| streetlight | 28.41 | 35.8 | +| booth | 45.61 | 46.33 | +| television receiver | 67.18 | 78.79 | +| airplane | 56.21 | 66.7 | +| dirt track | 0.47 | 1.92 | +| apparel | 36.8 | 55.73 | +| pole | 30.01 | 41.21 | +| land | 0.5 | 0.67 | +| bannister | 13.06 | 17.58 | +| escalator | 27.18 | 28.52 | +| ottoman | 44.73 | 65.63 | +| bottle | 28.86 | 36.59 | +| buffet | 37.99 | 42.04 | +| poster | 26.79 | 36.94 | +| stage | 9.59 | 16.63 | +| van | 43.58 | 59.62 | +| ship | 38.37 | 40.53 | +| fountain | 11.5 | 11.78 | +| conveyer belt | 78.9 | 84.67 | +| canopy | 22.42 | 28.05 | +| washer | 69.18 | 71.21 | +| plaything | 36.52 | 51.37 | +| swimming pool | 55.6 | 71.24 | +| stool | 43.49 | 56.72 | +| barrel | 41.42 | 51.91 | +| basket | 29.28 | 44.32 | +| waterfall | 50.83 | 64.55 | +| tent | 92.13 | 97.63 | +| bag | 12.49 | 13.89 | +| minibike | 72.83 | 82.23 | +| cradle | 76.72 | 92.31 | +| oven | 44.92 | 57.41 | +| ball | 40.43 | 44.7 | +| food | 56.79 | 63.7 | +| step | 15.54 | 18.28 | +| tank | 38.33 | 43.97 | +| trade name | 25.7 | 31.51 | +| microwave | 82.9 | 89.83 | +| pot | 45.66 | 51.0 | +| animal | 61.28 | 65.07 | +| bicycle | 55.98 | 72.7 | +| lake | 61.95 | 66.39 | +| dishwasher | 52.42 | 73.67 | +| screen | 60.14 | 85.75 | +| blanket | 13.8 | 17.25 | +| sculpture | 58.74 | 70.81 | +| hood | 57.24 | 61.29 | +| sconce | 35.64 | 44.25 | +| vase | 41.69 | 55.93 | +| traffic light | 34.58 | 53.58 | +| tray | 11.75 | 17.92 | +| ashcan | 40.28 | 53.46 | +| fan | 56.78 | 69.4 | +| pier | 47.83 | 61.79 | +| crt screen | 7.26 | 19.16 | +| plate | 55.68 | 70.94 | +| monitor | 20.03 | 24.38 | +| bulletin board | 32.17 | 41.35 | +| shower | 4.81 | 10.52 | +| radiator | 49.28 | 54.6 | +| glass | 16.55 | 17.93 | +| clock | 27.13 | 32.51 | +| flag | 30.14 | 36.03 | ++---------------------+-------+-------+ +2023/11/08 18:43:13 - mmengine - INFO - Iter(val) [209/209] coco/bbox_mAP: 0.4670 coco/bbox_mAP_50: 0.6420 coco/bbox_mAP_75: 0.5070 coco/bbox_mAP_s: 0.2930 coco/bbox_mAP_m: 0.5160 coco/bbox_mAP_l: 0.6140 coco/segm_mAP: 0.3190 coco/segm_mAP_50: 0.5640 coco/segm_mAP_75: 0.3140 coco/segm_mAP_s: 0.1640 coco/segm_mAP_m: 0.3630 coco/segm_mAP_l: 0.4910 Bleu_1: 0.7648 Bleu_2: 0.6039 Bleu_3: 0.4645 Bleu_4: 0.3543 METEOR: 0.2727 ROUGE_L: 0.5636 CIDEr: 1.1257 SPICE: 0.2048 aAcc: 82.2700 mIoU: 47.8200 mAcc: 58.7000 visual-grounding/miou: 0.7907 visual-grounding/acc: 0.8584 data_time: 0.0044 time: 0.5221