diff --git "a/multi_large.log" "b/multi_large.log" new file mode 100644--- /dev/null +++ "b/multi_large.log" @@ -0,0 +1,7230 @@ +2024/01/01 11:06:28 - mmengine - INFO - Iter(train) [ 500/640000] base_lr: 2.0000e-04 lr: 2.0000e-05 eta: 10 days, 20:15:52 time: 1.4651 data_time: 0.0151 memory: 25725 grad_norm: 18.3564 loss: 4.6180 detection_loss_cls: 0.9718 detection_loss_reg: 0.7050 caption_loss_cls: 8.6409 grounding_loss_reg: 8.8402 semantic_segmentation_loss_cls: 0.2366 instance_segmentation_loss_cls: 0.5720 instance_segmentation_loss_reg: 0.7064 instance_segmentation_loss_poly: 2.7246 +2024/01/01 11:18:56 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240101_105140 +2024/01/01 11:18:56 - mmengine - INFO - Iter(train) [ 1000/640000] base_lr: 2.0000e-04 lr: 2.0000e-05 eta: 10 days, 22:46:09 time: 1.4804 data_time: 0.0159 memory: 25723 grad_norm: 12.4007 loss: 3.9507 detection_loss_cls: 0.6334 detection_loss_reg: 0.6433 caption_loss_cls: 6.8427 grounding_loss_reg: 7.8535 semantic_segmentation_loss_cls: 0.1537 instance_segmentation_loss_cls: 0.3903 instance_segmentation_loss_reg: 0.6582 instance_segmentation_loss_poly: 2.2974 +2024/01/01 11:31:01 - mmengine - INFO - Iter(train) [ 1500/640000] base_lr: 2.0000e-04 lr: 2.0000e-05 eta: 10 days, 20:45:39 time: 1.4702 data_time: 0.0154 memory: 25723 grad_norm: 9.6677 loss: 3.5662 detection_loss_cls: 0.4558 detection_loss_reg: 0.6426 caption_loss_cls: 6.0677 grounding_loss_reg: 7.4106 semantic_segmentation_loss_cls: 0.1157 instance_segmentation_loss_cls: 0.3310 instance_segmentation_loss_reg: 0.6447 instance_segmentation_loss_poly: 2.1918 +2024/01/01 11:43:16 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240101_105140 +2024/01/01 11:43:16 - mmengine - INFO - Iter(train) [ 2000/640000] base_lr: 2.0000e-04 lr: 2.0000e-05 eta: 10 days, 20:30:00 time: 1.4699 data_time: 0.0153 memory: 25723 grad_norm: 8.1815 loss: 3.3303 detection_loss_cls: 0.3652 detection_loss_reg: 0.6083 caption_loss_cls: 5.5511 grounding_loss_reg: 7.1288 semantic_segmentation_loss_cls: 0.0952 instance_segmentation_loss_cls: 0.2803 instance_segmentation_loss_reg: 0.6179 instance_segmentation_loss_poly: 2.0678 +2024/01/01 11:43:16 - mmengine - INFO - Saving checkpoint at 2000 iterations +2024/01/01 11:55:58 - mmengine - INFO - Iter(train) [ 2500/640000] base_lr: 1.9999e-04 lr: 1.9999e-05 eta: 10 days, 22:13:55 time: 1.4808 data_time: 0.0226 memory: 25723 grad_norm: 7.2556 loss: 3.1784 detection_loss_cls: 0.3091 detection_loss_reg: 0.5822 caption_loss_cls: 5.1766 grounding_loss_reg: 6.9412 semantic_segmentation_loss_cls: 0.0846 instance_segmentation_loss_cls: 0.2418 instance_segmentation_loss_reg: 0.5903 instance_segmentation_loss_poly: 1.9456 +2024/01/01 12:08:10 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240101_105140 +2024/01/01 12:08:10 - mmengine - INFO - Iter(train) [ 3000/640000] base_lr: 1.9999e-04 lr: 1.9999e-05 eta: 10 days, 21:32:43 time: 1.4781 data_time: 0.0214 memory: 25723 grad_norm: 6.6118 loss: 3.0571 detection_loss_cls: 0.2706 detection_loss_reg: 0.5562 caption_loss_cls: 4.9247 grounding_loss_reg: 6.7864 semantic_segmentation_loss_cls: 0.0759 instance_segmentation_loss_cls: 0.2163 instance_segmentation_loss_reg: 0.5618 instance_segmentation_loss_poly: 1.8453 +2024/01/01 12:20:12 - mmengine - INFO - Iter(train) [ 3500/640000] base_lr: 1.9999e-04 lr: 1.9999e-05 eta: 10 days, 20:28:56 time: 1.4733 data_time: 0.0205 memory: 25723 grad_norm: 6.1438 loss: 2.9765 detection_loss_cls: 0.2481 detection_loss_reg: 0.5486 caption_loss_cls: 4.7496 grounding_loss_reg: 6.6382 semantic_segmentation_loss_cls: 0.0684 instance_segmentation_loss_cls: 0.1995 instance_segmentation_loss_reg: 0.5519 instance_segmentation_loss_poly: 1.7946 +2024/01/01 12:32:42 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240101_105140 +2024/01/01 12:32:42 - mmengine - INFO - Iter(train) [ 4000/640000] base_lr: 1.9998e-04 lr: 1.9998e-05 eta: 10 days, 20:51:27 time: 1.4766 data_time: 0.0199 memory: 25723 grad_norm: 5.7425 loss: 2.8935 detection_loss_cls: 0.2287 detection_loss_reg: 0.5404 caption_loss_cls: 4.6269 grounding_loss_reg: 6.5379 semantic_segmentation_loss_cls: 0.0620 instance_segmentation_loss_cls: 0.1852 instance_segmentation_loss_reg: 0.5434 instance_segmentation_loss_poly: 1.7561 +2024/01/01 12:32:42 - mmengine - INFO - Saving checkpoint at 4000 iterations +2024/01/01 12:44:37 - mmengine - INFO - Iter(train) [ 4500/640000] base_lr: 1.9998e-04 lr: 1.9998e-05 eta: 10 days, 19:43:24 time: 1.4721 data_time: 0.0243 memory: 25723 grad_norm: 3.8512 loss: 2.6376 detection_loss_cls: 0.2141 detection_loss_reg: 0.5385 caption_loss_cls: 4.5191 grounding_loss_reg: 6.4273 semantic_segmentation_loss_cls: 0.0577 instance_segmentation_loss_cls: 0.1740 instance_segmentation_loss_reg: 0.5382 instance_segmentation_loss_poly: 1.7287 +2024/01/01 12:57:17 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240101_105140 +2024/01/01 12:57:17 - mmengine - INFO - Iter(train) [ 5000/640000] base_lr: 1.9997e-04 lr: 1.9997e-05 eta: 10 days, 20:23:56 time: 1.4752 data_time: 0.0243 memory: 25723 grad_norm: 3.3983 loss: 2.5065 detection_loss_cls: 0.1998 detection_loss_reg: 0.5272 caption_loss_cls: 4.4213 grounding_loss_reg: 6.3519 semantic_segmentation_loss_cls: 0.0541 instance_segmentation_loss_cls: 0.1628 instance_segmentation_loss_reg: 0.5279 instance_segmentation_loss_poly: 1.6873 +2024/01/01 13:09:35 - mmengine - INFO - Iter(train) [ 5500/640000] base_lr: 1.9996e-04 lr: 1.9997e-05 eta: 10 days, 20:10:16 time: 1.4784 data_time: 0.0245 memory: 25723 grad_norm: 3.2386 loss: 2.4497 detection_loss_cls: 0.1912 detection_loss_reg: 0.5268 caption_loss_cls: 4.3268 grounding_loss_reg: 6.2690 semantic_segmentation_loss_cls: 0.0510 instance_segmentation_loss_cls: 0.1546 instance_segmentation_loss_reg: 0.5237 instance_segmentation_loss_poly: 1.6645 +2024/01/01 13:21:46 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240101_105140 +2024/01/01 13:21:46 - mmengine - INFO - Iter(train) [ 6000/640000] base_lr: 1.9996e-04 lr: 1.9996e-05 eta: 10 days, 19:46:21 time: 1.4776 data_time: 0.0246 memory: 25723 grad_norm: 3.1441 loss: 2.4188 detection_loss_cls: 0.1805 detection_loss_reg: 0.5189 caption_loss_cls: 4.2790 grounding_loss_reg: 6.1904 semantic_segmentation_loss_cls: 0.0488 instance_segmentation_loss_cls: 0.1479 instance_segmentation_loss_reg: 0.5168 instance_segmentation_loss_poly: 1.6440 +2024/01/01 13:21:46 - mmengine - INFO - Saving checkpoint at 6000 iterations +2024/01/01 13:33:47 - mmengine - INFO - Iter(train) [ 6500/640000] base_lr: 1.9995e-04 lr: 1.9995e-05 eta: 10 days, 19:07:14 time: 1.4673 data_time: 0.0244 memory: 25723 grad_norm: 3.0763 loss: 2.3836 detection_loss_cls: 0.1742 detection_loss_reg: 0.5151 caption_loss_cls: 4.2024 grounding_loss_reg: 6.1185 semantic_segmentation_loss_cls: 0.0464 instance_segmentation_loss_cls: 0.1426 instance_segmentation_loss_reg: 0.5145 instance_segmentation_loss_poly: 1.6318 +2024/01/01 13:45:52 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240101_105140 +2024/01/01 13:45:52 - mmengine - INFO - Iter(train) [ 7000/640000] base_lr: 1.9994e-04 lr: 1.9995e-05 eta: 10 days, 18:36:58 time: 1.4653 data_time: 0.0244 memory: 25723 grad_norm: 3.0238 loss: 2.3570 detection_loss_cls: 0.1667 detection_loss_reg: 0.5088 caption_loss_cls: 4.1531 grounding_loss_reg: 6.0437 semantic_segmentation_loss_cls: 0.0447 instance_segmentation_loss_cls: 0.1378 instance_segmentation_loss_reg: 0.5086 instance_segmentation_loss_poly: 1.6099 +2024/01/01 13:58:13 - mmengine - INFO - Iter(train) [ 7500/640000] base_lr: 1.9993e-04 lr: 1.9994e-05 eta: 10 days, 18:32:58 time: 1.4701 data_time: 0.0245 memory: 25723 grad_norm: 2.9712 loss: 2.3176 detection_loss_cls: 0.1615 detection_loss_reg: 0.5056 caption_loss_cls: 4.0920 grounding_loss_reg: 5.9832 semantic_segmentation_loss_cls: 0.0430 instance_segmentation_loss_cls: 0.1323 instance_segmentation_loss_reg: 0.5016 instance_segmentation_loss_poly: 1.5872 +2024/01/01 14:10:33 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240101_105140 +2024/01/01 14:10:33 - mmengine - INFO - Iter(train) [ 8000/640000] base_lr: 1.9992e-04 lr: 1.9993e-05 eta: 10 days, 18:26:24 time: 1.4677 data_time: 0.0244 memory: 25723 grad_norm: 2.9735 loss: 2.2952 detection_loss_cls: 0.1550 detection_loss_reg: 0.4988 caption_loss_cls: 4.0465 grounding_loss_reg: 5.9155 semantic_segmentation_loss_cls: 0.0418 instance_segmentation_loss_cls: 0.1276 instance_segmentation_loss_reg: 0.4949 instance_segmentation_loss_poly: 1.5618 +2024/01/01 14:10:33 - mmengine - INFO - Saving checkpoint at 8000 iterations +2024/01/01 14:22:55 - mmengine - INFO - Iter(train) [ 8500/640000] base_lr: 1.9991e-04 lr: 1.9992e-05 eta: 10 days, 18:20:52 time: 1.4744 data_time: 0.0243 memory: 25723 grad_norm: 2.9254 loss: 2.2362 detection_loss_cls: 0.1509 detection_loss_reg: 0.4968 caption_loss_cls: 3.9951 grounding_loss_reg: 5.8614 semantic_segmentation_loss_cls: 0.0405 instance_segmentation_loss_cls: 0.1244 instance_segmentation_loss_reg: 0.4926 instance_segmentation_loss_poly: 1.5504 +2024/01/01 14:35:09 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240101_105140 +2024/01/01 14:35:09 - mmengine - INFO - Iter(train) [ 9000/640000] base_lr: 1.9990e-04 lr: 1.9991e-05 eta: 10 days, 18:06:39 time: 1.4680 data_time: 0.0243 memory: 25723 grad_norm: 2.9319 loss: 2.2244 detection_loss_cls: 0.1469 detection_loss_reg: 0.4967 caption_loss_cls: 3.9487 grounding_loss_reg: 5.8104 semantic_segmentation_loss_cls: 0.0392 instance_segmentation_loss_cls: 0.1216 instance_segmentation_loss_reg: 0.4922 instance_segmentation_loss_poly: 1.5431 +2024/01/01 14:48:16 - mmengine - INFO - Iter(train) [ 9500/640000] base_lr: 1.9989e-04 lr: 1.9990e-05 eta: 10 days, 18:50:19 time: 1.4803 data_time: 0.0245 memory: 25723 grad_norm: 2.8805 loss: 2.1784 detection_loss_cls: 0.1431 detection_loss_reg: 0.4962 caption_loss_cls: 3.9195 grounding_loss_reg: 5.7646 semantic_segmentation_loss_cls: 0.0381 instance_segmentation_loss_cls: 0.1185 instance_segmentation_loss_reg: 0.4925 instance_segmentation_loss_poly: 1.5367 +2024/01/01 15:00:24 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240101_105140 +2024/01/01 15:00:24 - mmengine - INFO - Iter(train) [ 10000/640000] base_lr: 1.9988e-04 lr: 1.9989e-05 eta: 10 days, 18:26:52 time: 1.4795 data_time: 0.0245 memory: 25723 grad_norm: 2.8735 loss: 2.1384 detection_loss_cls: 0.1397 detection_loss_reg: 0.4933 caption_loss_cls: 3.8896 grounding_loss_reg: 5.7091 semantic_segmentation_loss_cls: 0.0370 instance_segmentation_loss_cls: 0.1154 instance_segmentation_loss_reg: 0.4888 instance_segmentation_loss_poly: 1.5212 +2024/01/01 15:00:24 - mmengine - INFO - Saving checkpoint at 10000 iterations +2024/01/01 15:13:32 - mmengine - INFO - Iter(train) [ 10500/640000] base_lr: 1.9987e-04 lr: 1.9988e-05 eta: 10 days, 19:03:33 time: 1.4961 data_time: 0.0246 memory: 25723 grad_norm: 2.8244 loss: 2.0816 detection_loss_cls: 0.1357 detection_loss_reg: 0.4917 caption_loss_cls: 3.8534 grounding_loss_reg: 5.6655 semantic_segmentation_loss_cls: 0.0361 instance_segmentation_loss_cls: 0.1128 instance_segmentation_loss_reg: 0.4867 instance_segmentation_loss_poly: 1.5109 +2024/01/01 15:26:11 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240101_105140 +2024/01/01 15:26:11 - mmengine - INFO - Iter(train) [ 11000/640000] base_lr: 1.9986e-04 lr: 1.9987e-05 eta: 10 days, 19:08:36 time: 1.5048 data_time: 0.0247 memory: 25723 grad_norm: 2.7812 loss: 2.0374 detection_loss_cls: 0.1324 detection_loss_reg: 0.4874 caption_loss_cls: 3.8223 grounding_loss_reg: 5.6319 semantic_segmentation_loss_cls: 0.0352 instance_segmentation_loss_cls: 0.1101 instance_segmentation_loss_reg: 0.4819 instance_segmentation_loss_poly: 1.4935 +2024/01/01 15:38:20 - mmengine - INFO - Iter(train) [ 11500/640000] base_lr: 1.9984e-04 lr: 1.9986e-05 eta: 10 days, 18:45:02 time: 1.5018 data_time: 0.0246 memory: 25723 grad_norm: 2.7878 loss: 2.0249 detection_loss_cls: 0.1294 detection_loss_reg: 0.4860 caption_loss_cls: 3.7924 grounding_loss_reg: 5.5938 semantic_segmentation_loss_cls: 0.0345 instance_segmentation_loss_cls: 0.1081 instance_segmentation_loss_reg: 0.4807 instance_segmentation_loss_poly: 1.4853 +2024/01/01 15:49:41 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240101_105140 +2024/01/01 15:49:41 - mmengine - INFO - Iter(train) [ 12000/640000] base_lr: 1.9983e-04 lr: 1.9984e-05 eta: 10 days, 17:39:52 time: 1.4869 data_time: 0.0244 memory: 25723 grad_norm: 2.8085 loss: 2.0147 detection_loss_cls: 0.1272 detection_loss_reg: 0.4833 caption_loss_cls: 3.7625 grounding_loss_reg: 5.5560 semantic_segmentation_loss_cls: 0.0338 instance_segmentation_loss_cls: 0.1065 instance_segmentation_loss_reg: 0.4785 instance_segmentation_loss_poly: 1.4773 +2024/01/01 15:49:41 - mmengine - INFO - Saving checkpoint at 12000 iterations +2024/01/01 16:02:21 - mmengine - INFO - Iter(train) [ 12500/640000] base_lr: 1.9981e-04 lr: 1.9983e-05 eta: 10 days, 17:45:35 time: 1.4916 data_time: 0.0244 memory: 25723 grad_norm: 2.8299 loss: 2.0150 detection_loss_cls: 0.1252 detection_loss_reg: 0.4842 caption_loss_cls: 3.7370 grounding_loss_reg: 5.5180 semantic_segmentation_loss_cls: 0.0332 instance_segmentation_loss_cls: 0.1044 instance_segmentation_loss_reg: 0.4776 instance_segmentation_loss_poly: 1.4694 +2024/01/01 16:14:00 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240101_105140 +2024/01/01 16:14:00 - mmengine - INFO - Iter(train) [ 13000/640000] base_lr: 1.9980e-04 lr: 1.9982e-05 eta: 10 days, 17:00:54 time: 1.4827 data_time: 0.0242 memory: 25723 grad_norm: 2.8475 loss: 2.0013 detection_loss_cls: 0.1223 detection_loss_reg: 0.4809 caption_loss_cls: 3.7053 grounding_loss_reg: 5.4819 semantic_segmentation_loss_cls: 0.0326 instance_segmentation_loss_cls: 0.1031 instance_segmentation_loss_reg: 0.4769 instance_segmentation_loss_poly: 1.4650 +2024/01/01 16:26:13 - mmengine - INFO - Iter(train) [ 13500/640000] base_lr: 1.9978e-04 lr: 1.9980e-05 eta: 10 days, 16:44:43 time: 1.4692 data_time: 0.0240 memory: 25723 grad_norm: 2.9256 loss: 2.0132 detection_loss_cls: 0.1205 detection_loss_reg: 0.4794 caption_loss_cls: 3.6882 grounding_loss_reg: 5.4503 semantic_segmentation_loss_cls: 0.0320 instance_segmentation_loss_cls: 0.1012 instance_segmentation_loss_reg: 0.4743 instance_segmentation_loss_poly: 1.4557 +2024/01/01 16:38:49 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240101_105140 +2024/01/01 16:38:49 - mmengine - INFO - Iter(train) [ 14000/640000] base_lr: 1.9977e-04 lr: 1.9979e-05 eta: 10 days, 16:46:07 time: 1.4761 data_time: 0.0241 memory: 25723 grad_norm: 2.9406 loss: 1.9967 detection_loss_cls: 0.1187 detection_loss_reg: 0.4779 caption_loss_cls: 3.6627 grounding_loss_reg: 5.4153 semantic_segmentation_loss_cls: 0.0315 instance_segmentation_loss_cls: 0.0995 instance_segmentation_loss_reg: 0.4722 instance_segmentation_loss_poly: 1.4455 +2024/01/01 16:38:49 - mmengine - INFO - Saving checkpoint at 14000 iterations +2024/01/01 16:51:00 - mmengine - INFO - Iter(train) [ 14500/640000] base_lr: 1.9975e-04 lr: 1.9977e-05 eta: 10 days, 16:28:24 time: 1.4619 data_time: 0.0238 memory: 25723 grad_norm: 3.0321 loss: 2.0219 detection_loss_cls: 0.1169 detection_loss_reg: 0.4760 caption_loss_cls: 3.6361 grounding_loss_reg: 5.3845 semantic_segmentation_loss_cls: 0.0310 instance_segmentation_loss_cls: 0.0980 instance_segmentation_loss_reg: 0.4696 instance_segmentation_loss_poly: 1.4371 +2024/01/01 17:03:06 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240101_105140 +2024/01/01 17:03:06 - mmengine - INFO - Iter(train) [ 15000/640000] base_lr: 1.9973e-04 lr: 1.9976e-05 eta: 10 days, 16:07:40 time: 1.4536 data_time: 0.0237 memory: 25723 grad_norm: 3.0722 loss: 2.0261 detection_loss_cls: 0.1151 detection_loss_reg: 0.4745 caption_loss_cls: 3.6106 grounding_loss_reg: 5.3550 semantic_segmentation_loss_cls: 0.0305 instance_segmentation_loss_cls: 0.0969 instance_segmentation_loss_reg: 0.4690 instance_segmentation_loss_poly: 1.4312 +2024/01/01 17:15:16 - mmengine - INFO - Iter(train) [ 15500/640000] base_lr: 1.9971e-04 lr: 1.9974e-05 eta: 10 days, 15:50:39 time: 1.4540 data_time: 0.0237 memory: 25723 grad_norm: 3.1346 loss: 2.0197 detection_loss_cls: 0.1135 detection_loss_reg: 0.4735 caption_loss_cls: 3.5950 grounding_loss_reg: 5.3224 semantic_segmentation_loss_cls: 0.0301 instance_segmentation_loss_cls: 0.0958 instance_segmentation_loss_reg: 0.4681 instance_segmentation_loss_poly: 1.4250 +2024/01/01 17:27:35 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240101_105140 +2024/01/01 17:27:35 - mmengine - INFO - Iter(train) [ 16000/640000] base_lr: 1.9969e-04 lr: 1.9972e-05 eta: 10 days, 15:39:13 time: 1.4685 data_time: 0.0238 memory: 25723 grad_norm: 3.1035 loss: 1.9959 detection_loss_cls: 0.1111 detection_loss_reg: 0.4688 caption_loss_cls: 3.5814 grounding_loss_reg: 5.2988 semantic_segmentation_loss_cls: 0.0298 instance_segmentation_loss_cls: 0.0944 instance_segmentation_loss_reg: 0.4640 instance_segmentation_loss_poly: 1.4126 +2024/01/01 17:27:35 - mmengine - INFO - Saving checkpoint at 16000 iterations +2024/01/01 17:39:44 - mmengine - INFO - Iter(train) [ 16500/640000] base_lr: 1.9968e-04 lr: 1.9970e-05 eta: 10 days, 15:21:31 time: 1.4607 data_time: 0.0235 memory: 25723 grad_norm: 3.1053 loss: 1.9739 detection_loss_cls: 0.1095 detection_loss_reg: 0.4683 caption_loss_cls: 3.5641 grounding_loss_reg: 5.2716 semantic_segmentation_loss_cls: 0.0294 instance_segmentation_loss_cls: 0.0936 instance_segmentation_loss_reg: 0.4646 instance_segmentation_loss_poly: 1.4104 +2024/01/01 17:52:53 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240101_105140 +2024/01/01 17:52:53 - mmengine - INFO - Iter(train) [ 17000/640000] base_lr: 1.9966e-04 lr: 1.9969e-05 eta: 10 days, 15:40:42 time: 1.4831 data_time: 0.0239 memory: 25723 grad_norm: 3.0561 loss: 1.9516 detection_loss_cls: 0.1082 detection_loss_reg: 0.4673 caption_loss_cls: 3.5475 grounding_loss_reg: 5.2496 semantic_segmentation_loss_cls: 0.0291 instance_segmentation_loss_cls: 0.0923 instance_segmentation_loss_reg: 0.4631 instance_segmentation_loss_poly: 1.4037 +2024/01/01 18:05:15 - mmengine - INFO - Iter(train) [ 17500/640000] base_lr: 1.9963e-04 lr: 1.9967e-05 eta: 10 days, 15:30:38 time: 1.4855 data_time: 0.0238 memory: 25723 grad_norm: 3.0298 loss: 1.9338 detection_loss_cls: 0.1067 detection_loss_reg: 0.4654 caption_loss_cls: 3.5312 grounding_loss_reg: 5.2263 semantic_segmentation_loss_cls: 0.0288 instance_segmentation_loss_cls: 0.0912 instance_segmentation_loss_reg: 0.4609 instance_segmentation_loss_poly: 1.3966 +2024/01/01 18:17:07 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240101_105140 +2024/01/01 18:17:07 - mmengine - INFO - Iter(train) [ 18000/640000] base_lr: 1.9961e-04 lr: 1.9965e-05 eta: 10 days, 15:02:56 time: 1.4746 data_time: 0.0237 memory: 25723 grad_norm: 3.0169 loss: 1.9263 detection_loss_cls: 0.1055 detection_loss_reg: 0.4642 caption_loss_cls: 3.5085 grounding_loss_reg: 5.2000 semantic_segmentation_loss_cls: 0.0284 instance_segmentation_loss_cls: 0.0901 instance_segmentation_loss_reg: 0.4598 instance_segmentation_loss_poly: 1.3927 +2024/01/01 18:17:07 - mmengine - INFO - Saving checkpoint at 18000 iterations +2024/01/01 18:29:07 - mmengine - INFO - Iter(train) [ 18500/640000] base_lr: 1.9959e-04 lr: 1.9963e-05 eta: 10 days, 14:40:31 time: 1.4719 data_time: 0.0238 memory: 25723 grad_norm: 3.0112 loss: 1.9192 detection_loss_cls: 0.1044 detection_loss_reg: 0.4637 caption_loss_cls: 3.4894 grounding_loss_reg: 5.1683 semantic_segmentation_loss_cls: 0.0281 instance_segmentation_loss_cls: 0.0891 instance_segmentation_loss_reg: 0.4589 instance_segmentation_loss_poly: 1.3890 +2024/01/01 18:42:03 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240101_105140 +2024/01/01 18:42:03 - mmengine - INFO - Iter(train) [ 19000/640000] base_lr: 1.9957e-04 lr: 1.9961e-05 eta: 10 days, 14:48:43 time: 1.4842 data_time: 0.0240 memory: 25723 grad_norm: 2.9895 loss: 1.9057 detection_loss_cls: 0.1033 detection_loss_reg: 0.4632 caption_loss_cls: 3.4755 grounding_loss_reg: 5.1415 semantic_segmentation_loss_cls: 0.0278 instance_segmentation_loss_cls: 0.0881 instance_segmentation_loss_reg: 0.4579 instance_segmentation_loss_poly: 1.3842 +2024/01/01 18:55:13 - mmengine - INFO - Iter(train) [ 19500/640000] base_lr: 1.9955e-04 lr: 1.9959e-05 eta: 10 days, 15:03:43 time: 1.4991 data_time: 0.0242 memory: 25723 grad_norm: 2.8946 loss: 1.8777 detection_loss_cls: 0.1021 detection_loss_reg: 0.4629 caption_loss_cls: 3.4615 grounding_loss_reg: 5.1225 semantic_segmentation_loss_cls: 0.0275 instance_segmentation_loss_cls: 0.0873 instance_segmentation_loss_reg: 0.4579 instance_segmentation_loss_poly: 1.3817 +2024/01/01 19:07:19 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240101_105140 +2024/01/01 19:07:19 - mmengine - INFO - Iter(train) [ 20000/640000] base_lr: 1.9952e-04 lr: 1.9957e-05 eta: 10 days, 14:44:27 time: 1.4960 data_time: 0.0244 memory: 25723 grad_norm: 3.8976 loss: 1.8803 detection_loss_cls: 0.1009 detection_loss_reg: 0.4606 caption_loss_cls: 3.3277 grounding_loss_reg: 5.0974 semantic_segmentation_loss_cls: 0.0237 instance_segmentation_loss_cls: 0.0864 instance_segmentation_loss_reg: 0.4561 instance_segmentation_loss_poly: 1.3752 +2024/01/01 19:07:19 - mmengine - INFO - Saving checkpoint at 20000 iterations +2024/01/01 19:19:35 - mmengine - INFO - Evaluating bbox... +2024/01/01 19:20:31 - mmengine - INFO - bbox_mAP_copypaste: 0.268 0.455 0.292 0.171 0.333 0.330 +2024/01/01 19:20:31 - mmengine - INFO - Evaluating segm... +2024/01/01 19:21:43 - mmengine - INFO - segm_mAP_copypaste: 0.143 0.331 0.106 0.064 0.195 0.238 +2024/01/01 19:28:19 - mmengine - INFO - per class results: +2024/01/01 19:28:19 - mmengine - INFO - ++---------------------+-------+-------+ +| Class | IoU | Acc | ++---------------------+-------+-------+ +| wall | 73.52 | 87.73 | +| building | 77.11 | 85.02 | +| sky | 89.97 | 97.72 | +| floor | 79.75 | 87.85 | +| tree | 69.4 | 86.66 | +| ceiling | 81.57 | 91.26 | +| road | 73.44 | 93.17 | +| bed | 82.19 | 93.02 | +| windowpane | 56.34 | 76.59 | +| grass | 58.35 | 88.48 | +| cabinet | 53.84 | 64.95 | +| sidewalk | 50.11 | 59.53 | +| person | 74.32 | 82.35 | +| earth | 25.37 | 28.83 | +| door | 40.58 | 53.05 | +| table | 49.66 | 71.26 | +| mountain | 53.21 | 82.31 | +| plant | 45.73 | 57.94 | +| curtain | 65.4 | 82.79 | +| chair | 45.7 | 53.73 | +| car | 77.12 | 86.47 | +| water | 54.61 | 73.38 | +| painting | 59.07 | 84.69 | +| sofa | 59.26 | 84.08 | +| shelf | 13.6 | 15.27 | +| house | 34.28 | 54.55 | +| sea | 45.61 | 58.37 | +| mirror | 47.09 | 70.02 | +| rug | 63.81 | 69.54 | +| field | 22.33 | 41.85 | +| armchair | 29.17 | 42.96 | +| seat | 45.36 | 78.63 | +| fence | 31.88 | 62.2 | +| desk | 30.35 | 50.31 | +| rock | 37.89 | 48.32 | +| wardrobe | 44.46 | 56.76 | +| lamp | 50.47 | 66.69 | +| bathtub | 64.51 | 76.02 | +| railing | 25.29 | 31.82 | +| cushion | 33.27 | 40.44 | +| base | 19.86 | 45.89 | +| box | 16.62 | 23.92 | +| column | 40.24 | 45.06 | +| signboard | 31.5 | 47.22 | +| chest of drawers | 31.24 | 59.66 | +| counter | 23.62 | 26.92 | +| sand | 24.48 | 53.09 | +| sink | 51.68 | 59.33 | +| skyscraper | 42.4 | 48.83 | +| fireplace | 52.19 | 60.83 | +| refrigerator | 59.78 | 66.86 | +| grandstand | 38.79 | 64.75 | +| path | 19.4 | 37.01 | +| stairs | 36.65 | 42.73 | +| runway | 65.28 | 89.82 | +| case | 43.79 | 53.36 | +| pool table | 86.41 | 94.64 | +| pillow | 47.7 | 78.23 | +| screen door | 15.11 | 15.16 | +| stairway | 34.38 | 39.69 | +| river | 16.59 | 19.34 | +| bridge | 53.21 | 56.93 | +| bookcase | 14.3 | 78.01 | +| blind | 0.34 | 0.34 | +| coffee table | 50.75 | 78.56 | +| toilet | 75.11 | 84.17 | +| flower | 26.18 | 41.88 | +| book | 25.51 | 29.79 | +| hill | 4.32 | 4.47 | +| bench | 32.04 | 37.8 | +| countertop | 46.72 | 64.42 | +| stove | 55.07 | 74.68 | +| palm | 40.56 | 48.11 | +| kitchen island | 22.21 | 37.25 | +| computer | 52.56 | 70.08 | +| swivel chair | 36.29 | 48.84 | +| boat | 58.3 | 78.03 | +| bar | 9.49 | 10.02 | +| arcade machine | 9.01 | 9.12 | +| hovel | 25.82 | 30.23 | +| bus | 81.16 | 90.05 | +| towel | 44.01 | 48.57 | +| light | 37.77 | 45.52 | +| truck | 28.23 | 39.74 | +| tower | 4.53 | 5.31 | +| chandelier | 48.94 | 55.65 | +| awning | 20.07 | 35.07 | +| streetlight | 13.53 | 14.73 | +| booth | 31.74 | 33.27 | +| television receiver | 49.14 | 52.77 | +| airplane | 49.71 | 56.11 | +| dirt track | 3.83 | 16.84 | +| apparel | 21.84 | 38.44 | +| pole | 16.45 | 20.24 | +| land | 0.15 | 0.22 | +| bannister | 4.65 | 5.44 | +| escalator | 7.07 | 7.56 | +| ottoman | 24.67 | 29.23 | +| bottle | 20.79 | 29.03 | +| buffet | 31.27 | 38.37 | +| poster | 9.52 | 15.18 | +| stage | 2.94 | 3.37 | +| van | 8.34 | 9.08 | +| ship | 0.57 | 0.57 | +| fountain | 7.75 | 8.17 | +| conveyer belt | 64.79 | 68.14 | +| canopy | 19.96 | 24.41 | +| washer | 34.9 | 50.33 | +| plaything | 9.07 | 10.02 | +| swimming pool | 6.7 | 7.25 | +| stool | 16.85 | 17.67 | +| barrel | 12.86 | 62.33 | +| basket | 16.68 | 26.09 | +| waterfall | 68.04 | 82.83 | +| tent | 90.24 | 94.51 | +| bag | 12.49 | 16.14 | +| minibike | 58.07 | 68.54 | +| cradle | 46.31 | 57.41 | +| oven | 4.21 | 4.3 | +| ball | 39.64 | 49.19 | +| food | 49.93 | 57.08 | +| step | 6.19 | 6.64 | +| tank | 27.94 | 31.87 | +| trade name | 13.54 | 14.62 | +| microwave | 43.67 | 47.21 | +| pot | 25.17 | 29.34 | +| animal | 59.89 | 69.24 | +| bicycle | 44.43 | 63.8 | +| lake | 0.05 | 0.05 | +| dishwasher | 21.97 | 24.42 | +| screen | 63.92 | 80.3 | +| blanket | 8.2 | 9.28 | +| sculpture | 30.32 | 33.19 | +| hood | 41.26 | 45.27 | +| sconce | 4.85 | 4.91 | +| vase | 29.74 | 47.76 | +| traffic light | 20.39 | 33.8 | +| tray | 5.33 | 8.08 | +| ashcan | 21.79 | 37.12 | +| fan | 41.17 | 50.27 | +| pier | 19.28 | 73.74 | +| crt screen | 0.0 | 0.0 | +| plate | 32.07 | 39.7 | +| monitor | 0.69 | 0.75 | +| bulletin board | 11.94 | 12.59 | +| shower | 0.0 | 0.0 | +| radiator | 28.87 | 29.6 | +| glass | 2.27 | 2.29 | +| clock | 15.27 | 19.92 | +| flag | 21.94 | 23.97 | ++---------------------+-------+-------+ +2024/01/01 19:28:37 - mmengine - INFO - Iter(val) [209/209] coco/bbox_mAP: 0.2680 coco/bbox_mAP_50: 0.4550 coco/bbox_mAP_75: 0.2920 coco/bbox_mAP_s: 0.1710 coco/bbox_mAP_m: 0.3330 coco/bbox_mAP_l: 0.3300 coco/segm_mAP: 0.1430 coco/segm_mAP_50: 0.3310 coco/segm_mAP_75: 0.1060 coco/segm_mAP_s: 0.0640 coco/segm_mAP_m: 0.1950 coco/segm_mAP_l: 0.2380 Bleu_1: 0.6724 Bleu_2: 0.4918 Bleu_3: 0.3456 Bleu_4: 0.2409 METEOR: 0.2213 ROUGE_L: 0.4940 CIDEr: 0.7394 SPICE: 0.1512 aAcc: 78.0700 mIoU: 35.4100 mAcc: 46.0400 visual-grounding/miou: 0.5422 visual-grounding/acc: 0.6085 data_time: 0.0098 time: 1.3612 +2024/01/01 19:41:14 - mmengine - INFO - Iter(train) [ 20500/640000] base_lr: 1.9950e-04 lr: 1.9954e-05 eta: 10 days, 14:42:02 time: 1.5036 data_time: 0.0212 memory: 25726 grad_norm: 3.8677 loss: 1.8635 detection_loss_cls: 0.0793 detection_loss_reg: 0.4541 caption_loss_cls: 3.2723 grounding_loss_reg: 4.9960 semantic_segmentation_loss_cls: 0.0214 instance_segmentation_loss_cls: 0.0768 instance_segmentation_loss_reg: 0.4510 instance_segmentation_loss_poly: 1.3483 +2024/01/01 19:53:15 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240101_105140 +2024/01/01 19:53:15 - mmengine - INFO - Iter(train) [ 21000/640000] base_lr: 1.9947e-04 lr: 1.9952e-05 eta: 10 days, 14:20:24 time: 1.4867 data_time: 0.0211 memory: 25725 grad_norm: 3.9257 loss: 1.8630 detection_loss_cls: 0.0749 detection_loss_reg: 0.4494 caption_loss_cls: 3.2282 grounding_loss_reg: 4.9221 semantic_segmentation_loss_cls: 0.0201 instance_segmentation_loss_cls: 0.0712 instance_segmentation_loss_reg: 0.4461 instance_segmentation_loss_poly: 1.3247 +2024/01/01 20:05:37 - mmengine - INFO - Iter(train) [ 21500/640000] base_lr: 1.9945e-04 lr: 1.9950e-05 eta: 10 days, 14:09:09 time: 1.4865 data_time: 0.0214 memory: 25725 grad_norm: 3.9295 loss: 1.8482 detection_loss_cls: 0.0722 detection_loss_reg: 0.4454 caption_loss_cls: 3.1940 grounding_loss_reg: 4.8640 semantic_segmentation_loss_cls: 0.0196 instance_segmentation_loss_cls: 0.0666 instance_segmentation_loss_reg: 0.4400 instance_segmentation_loss_poly: 1.3035 +2024/01/01 20:18:33 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240101_105140 +2024/01/01 20:18:33 - mmengine - INFO - Iter(train) [ 22000/640000] base_lr: 1.9942e-04 lr: 1.9948e-05 eta: 10 days, 14:13:38 time: 1.5024 data_time: 0.0218 memory: 25725 grad_norm: 3.8952 loss: 1.8241 detection_loss_cls: 0.0703 detection_loss_reg: 0.4414 caption_loss_cls: 3.1667 grounding_loss_reg: 4.8158 semantic_segmentation_loss_cls: 0.0192 instance_segmentation_loss_cls: 0.0642 instance_segmentation_loss_reg: 0.4354 instance_segmentation_loss_poly: 1.2868 +2024/01/01 20:18:33 - mmengine - INFO - Saving checkpoint at 22000 iterations +2024/01/01 20:31:13 - mmengine - INFO - Iter(train) [ 22500/640000] base_lr: 1.9940e-04 lr: 1.9945e-05 eta: 10 days, 14:10:04 time: 1.5123 data_time: 0.0229 memory: 25725 grad_norm: 3.8700 loss: 1.8062 detection_loss_cls: 0.0690 detection_loss_reg: 0.4383 caption_loss_cls: 3.1470 grounding_loss_reg: 4.7558 semantic_segmentation_loss_cls: 0.0188 instance_segmentation_loss_cls: 0.0628 instance_segmentation_loss_reg: 0.4326 instance_segmentation_loss_poly: 1.2761 +2024/01/01 20:43:02 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240101_105140 +2024/01/01 20:43:02 - mmengine - INFO - Iter(train) [ 23000/640000] base_lr: 1.9937e-04 lr: 1.9943e-05 eta: 10 days, 13:43:35 time: 1.4958 data_time: 0.0229 memory: 25725 grad_norm: 3.8684 loss: 1.7909 detection_loss_cls: 0.0679 detection_loss_reg: 0.4362 caption_loss_cls: 3.1145 grounding_loss_reg: 4.7140 semantic_segmentation_loss_cls: 0.0185 instance_segmentation_loss_cls: 0.0619 instance_segmentation_loss_reg: 0.4312 instance_segmentation_loss_poly: 1.2690 +2024/01/01 20:54:58 - mmengine - INFO - Iter(train) [ 23500/640000] base_lr: 1.9934e-04 lr: 1.9940e-05 eta: 10 days, 13:20:51 time: 1.4774 data_time: 0.0227 memory: 25725 grad_norm: 3.9273 loss: 1.7907 detection_loss_cls: 0.0674 detection_loss_reg: 0.4364 caption_loss_cls: 3.0945 grounding_loss_reg: 4.6682 semantic_segmentation_loss_cls: 0.0182 instance_segmentation_loss_cls: 0.0612 instance_segmentation_loss_reg: 0.4298 instance_segmentation_loss_poly: 1.2631 +2024/01/01 21:06:24 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240101_105140 +2024/01/01 21:06:24 - mmengine - INFO - Iter(train) [ 24000/640000] base_lr: 1.9931e-04 lr: 1.9938e-05 eta: 10 days, 12:45:36 time: 1.4673 data_time: 0.0228 memory: 25725 grad_norm: 2.9728 loss: 1.7868 detection_loss_cls: 0.0664 detection_loss_reg: 0.4338 caption_loss_cls: 3.0700 grounding_loss_reg: 4.6192 semantic_segmentation_loss_cls: 0.0181 instance_segmentation_loss_cls: 0.0606 instance_segmentation_loss_reg: 0.4292 instance_segmentation_loss_poly: 1.2595 +2024/01/01 21:06:24 - mmengine - INFO - Saving checkpoint at 24000 iterations +2024/01/01 21:18:46 - mmengine - INFO - Iter(train) [ 24500/640000] base_lr: 1.9928e-04 lr: 1.9935e-05 eta: 10 days, 12:34:29 time: 1.4629 data_time: 0.0269 memory: 25725 grad_norm: 3.0298 loss: 1.7901 detection_loss_cls: 0.0658 detection_loss_reg: 0.4327 caption_loss_cls: 3.0482 grounding_loss_reg: 4.5712 semantic_segmentation_loss_cls: 0.0180 instance_segmentation_loss_cls: 0.0598 instance_segmentation_loss_reg: 0.4267 instance_segmentation_loss_poly: 1.2488 +2024/01/01 21:31:34 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240101_105140 +2024/01/01 21:31:34 - mmengine - INFO - Iter(train) [ 25000/640000] base_lr: 1.9926e-04 lr: 1.9932e-05 eta: 10 days, 12:34:07 time: 1.4745 data_time: 0.0272 memory: 25725 grad_norm: 2.9894 loss: 1.7775 detection_loss_cls: 0.0652 detection_loss_reg: 0.4315 caption_loss_cls: 3.0327 grounding_loss_reg: 4.5319 semantic_segmentation_loss_cls: 0.0179 instance_segmentation_loss_cls: 0.0594 instance_segmentation_loss_reg: 0.4258 instance_segmentation_loss_poly: 1.2437 +2024/01/01 21:44:11 - mmengine - INFO - Iter(train) [ 25500/640000] base_lr: 1.9923e-04 lr: 1.9930e-05 eta: 10 days, 12:29:05 time: 1.4784 data_time: 0.0273 memory: 25725 grad_norm: 2.9518 loss: 1.7650 detection_loss_cls: 0.0643 detection_loss_reg: 0.4291 caption_loss_cls: 3.0180 grounding_loss_reg: 4.4960 semantic_segmentation_loss_cls: 0.0177 instance_segmentation_loss_cls: 0.0588 instance_segmentation_loss_reg: 0.4234 instance_segmentation_loss_poly: 1.2357 +2024/01/01 21:56:46 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240101_105140 +2024/01/01 21:56:46 - mmengine - INFO - Iter(train) [ 26000/640000] base_lr: 1.9919e-04 lr: 1.9927e-05 eta: 10 days, 12:22:35 time: 1.4731 data_time: 0.0274 memory: 25725 grad_norm: 2.9769 loss: 1.7800 detection_loss_cls: 0.0638 detection_loss_reg: 0.4293 caption_loss_cls: 3.0000 grounding_loss_reg: 4.4586 semantic_segmentation_loss_cls: 0.0175 instance_segmentation_loss_cls: 0.0583 instance_segmentation_loss_reg: 0.4232 instance_segmentation_loss_poly: 1.2315 +2024/01/01 21:56:46 - mmengine - INFO - Saving checkpoint at 26000 iterations +2024/01/01 22:09:51 - mmengine - INFO - Iter(train) [ 26500/640000] base_lr: 1.9916e-04 lr: 1.9924e-05 eta: 10 days, 12:27:48 time: 1.4795 data_time: 0.0273 memory: 25725 grad_norm: 2.9376 loss: 1.7640 detection_loss_cls: 0.0630 detection_loss_reg: 0.4283 caption_loss_cls: 2.9821 grounding_loss_reg: 4.4271 semantic_segmentation_loss_cls: 0.0174 instance_segmentation_loss_cls: 0.0579 instance_segmentation_loss_reg: 0.4239 instance_segmentation_loss_poly: 1.2281 +2024/01/01 22:22:32 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240101_105140 +2024/01/01 22:22:32 - mmengine - INFO - Iter(train) [ 27000/640000] base_lr: 1.9913e-04 lr: 1.9921e-05 eta: 10 days, 12:23:04 time: 1.4924 data_time: 0.0276 memory: 25725 grad_norm: 2.9460 loss: 1.7604 detection_loss_cls: 0.0626 detection_loss_reg: 0.4273 caption_loss_cls: 2.9655 grounding_loss_reg: 4.3991 semantic_segmentation_loss_cls: 0.0172 instance_segmentation_loss_cls: 0.0573 instance_segmentation_loss_reg: 0.4222 instance_segmentation_loss_poly: 1.2200 +2024/01/01 22:36:02 - mmengine - INFO - Iter(train) [ 27500/640000] base_lr: 1.9910e-04 lr: 1.9918e-05 eta: 10 days, 12:36:27 time: 1.5159 data_time: 0.0281 memory: 25725 grad_norm: 2.9192 loss: 1.7433 detection_loss_cls: 0.0619 detection_loss_reg: 0.4260 caption_loss_cls: 2.9576 grounding_loss_reg: 4.3699 semantic_segmentation_loss_cls: 0.0171 instance_segmentation_loss_cls: 0.0570 instance_segmentation_loss_reg: 0.4221 instance_segmentation_loss_poly: 1.2163 +2024/01/01 22:47:54 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240101_105140 +2024/01/01 22:47:54 - mmengine - INFO - Iter(train) [ 28000/640000] base_lr: 1.9907e-04 lr: 1.9915e-05 eta: 10 days, 12:12:57 time: 1.5223 data_time: 0.0282 memory: 25725 grad_norm: 2.8873 loss: 1.7359 detection_loss_cls: 0.0618 detection_loss_reg: 0.4263 caption_loss_cls: 2.9470 grounding_loss_reg: 4.3420 semantic_segmentation_loss_cls: 0.0170 instance_segmentation_loss_cls: 0.0568 instance_segmentation_loss_reg: 0.4222 instance_segmentation_loss_poly: 1.2159 +2024/01/01 22:47:54 - mmengine - INFO - Saving checkpoint at 28000 iterations +2024/01/01 23:00:20 - mmengine - INFO - Iter(train) [ 28500/640000] base_lr: 1.9903e-04 lr: 1.9912e-05 eta: 10 days, 12:02:07 time: 1.5235 data_time: 0.0283 memory: 25725 grad_norm: 2.8597 loss: 1.7317 detection_loss_cls: 0.0613 detection_loss_reg: 0.4262 caption_loss_cls: 2.9302 grounding_loss_reg: 4.3180 semantic_segmentation_loss_cls: 0.0169 instance_segmentation_loss_cls: 0.0561 instance_segmentation_loss_reg: 0.4201 instance_segmentation_loss_poly: 1.2088 +2024/01/01 23:12:50 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240101_105140 +2024/01/01 23:12:50 - mmengine - INFO - Iter(train) [ 29000/640000] base_lr: 1.9900e-04 lr: 1.9909e-05 eta: 10 days, 11:52:24 time: 1.5189 data_time: 0.0282 memory: 25725 grad_norm: 2.8694 loss: 1.7322 detection_loss_cls: 0.0608 detection_loss_reg: 0.4242 caption_loss_cls: 2.9207 grounding_loss_reg: 4.2928 semantic_segmentation_loss_cls: 0.0167 instance_segmentation_loss_cls: 0.0556 instance_segmentation_loss_reg: 0.4186 instance_segmentation_loss_poly: 1.2031 +2024/01/01 23:24:54 - mmengine - INFO - Iter(train) [ 29500/640000] base_lr: 1.9896e-04 lr: 1.9906e-05 eta: 10 days, 11:33:49 time: 1.5106 data_time: 0.0280 memory: 25725 grad_norm: 2.9222 loss: 1.7358 detection_loss_cls: 0.0600 detection_loss_reg: 0.4206 caption_loss_cls: 2.9040 grounding_loss_reg: 4.2664 semantic_segmentation_loss_cls: 0.0167 instance_segmentation_loss_cls: 0.0551 instance_segmentation_loss_reg: 0.4147 instance_segmentation_loss_poly: 1.1937 +2024/01/01 23:36:44 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240101_105140 +2024/01/01 23:36:44 - mmengine - INFO - Iter(train) [ 30000/640000] base_lr: 1.9893e-04 lr: 1.9903e-05 eta: 10 days, 11:10:42 time: 1.4995 data_time: 0.0277 memory: 25725 grad_norm: 3.0019 loss: 1.7298 detection_loss_cls: 0.0599 detection_loss_reg: 0.4207 caption_loss_cls: 2.8925 grounding_loss_reg: 4.2408 semantic_segmentation_loss_cls: 0.0165 instance_segmentation_loss_cls: 0.0550 instance_segmentation_loss_reg: 0.4147 instance_segmentation_loss_poly: 1.1919 +2024/01/01 23:36:44 - mmengine - INFO - Saving checkpoint at 30000 iterations +2024/01/01 23:49:49 - mmengine - INFO - Iter(train) [ 30500/640000] base_lr: 1.9889e-04 lr: 1.9899e-05 eta: 10 days, 11:13:10 time: 1.4996 data_time: 0.0278 memory: 25725 grad_norm: 3.0241 loss: 1.7332 detection_loss_cls: 0.0595 detection_loss_reg: 0.4195 caption_loss_cls: 2.8851 grounding_loss_reg: 4.2188 semantic_segmentation_loss_cls: 0.0164 instance_segmentation_loss_cls: 0.0547 instance_segmentation_loss_reg: 0.4138 instance_segmentation_loss_poly: 1.1879 +2024/01/02 00:01:23 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240101_105140 +2024/01/02 00:01:23 - mmengine - INFO - Iter(train) [ 31000/640000] base_lr: 1.9886e-04 lr: 1.9896e-05 eta: 10 days, 10:44:58 time: 1.4827 data_time: 0.0274 memory: 25725 grad_norm: 3.0633 loss: 1.7411 detection_loss_cls: 0.0593 detection_loss_reg: 0.4194 caption_loss_cls: 2.8743 grounding_loss_reg: 4.1917 semantic_segmentation_loss_cls: 0.0163 instance_segmentation_loss_cls: 0.0546 instance_segmentation_loss_reg: 0.4133 instance_segmentation_loss_poly: 1.1860 +2024/01/02 00:13:26 - mmengine - INFO - Iter(train) [ 31500/640000] base_lr: 1.9882e-04 lr: 1.9893e-05 eta: 10 days, 10:26:39 time: 1.4608 data_time: 0.0271 memory: 25725 grad_norm: 3.0703 loss: 1.7501 detection_loss_cls: 0.0590 detection_loss_reg: 0.4187 caption_loss_cls: 2.8609 grounding_loss_reg: 4.1707 semantic_segmentation_loss_cls: 0.0162 instance_segmentation_loss_cls: 0.0542 instance_segmentation_loss_reg: 0.4118 instance_segmentation_loss_poly: 1.1822 +2024/01/02 00:25:06 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240101_105140 +2024/01/02 00:25:06 - mmengine - INFO - Iter(train) [ 32000/640000] base_lr: 1.9878e-04 lr: 1.9889e-05 eta: 10 days, 10:01:21 time: 1.4578 data_time: 0.0271 memory: 25725 grad_norm: 3.0820 loss: 1.7484 detection_loss_cls: 0.0586 detection_loss_reg: 0.4178 caption_loss_cls: 2.8519 grounding_loss_reg: 4.1459 semantic_segmentation_loss_cls: 0.0161 instance_segmentation_loss_cls: 0.0540 instance_segmentation_loss_reg: 0.4117 instance_segmentation_loss_poly: 1.1804 +2024/01/02 00:25:06 - mmengine - INFO - Saving checkpoint at 32000 iterations +2024/01/02 00:36:57 - mmengine - INFO - Iter(train) [ 32500/640000] base_lr: 1.9874e-04 lr: 1.9886e-05 eta: 10 days, 9:40:05 time: 1.4492 data_time: 0.0269 memory: 25725 grad_norm: 3.0896 loss: 1.7405 detection_loss_cls: 0.0583 detection_loss_reg: 0.4164 caption_loss_cls: 2.8422 grounding_loss_reg: 4.1176 semantic_segmentation_loss_cls: 0.0160 instance_segmentation_loss_cls: 0.0539 instance_segmentation_loss_reg: 0.4112 instance_segmentation_loss_poly: 1.1784 +2024/01/02 00:48:52 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240101_105140 +2024/01/02 00:48:52 - mmengine - INFO - Iter(train) [ 33000/640000] base_lr: 1.9870e-04 lr: 1.9882e-05 eta: 10 days, 9:20:11 time: 1.4406 data_time: 0.0267 memory: 25725 grad_norm: 3.1706 loss: 1.7459 detection_loss_cls: 0.0581 detection_loss_reg: 0.4159 caption_loss_cls: 2.8302 grounding_loss_reg: 4.0955 semantic_segmentation_loss_cls: 0.0160 instance_segmentation_loss_cls: 0.0538 instance_segmentation_loss_reg: 0.4104 instance_segmentation_loss_poly: 1.1751 +2024/01/02 01:00:54 - mmengine - INFO - Iter(train) [ 33500/640000] base_lr: 1.9866e-04 lr: 1.9879e-05 eta: 10 days, 9:02:23 time: 1.4399 data_time: 0.0268 memory: 25725 grad_norm: 3.1642 loss: 1.7486 detection_loss_cls: 0.0579 detection_loss_reg: 0.4158 caption_loss_cls: 2.8220 grounding_loss_reg: 4.0733 semantic_segmentation_loss_cls: 0.0159 instance_segmentation_loss_cls: 0.0537 instance_segmentation_loss_reg: 0.4107 instance_segmentation_loss_poly: 1.1737 +2024/01/02 01:13:12 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240101_105140 +2024/01/02 01:13:12 - mmengine - INFO - Iter(train) [ 34000/640000] base_lr: 1.9862e-04 lr: 1.9875e-05 eta: 10 days, 8:49:51 time: 1.4470 data_time: 0.0269 memory: 25725 grad_norm: 3.0996 loss: 1.7322 detection_loss_cls: 0.0577 detection_loss_reg: 0.4168 caption_loss_cls: 2.8124 grounding_loss_reg: 4.0563 semantic_segmentation_loss_cls: 0.0158 instance_segmentation_loss_cls: 0.0536 instance_segmentation_loss_reg: 0.4110 instance_segmentation_loss_poly: 1.1736 +2024/01/02 01:13:12 - mmengine - INFO - Saving checkpoint at 34000 iterations +2024/01/02 01:25:46 - mmengine - INFO - Iter(train) [ 34500/640000] base_lr: 1.9858e-04 lr: 1.9871e-05 eta: 10 days, 8:41:59 time: 1.4392 data_time: 0.0266 memory: 25725 grad_norm: 3.2384 loss: 1.7298 detection_loss_cls: 0.0577 detection_loss_reg: 0.4167 caption_loss_cls: 2.8098 grounding_loss_reg: 4.0389 semantic_segmentation_loss_cls: 0.0157 instance_segmentation_loss_cls: 0.0534 instance_segmentation_loss_reg: 0.4110 instance_segmentation_loss_poly: 1.1718 +2024/01/02 01:38:12 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240101_105140 +2024/01/02 01:38:12 - mmengine - INFO - Iter(train) [ 35000/640000] base_lr: 1.9854e-04 lr: 1.9868e-05 eta: 10 days, 8:31:28 time: 1.4522 data_time: 0.0270 memory: 25725 grad_norm: 3.2125 loss: 1.7323 detection_loss_cls: 0.0576 detection_loss_reg: 0.4161 caption_loss_cls: 2.8033 grounding_loss_reg: 4.0177 semantic_segmentation_loss_cls: 0.0156 instance_segmentation_loss_cls: 0.0533 instance_segmentation_loss_reg: 0.4111 instance_segmentation_loss_poly: 1.1705 +2024/01/02 01:51:33 - mmengine - INFO - Iter(train) [ 35500/640000] base_lr: 1.9850e-04 lr: 1.9864e-05 eta: 10 days, 8:36:38 time: 1.4718 data_time: 0.0273 memory: 25725 grad_norm: 3.1800 loss: 1.7122 detection_loss_cls: 0.0575 detection_loss_reg: 0.4162 caption_loss_cls: 2.7938 grounding_loss_reg: 4.0018 semantic_segmentation_loss_cls: 0.0155 instance_segmentation_loss_cls: 0.0527 instance_segmentation_loss_reg: 0.4089 instance_segmentation_loss_poly: 1.1643 +2024/01/02 02:04:15 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240101_105140 +2024/01/02 02:04:15 - mmengine - INFO - Iter(train) [ 36000/640000] base_lr: 1.9846e-04 lr: 1.9860e-05 eta: 10 days, 8:30:27 time: 1.4874 data_time: 0.0275 memory: 25725 grad_norm: 3.1463 loss: 1.6915 detection_loss_cls: 0.0574 detection_loss_reg: 0.4170 caption_loss_cls: 2.7845 grounding_loss_reg: 3.9842 semantic_segmentation_loss_cls: 0.0154 instance_segmentation_loss_cls: 0.0527 instance_segmentation_loss_reg: 0.4103 instance_segmentation_loss_poly: 1.1674 +2024/01/02 02:04:15 - mmengine - INFO - Saving checkpoint at 36000 iterations +2024/01/02 02:16:15 - mmengine - INFO - Iter(train) [ 36500/640000] base_lr: 1.9842e-04 lr: 1.9856e-05 eta: 10 days, 8:12:14 time: 1.4893 data_time: 0.0277 memory: 25725 grad_norm: 3.1723 loss: 1.6997 detection_loss_cls: 0.0570 detection_loss_reg: 0.4155 caption_loss_cls: 2.7801 grounding_loss_reg: 3.9634 semantic_segmentation_loss_cls: 0.0153 instance_segmentation_loss_cls: 0.0525 instance_segmentation_loss_reg: 0.4092 instance_segmentation_loss_poly: 1.1646 +2024/01/02 02:28:16 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240101_105140 +2024/01/02 02:28:16 - mmengine - INFO - Iter(train) [ 37000/640000] base_lr: 1.9837e-04 lr: 1.9852e-05 eta: 10 days, 7:54:51 time: 1.4910 data_time: 0.0278 memory: 25725 grad_norm: 3.1409 loss: 1.6996 detection_loss_cls: 0.0567 detection_loss_reg: 0.4157 caption_loss_cls: 2.7763 grounding_loss_reg: 3.9440 semantic_segmentation_loss_cls: 0.0153 instance_segmentation_loss_cls: 0.0523 instance_segmentation_loss_reg: 0.4088 instance_segmentation_loss_poly: 1.1626 +2024/01/02 02:40:47 - mmengine - INFO - Iter(train) [ 37500/640000] base_lr: 1.9833e-04 lr: 1.9848e-05 eta: 10 days, 7:45:24 time: 1.4984 data_time: 0.0279 memory: 25725 grad_norm: 3.1803 loss: 1.6902 detection_loss_cls: 0.0566 detection_loss_reg: 0.4159 caption_loss_cls: 2.7726 grounding_loss_reg: 3.9220 semantic_segmentation_loss_cls: 0.0152 instance_segmentation_loss_cls: 0.0522 instance_segmentation_loss_reg: 0.4093 instance_segmentation_loss_poly: 1.1619 +2024/01/02 02:52:48 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240101_105140 +2024/01/02 02:52:48 - mmengine - INFO - Iter(train) [ 38000/640000] base_lr: 1.9828e-04 lr: 1.9844e-05 eta: 10 days, 7:27:48 time: 1.4938 data_time: 0.0279 memory: 25725 grad_norm: 3.2093 loss: 1.7037 detection_loss_cls: 0.0563 detection_loss_reg: 0.4144 caption_loss_cls: 2.7705 grounding_loss_reg: 3.9084 semantic_segmentation_loss_cls: 0.0151 instance_segmentation_loss_cls: 0.0522 instance_segmentation_loss_reg: 0.4085 instance_segmentation_loss_poly: 1.1585 +2024/01/02 02:52:48 - mmengine - INFO - Saving checkpoint at 38000 iterations +2024/01/02 03:05:57 - mmengine - INFO - Iter(train) [ 38500/640000] base_lr: 1.9824e-04 lr: 1.9840e-05 eta: 10 days, 7:28:18 time: 1.5026 data_time: 0.0280 memory: 25725 grad_norm: 3.0784 loss: 1.6871 detection_loss_cls: 0.0561 detection_loss_reg: 0.4130 caption_loss_cls: 2.7685 grounding_loss_reg: 3.8959 semantic_segmentation_loss_cls: 0.0150 instance_segmentation_loss_cls: 0.0519 instance_segmentation_loss_reg: 0.4063 instance_segmentation_loss_poly: 1.1509 +2024/01/02 03:18:00 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240101_105140 +2024/01/02 03:18:00 - mmengine - INFO - Iter(train) [ 39000/640000] base_lr: 1.9819e-04 lr: 1.9836e-05 eta: 10 days, 7:11:25 time: 1.4969 data_time: 0.0278 memory: 25725 grad_norm: 3.0896 loss: 1.6857 detection_loss_cls: 0.0558 detection_loss_reg: 0.4112 caption_loss_cls: 2.7675 grounding_loss_reg: 3.8830 semantic_segmentation_loss_cls: 0.0150 instance_segmentation_loss_cls: 0.0518 instance_segmentation_loss_reg: 0.4054 instance_segmentation_loss_poly: 1.1478 +2024/01/02 03:30:24 - mmengine - INFO - Iter(train) [ 39500/640000] base_lr: 1.9814e-04 lr: 1.9831e-05 eta: 10 days, 7:00:08 time: 1.4827 data_time: 0.0276 memory: 25725 grad_norm: 3.1019 loss: 1.6848 detection_loss_cls: 0.0559 detection_loss_reg: 0.4103 caption_loss_cls: 2.7600 grounding_loss_reg: 3.8715 semantic_segmentation_loss_cls: 0.0149 instance_segmentation_loss_cls: 0.0516 instance_segmentation_loss_reg: 0.4033 instance_segmentation_loss_poly: 1.1423 +2024/01/02 03:42:56 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240101_105140 +2024/01/02 03:42:56 - mmengine - INFO - Iter(train) [ 40000/640000] base_lr: 1.9810e-04 lr: 1.9827e-05 eta: 10 days, 6:50:34 time: 1.4800 data_time: 0.0274 memory: 25725 grad_norm: 3.0658 loss: 1.6711 detection_loss_cls: 0.0559 detection_loss_reg: 0.4111 caption_loss_cls: 2.7502 grounding_loss_reg: 3.8575 semantic_segmentation_loss_cls: 0.0147 instance_segmentation_loss_cls: 0.0516 instance_segmentation_loss_reg: 0.4032 instance_segmentation_loss_poly: 1.1420 +2024/01/02 03:42:56 - mmengine - INFO - Saving checkpoint at 40000 iterations +2024/01/02 03:55:37 - mmengine - INFO - Evaluating bbox... +2024/01/02 03:56:32 - mmengine - INFO - bbox_mAP_copypaste: 0.355 0.535 0.389 0.221 0.424 0.450 +2024/01/02 03:56:32 - mmengine - INFO - Evaluating segm... +2024/01/02 03:57:44 - mmengine - INFO - segm_mAP_copypaste: 0.205 0.426 0.179 0.091 0.246 0.326 +2024/01/02 04:03:41 - mmengine - INFO - per class results: +2024/01/02 04:03:41 - mmengine - INFO - ++---------------------+-------+-------+ +| Class | IoU | Acc | ++---------------------+-------+-------+ +| wall | 75.63 | 86.28 | +| building | 80.82 | 92.77 | +| sky | 92.82 | 97.26 | +| floor | 80.15 | 87.04 | +| tree | 71.98 | 88.1 | +| ceiling | 82.56 | 90.45 | +| road | 80.4 | 91.13 | +| bed | 85.0 | 92.28 | +| windowpane | 59.52 | 82.23 | +| grass | 66.01 | 89.82 | +| cabinet | 59.17 | 74.62 | +| sidewalk | 59.21 | 73.05 | +| person | 77.96 | 91.43 | +| earth | 41.12 | 53.97 | +| door | 43.84 | 61.69 | +| table | 55.26 | 73.94 | +| mountain | 48.28 | 59.3 | +| plant | 49.68 | 61.09 | +| curtain | 69.64 | 88.28 | +| chair | 54.4 | 72.31 | +| car | 79.89 | 89.75 | +| water | 56.58 | 82.31 | +| painting | 67.08 | 73.15 | +| sofa | 63.05 | 75.25 | +| shelf | 41.05 | 66.17 | +| house | 37.8 | 42.03 | +| sea | 49.39 | 58.35 | +| mirror | 55.42 | 72.84 | +| rug | 67.15 | 72.79 | +| field | 18.53 | 21.67 | +| armchair | 36.63 | 51.08 | +| seat | 45.68 | 85.52 | +| fence | 38.89 | 63.71 | +| desk | 32.33 | 58.05 | +| rock | 33.28 | 71.47 | +| wardrobe | 36.7 | 40.18 | +| lamp | 53.23 | 67.44 | +| bathtub | 77.7 | 89.17 | +| railing | 32.02 | 40.94 | +| cushion | 50.86 | 68.82 | +| base | 21.83 | 31.33 | +| box | 23.47 | 31.06 | +| column | 47.72 | 59.59 | +| signboard | 26.56 | 36.3 | +| chest of drawers | 33.86 | 51.3 | +| counter | 38.29 | 53.82 | +| sand | 32.83 | 34.22 | +| sink | 64.3 | 77.18 | +| skyscraper | 28.8 | 30.11 | +| fireplace | 60.81 | 76.35 | +| refrigerator | 59.22 | 62.95 | +| grandstand | 50.44 | 66.8 | +| path | 17.64 | 27.47 | +| stairs | 37.67 | 54.97 | +| runway | 68.66 | 77.16 | +| case | 31.33 | 32.38 | +| pool table | 89.97 | 95.1 | +| pillow | 50.42 | 72.75 | +| screen door | 0.02 | 0.02 | +| stairway | 27.31 | 29.37 | +| river | 14.45 | 16.11 | +| bridge | 57.91 | 83.19 | +| bookcase | 17.84 | 18.59 | +| blind | 19.89 | 20.9 | +| coffee table | 53.2 | 68.48 | +| toilet | 74.21 | 90.38 | +| flower | 30.59 | 55.22 | +| book | 44.77 | 66.47 | +| hill | 0.06 | 0.06 | +| bench | 37.33 | 58.33 | +| countertop | 47.64 | 63.09 | +| stove | 62.48 | 80.54 | +| palm | 46.02 | 56.77 | +| kitchen island | 32.54 | 53.48 | +| computer | 57.88 | 74.1 | +| swivel chair | 28.23 | 33.23 | +| boat | 50.79 | 88.33 | +| bar | 43.12 | 55.53 | +| arcade machine | 49.14 | 51.02 | +| hovel | 37.81 | 67.27 | +| bus | 69.76 | 96.96 | +| towel | 48.44 | 76.55 | +| light | 45.92 | 59.3 | +| truck | 29.06 | 53.7 | +| tower | 30.0 | 43.19 | +| chandelier | 61.45 | 78.98 | +| awning | 5.94 | 7.75 | +| streetlight | 23.73 | 28.44 | +| booth | 29.55 | 36.4 | +| television receiver | 63.81 | 77.8 | +| airplane | 52.9 | 64.44 | +| dirt track | 0.0 | 0.0 | +| apparel | 15.68 | 20.53 | +| pole | 26.84 | 46.02 | +| land | 0.07 | 0.08 | +| bannister | 6.23 | 7.0 | +| escalator | 20.31 | 21.8 | +| ottoman | 46.48 | 59.1 | +| bottle | 22.33 | 29.64 | +| buffet | 28.84 | 34.3 | +| poster | 25.44 | 45.52 | +| stage | 7.69 | 16.16 | +| van | 35.63 | 48.15 | +| ship | 1.97 | 1.99 | +| fountain | 13.15 | 13.81 | +| conveyer belt | 42.41 | 93.98 | +| canopy | 8.28 | 9.18 | +| washer | 57.8 | 63.35 | +| plaything | 16.78 | 19.95 | +| swimming pool | 22.2 | 22.86 | +| stool | 37.87 | 53.18 | +| barrel | 15.25 | 41.71 | +| basket | 29.28 | 39.87 | +| waterfall | 67.55 | 83.93 | +| tent | 86.54 | 95.89 | +| bag | 18.58 | 21.21 | +| minibike | 64.62 | 80.68 | +| cradle | 55.8 | 64.98 | +| oven | 22.27 | 26.01 | +| ball | 43.62 | 55.21 | +| food | 55.24 | 68.24 | +| step | 4.86 | 5.22 | +| tank | 28.74 | 36.81 | +| trade name | 0.0 | 0.0 | +| microwave | 55.06 | 60.82 | +| pot | 35.63 | 46.47 | +| animal | 60.31 | 69.56 | +| bicycle | 53.43 | 70.74 | +| lake | 0.0 | 0.0 | +| dishwasher | 36.54 | 67.48 | +| screen | 70.75 | 79.49 | +| blanket | 7.49 | 8.08 | +| sculpture | 38.33 | 48.79 | +| hood | 50.52 | 58.43 | +| sconce | 27.09 | 39.58 | +| vase | 34.87 | 52.42 | +| traffic light | 24.63 | 30.62 | +| tray | 9.32 | 15.18 | +| ashcan | 32.16 | 58.49 | +| fan | 44.84 | 69.43 | +| pier | 31.94 | 50.27 | +| crt screen | 10.63 | 11.77 | +| plate | 43.89 | 64.0 | +| monitor | 14.49 | 16.27 | +| bulletin board | 38.27 | 58.32 | +| shower | 0.41 | 13.49 | +| radiator | 42.69 | 56.35 | +| glass | 11.76 | 12.7 | +| clock | 17.58 | 26.19 | +| flag | 27.72 | 31.75 | ++---------------------+-------+-------+ +2024/01/02 04:03:57 - mmengine - INFO - Iter(val) [209/209] coco/bbox_mAP: 0.3550 coco/bbox_mAP_50: 0.5350 coco/bbox_mAP_75: 0.3890 coco/bbox_mAP_s: 0.2210 coco/bbox_mAP_m: 0.4240 coco/bbox_mAP_l: 0.4500 coco/segm_mAP: 0.2050 coco/segm_mAP_50: 0.4260 coco/segm_mAP_75: 0.1790 coco/segm_mAP_s: 0.0910 coco/segm_mAP_m: 0.2460 coco/segm_mAP_l: 0.3260 Bleu_1: 0.6880 Bleu_2: 0.5018 Bleu_3: 0.3545 Bleu_4: 0.2460 METEOR: 0.2285 ROUGE_L: 0.5014 CIDEr: 0.7917 SPICE: 0.1598 aAcc: 80.8200 mIoU: 40.8900 mAcc: 53.1000 visual-grounding/miou: 0.6135 visual-grounding/acc: 0.6799 data_time: 0.0036 time: 1.3565 +2024/01/02 04:16:40 - mmengine - INFO - Iter(train) [ 40500/640000] base_lr: 1.9805e-04 lr: 1.9823e-05 eta: 10 days, 6:44:11 time: 1.4914 data_time: 0.0234 memory: 25725 grad_norm: 3.0031 loss: 1.6602 detection_loss_cls: 0.0557 detection_loss_reg: 0.4108 caption_loss_cls: 2.7463 grounding_loss_reg: 3.8454 semantic_segmentation_loss_cls: 0.0147 instance_segmentation_loss_cls: 0.0516 instance_segmentation_loss_reg: 0.4037 instance_segmentation_loss_poly: 1.1418 +2024/01/02 04:29:13 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240101_105140 +2024/01/02 04:29:13 - mmengine - INFO - Iter(train) [ 41000/640000] base_lr: 1.9800e-04 lr: 1.9818e-05 eta: 10 days, 6:34:50 time: 1.4992 data_time: 0.0234 memory: 25725 grad_norm: 2.9462 loss: 1.6260 detection_loss_cls: 0.0557 detection_loss_reg: 0.4105 caption_loss_cls: 2.7436 grounding_loss_reg: 3.8288 semantic_segmentation_loss_cls: 0.0147 instance_segmentation_loss_cls: 0.0515 instance_segmentation_loss_reg: 0.4038 instance_segmentation_loss_poly: 1.1416 +2024/01/02 04:41:27 - mmengine - INFO - Iter(train) [ 41500/640000] base_lr: 1.9795e-04 lr: 1.9814e-05 eta: 10 days, 6:20:44 time: 1.4950 data_time: 0.0233 memory: 25725 grad_norm: 2.9099 loss: 1.6331 detection_loss_cls: 0.0557 detection_loss_reg: 0.4115 caption_loss_cls: 2.7401 grounding_loss_reg: 3.8157 semantic_segmentation_loss_cls: 0.0146 instance_segmentation_loss_cls: 0.0513 instance_segmentation_loss_reg: 0.4026 instance_segmentation_loss_poly: 1.1371 +2024/01/02 04:53:48 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240101_105140 +2024/01/02 04:53:48 - mmengine - INFO - Iter(train) [ 42000/640000] base_lr: 1.9790e-04 lr: 1.9809e-05 eta: 10 days, 6:08:17 time: 1.5000 data_time: 0.0234 memory: 25725 grad_norm: 2.8844 loss: 1.6139 detection_loss_cls: 0.0554 detection_loss_reg: 0.4092 caption_loss_cls: 2.7394 grounding_loss_reg: 3.8016 semantic_segmentation_loss_cls: 0.0145 instance_segmentation_loss_cls: 0.0512 instance_segmentation_loss_reg: 0.4032 instance_segmentation_loss_poly: 1.1367 +2024/01/02 04:53:48 - mmengine - INFO - Saving checkpoint at 42000 iterations +2024/01/02 05:06:42 - mmengine - INFO - Iter(train) [ 42500/640000] base_lr: 1.9785e-04 lr: 1.9805e-05 eta: 10 days, 6:03:42 time: 1.4962 data_time: 0.0234 memory: 25725 grad_norm: 2.8758 loss: 1.6230 detection_loss_cls: 0.0553 detection_loss_reg: 0.4098 caption_loss_cls: 2.7368 grounding_loss_reg: 3.7859 semantic_segmentation_loss_cls: 0.0145 instance_segmentation_loss_cls: 0.0512 instance_segmentation_loss_reg: 0.4034 instance_segmentation_loss_poly: 1.1357 +2024/01/02 05:18:52 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240101_105140 +2024/01/02 05:18:52 - mmengine - INFO - Iter(train) [ 43000/640000] base_lr: 1.9780e-04 lr: 1.9800e-05 eta: 10 days, 5:48:49 time: 1.4981 data_time: 0.0235 memory: 25725 grad_norm: 2.8605 loss: 1.6190 detection_loss_cls: 0.0552 detection_loss_reg: 0.4101 caption_loss_cls: 2.7349 grounding_loss_reg: 3.7770 semantic_segmentation_loss_cls: 0.0144 instance_segmentation_loss_cls: 0.0509 instance_segmentation_loss_reg: 0.4030 instance_segmentation_loss_poly: 1.1344 +2024/01/02 05:31:30 - mmengine - INFO - Iter(train) [ 43500/640000] base_lr: 1.9775e-04 lr: 1.9796e-05 eta: 10 days, 5:40:12 time: 1.5013 data_time: 0.0237 memory: 25725 grad_norm: 2.8768 loss: 1.6281 detection_loss_cls: 0.0549 detection_loss_reg: 0.4092 caption_loss_cls: 2.7337 grounding_loss_reg: 3.7672 semantic_segmentation_loss_cls: 0.0143 instance_segmentation_loss_cls: 0.0507 instance_segmentation_loss_reg: 0.4027 instance_segmentation_loss_poly: 1.1325 +2024/01/02 05:43:15 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240101_105140 +2024/01/02 05:43:15 - mmengine - INFO - Iter(train) [ 44000/640000] base_lr: 1.9770e-04 lr: 1.9791e-05 eta: 10 days, 5:19:46 time: 1.4898 data_time: 0.0235 memory: 25725 grad_norm: 2.9771 loss: 1.6586 detection_loss_cls: 0.0548 detection_loss_reg: 0.4097 caption_loss_cls: 2.7274 grounding_loss_reg: 3.7556 semantic_segmentation_loss_cls: 0.0143 instance_segmentation_loss_cls: 0.0504 instance_segmentation_loss_reg: 0.4022 instance_segmentation_loss_poly: 1.1320 +2024/01/02 05:43:15 - mmengine - INFO - Saving checkpoint at 44000 iterations +2024/01/02 05:56:54 - mmengine - INFO - Iter(train) [ 44500/640000] base_lr: 1.9765e-04 lr: 1.9786e-05 eta: 10 days, 5:24:42 time: 1.5033 data_time: 0.0279 memory: 25725 grad_norm: 2.9567 loss: 1.6437 detection_loss_cls: 0.0545 detection_loss_reg: 0.4083 caption_loss_cls: 2.7291 grounding_loss_reg: 3.7477 semantic_segmentation_loss_cls: 0.0142 instance_segmentation_loss_cls: 0.0502 instance_segmentation_loss_reg: 0.4002 instance_segmentation_loss_poly: 1.1279 +2024/01/02 06:09:46 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240101_105140 +2024/01/02 06:09:46 - mmengine - INFO - Iter(train) [ 45000/640000] base_lr: 1.9759e-04 lr: 1.9781e-05 eta: 10 days, 5:19:01 time: 1.5080 data_time: 0.0279 memory: 25725 grad_norm: 2.9629 loss: 1.6594 detection_loss_cls: 0.0543 detection_loss_reg: 0.4073 caption_loss_cls: 2.7252 grounding_loss_reg: 3.7385 semantic_segmentation_loss_cls: 0.0141 instance_segmentation_loss_cls: 0.0499 instance_segmentation_loss_reg: 0.3990 instance_segmentation_loss_poly: 1.1239 +2024/01/02 06:22:04 - mmengine - INFO - Iter(train) [ 45500/640000] base_lr: 1.9754e-04 lr: 1.9776e-05 eta: 10 days, 5:05:48 time: 1.5092 data_time: 0.0278 memory: 25725 grad_norm: 2.9687 loss: 1.6491 detection_loss_cls: 0.0540 detection_loss_reg: 0.4055 caption_loss_cls: 2.7209 grounding_loss_reg: 3.7304 semantic_segmentation_loss_cls: 0.0141 instance_segmentation_loss_cls: 0.0496 instance_segmentation_loss_reg: 0.3976 instance_segmentation_loss_poly: 1.1184 +2024/01/02 06:34:33 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240101_105140 +2024/01/02 06:34:33 - mmengine - INFO - Iter(train) [ 46000/640000] base_lr: 1.9749e-04 lr: 1.9772e-05 eta: 10 days, 4:54:47 time: 1.5111 data_time: 0.0277 memory: 25725 grad_norm: 2.9474 loss: 1.6562 detection_loss_cls: 0.0539 detection_loss_reg: 0.4049 caption_loss_cls: 2.7212 grounding_loss_reg: 3.7253 semantic_segmentation_loss_cls: 0.0140 instance_segmentation_loss_cls: 0.0495 instance_segmentation_loss_reg: 0.3963 instance_segmentation_loss_poly: 1.1161 +2024/01/02 06:34:33 - mmengine - INFO - Saving checkpoint at 46000 iterations +2024/01/02 06:46:48 - mmengine - INFO - Iter(train) [ 46500/640000] base_lr: 1.9743e-04 lr: 1.9767e-05 eta: 10 days, 4:40:57 time: 1.5015 data_time: 0.0276 memory: 25725 grad_norm: 2.9823 loss: 1.6604 detection_loss_cls: 0.0537 detection_loss_reg: 0.4031 caption_loss_cls: 2.7235 grounding_loss_reg: 3.7135 semantic_segmentation_loss_cls: 0.0140 instance_segmentation_loss_cls: 0.0492 instance_segmentation_loss_reg: 0.3934 instance_segmentation_loss_poly: 1.1115 +2024/01/02 06:59:30 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240101_105140 +2024/01/02 06:59:30 - mmengine - INFO - Iter(train) [ 47000/640000] base_lr: 1.9738e-04 lr: 1.9762e-05 eta: 10 days, 4:32:41 time: 1.5093 data_time: 0.0276 memory: 25725 grad_norm: 2.9865 loss: 1.6422 detection_loss_cls: 0.0535 detection_loss_reg: 0.4015 caption_loss_cls: 2.7199 grounding_loss_reg: 3.7049 semantic_segmentation_loss_cls: 0.0139 instance_segmentation_loss_cls: 0.0491 instance_segmentation_loss_reg: 0.3929 instance_segmentation_loss_poly: 1.1089 +2024/01/02 07:11:08 - mmengine - INFO - Iter(train) [ 47500/640000] base_lr: 1.9732e-04 lr: 1.9756e-05 eta: 10 days, 4:11:13 time: 1.4945 data_time: 0.0271 memory: 25725 grad_norm: 3.0140 loss: 1.6378 detection_loss_cls: 0.0531 detection_loss_reg: 0.3998 caption_loss_cls: 2.7161 grounding_loss_reg: 3.6952 semantic_segmentation_loss_cls: 0.0139 instance_segmentation_loss_cls: 0.0489 instance_segmentation_loss_reg: 0.3922 instance_segmentation_loss_poly: 1.1056 +2024/01/02 07:23:09 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240101_105140 +2024/01/02 07:23:09 - mmengine - INFO - Iter(train) [ 48000/640000] base_lr: 1.9726e-04 lr: 1.9751e-05 eta: 10 days, 3:54:36 time: 1.4984 data_time: 0.0273 memory: 25725 grad_norm: 2.9633 loss: 1.6267 detection_loss_cls: 0.0530 detection_loss_reg: 0.3995 caption_loss_cls: 2.7114 grounding_loss_reg: 3.6844 semantic_segmentation_loss_cls: 0.0138 instance_segmentation_loss_cls: 0.0488 instance_segmentation_loss_reg: 0.3920 instance_segmentation_loss_poly: 1.1047 +2024/01/02 07:23:09 - mmengine - INFO - Saving checkpoint at 48000 iterations +2024/01/02 07:35:40 - mmengine - INFO - Iter(train) [ 48500/640000] base_lr: 1.9721e-04 lr: 1.9746e-05 eta: 10 days, 3:44:10 time: 1.4816 data_time: 0.0270 memory: 25725 grad_norm: 2.9885 loss: 1.6299 detection_loss_cls: 0.0530 detection_loss_reg: 0.4003 caption_loss_cls: 2.7099 grounding_loss_reg: 3.6737 semantic_segmentation_loss_cls: 0.0137 instance_segmentation_loss_cls: 0.0487 instance_segmentation_loss_reg: 0.3913 instance_segmentation_loss_poly: 1.1018 +2024/01/02 07:48:26 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240101_105140 +2024/01/02 07:48:26 - mmengine - INFO - Iter(train) [ 49000/640000] base_lr: 1.9715e-04 lr: 1.9741e-05 eta: 10 days, 3:36:38 time: 1.4800 data_time: 0.0272 memory: 25725 grad_norm: 2.9918 loss: 1.6332 detection_loss_cls: 0.0528 detection_loss_reg: 0.3995 caption_loss_cls: 2.7096 grounding_loss_reg: 3.6638 semantic_segmentation_loss_cls: 0.0137 instance_segmentation_loss_cls: 0.0486 instance_segmentation_loss_reg: 0.3917 instance_segmentation_loss_poly: 1.1009 +2024/01/02 08:01:03 - mmengine - INFO - Iter(train) [ 49500/640000] base_lr: 1.9709e-04 lr: 1.9736e-05 eta: 10 days, 3:27:16 time: 1.4847 data_time: 0.0273 memory: 25725 grad_norm: 2.9483 loss: 1.6258 detection_loss_cls: 0.0528 detection_loss_reg: 0.3998 caption_loss_cls: 2.7061 grounding_loss_reg: 3.6522 semantic_segmentation_loss_cls: 0.0137 instance_segmentation_loss_cls: 0.0485 instance_segmentation_loss_reg: 0.3925 instance_segmentation_loss_poly: 1.1027 +2024/01/02 08:13:12 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240101_105140 +2024/01/02 08:13:12 - mmengine - INFO - Iter(train) [ 50000/640000] base_lr: 1.9703e-04 lr: 1.9730e-05 eta: 10 days, 3:12:16 time: 1.4798 data_time: 0.0272 memory: 25725 grad_norm: 2.9677 loss: 1.6134 detection_loss_cls: 0.0526 detection_loss_reg: 0.3993 caption_loss_cls: 2.7019 grounding_loss_reg: 3.6436 semantic_segmentation_loss_cls: 0.0137 instance_segmentation_loss_cls: 0.0482 instance_segmentation_loss_reg: 0.3902 instance_segmentation_loss_poly: 1.0980 +2024/01/02 08:13:12 - mmengine - INFO - Saving checkpoint at 50000 iterations +2024/01/02 08:25:49 - mmengine - INFO - Iter(train) [ 50500/640000] base_lr: 1.9697e-04 lr: 1.9725e-05 eta: 10 days, 3:02:50 time: 1.4852 data_time: 0.0273 memory: 25725 grad_norm: 2.9259 loss: 1.5964 detection_loss_cls: 0.0523 detection_loss_reg: 0.3977 caption_loss_cls: 2.6985 grounding_loss_reg: 3.6387 semantic_segmentation_loss_cls: 0.0137 instance_segmentation_loss_cls: 0.0481 instance_segmentation_loss_reg: 0.3898 instance_segmentation_loss_poly: 1.0974 +2024/01/02 08:37:56 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240101_105140 +2024/01/02 08:37:56 - mmengine - INFO - Iter(train) [ 51000/640000] base_lr: 1.9691e-04 lr: 1.9719e-05 eta: 10 days, 2:47:28 time: 1.4765 data_time: 0.0272 memory: 25725 grad_norm: 2.9157 loss: 1.6063 detection_loss_cls: 0.0523 detection_loss_reg: 0.3984 caption_loss_cls: 2.7010 grounding_loss_reg: 3.6337 semantic_segmentation_loss_cls: 0.0136 instance_segmentation_loss_cls: 0.0480 instance_segmentation_loss_reg: 0.3899 instance_segmentation_loss_poly: 1.0964 +2024/01/02 08:49:54 - mmengine - INFO - Iter(train) [ 51500/640000] base_lr: 1.9685e-04 lr: 1.9714e-05 eta: 10 days, 2:30:36 time: 1.4814 data_time: 0.0273 memory: 25725 grad_norm: 2.9033 loss: 1.6008 detection_loss_cls: 0.0522 detection_loss_reg: 0.3981 caption_loss_cls: 2.6939 grounding_loss_reg: 3.6297 semantic_segmentation_loss_cls: 0.0136 instance_segmentation_loss_cls: 0.0477 instance_segmentation_loss_reg: 0.3891 instance_segmentation_loss_poly: 1.0936 +2024/01/02 09:02:07 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240101_105140 +2024/01/02 09:02:07 - mmengine - INFO - Iter(train) [ 52000/640000] base_lr: 1.9679e-04 lr: 1.9708e-05 eta: 10 days, 2:16:30 time: 1.4843 data_time: 0.0273 memory: 25725 grad_norm: 2.9070 loss: 1.5982 detection_loss_cls: 0.0521 detection_loss_reg: 0.3984 caption_loss_cls: 2.6924 grounding_loss_reg: 3.6191 semantic_segmentation_loss_cls: 0.0136 instance_segmentation_loss_cls: 0.0477 instance_segmentation_loss_reg: 0.3896 instance_segmentation_loss_poly: 1.0939 +2024/01/02 09:02:07 - mmengine - INFO - Saving checkpoint at 52000 iterations +2024/01/02 09:14:55 - mmengine - INFO - Iter(train) [ 52500/640000] base_lr: 1.9673e-04 lr: 1.9703e-05 eta: 10 days, 2:09:03 time: 1.4885 data_time: 0.0273 memory: 25725 grad_norm: 2.9179 loss: 1.6001 detection_loss_cls: 0.0521 detection_loss_reg: 0.3977 caption_loss_cls: 2.6951 grounding_loss_reg: 3.6132 semantic_segmentation_loss_cls: 0.0135 instance_segmentation_loss_cls: 0.0474 instance_segmentation_loss_reg: 0.3869 instance_segmentation_loss_poly: 1.0880 +2024/01/02 09:27:17 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240101_105140 +2024/01/02 09:27:17 - mmengine - INFO - Iter(train) [ 53000/640000] base_lr: 1.9667e-04 lr: 1.9697e-05 eta: 10 days, 1:56:45 time: 1.4826 data_time: 0.0271 memory: 25725 grad_norm: 2.9377 loss: 1.6005 detection_loss_cls: 0.0519 detection_loss_reg: 0.3974 caption_loss_cls: 2.6943 grounding_loss_reg: 3.6067 semantic_segmentation_loss_cls: 0.0135 instance_segmentation_loss_cls: 0.0473 instance_segmentation_loss_reg: 0.3865 instance_segmentation_loss_poly: 1.0876 +2024/01/02 09:39:13 - mmengine - INFO - Iter(train) [ 53500/640000] base_lr: 1.9661e-04 lr: 1.9691e-05 eta: 10 days, 1:39:32 time: 1.4722 data_time: 0.0268 memory: 25725 grad_norm: 2.9475 loss: 1.5882 detection_loss_cls: 0.0517 detection_loss_reg: 0.3970 caption_loss_cls: 2.6898 grounding_loss_reg: 3.5967 semantic_segmentation_loss_cls: 0.0135 instance_segmentation_loss_cls: 0.0470 instance_segmentation_loss_reg: 0.3853 instance_segmentation_loss_poly: 1.0840 +2024/01/02 09:51:39 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240101_105140 +2024/01/02 09:51:39 - mmengine - INFO - Iter(train) [ 54000/640000] base_lr: 1.9654e-04 lr: 1.9686e-05 eta: 10 days, 1:27:56 time: 1.4765 data_time: 0.0270 memory: 25725 grad_norm: 2.9100 loss: 1.5955 detection_loss_cls: 0.0515 detection_loss_reg: 0.3951 caption_loss_cls: 2.6879 grounding_loss_reg: 3.5910 semantic_segmentation_loss_cls: 0.0134 instance_segmentation_loss_cls: 0.0470 instance_segmentation_loss_reg: 0.3851 instance_segmentation_loss_poly: 1.0823 +2024/01/02 09:51:39 - mmengine - INFO - Saving checkpoint at 54000 iterations +2024/01/02 10:03:57 - mmengine - INFO - Iter(train) [ 54500/640000] base_lr: 1.9648e-04 lr: 1.9680e-05 eta: 10 days, 1:14:59 time: 1.4718 data_time: 0.0269 memory: 25725 grad_norm: 2.9092 loss: 1.6138 detection_loss_cls: 0.0513 detection_loss_reg: 0.3943 caption_loss_cls: 2.6863 grounding_loss_reg: 3.5835 semantic_segmentation_loss_cls: 0.0134 instance_segmentation_loss_cls: 0.0467 instance_segmentation_loss_reg: 0.3834 instance_segmentation_loss_poly: 1.0794 +2024/01/02 10:16:41 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240101_105140 +2024/01/02 10:16:41 - mmengine - INFO - Iter(train) [ 55000/640000] base_lr: 1.9641e-04 lr: 1.9674e-05 eta: 10 days, 1:06:36 time: 1.4812 data_time: 0.0272 memory: 25725 grad_norm: 2.9125 loss: 1.6072 detection_loss_cls: 0.0512 detection_loss_reg: 0.3943 caption_loss_cls: 2.6811 grounding_loss_reg: 3.5775 semantic_segmentation_loss_cls: 0.0133 instance_segmentation_loss_cls: 0.0468 instance_segmentation_loss_reg: 0.3850 instance_segmentation_loss_poly: 1.0826 +2024/01/02 10:29:19 - mmengine - INFO - Iter(train) [ 55500/640000] base_lr: 1.9635e-04 lr: 1.9668e-05 eta: 10 days, 0:56:58 time: 1.4910 data_time: 0.0274 memory: 25725 grad_norm: 2.8916 loss: 1.6083 detection_loss_cls: 0.0511 detection_loss_reg: 0.3939 caption_loss_cls: 2.6768 grounding_loss_reg: 3.5720 semantic_segmentation_loss_cls: 0.0133 instance_segmentation_loss_cls: 0.0466 instance_segmentation_loss_reg: 0.3836 instance_segmentation_loss_poly: 1.0794 +2024/01/02 10:42:58 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240101_105140 +2024/01/02 10:42:58 - mmengine - INFO - Iter(train) [ 56000/640000] base_lr: 1.9628e-04 lr: 1.9662e-05 eta: 10 days, 0:58:01 time: 1.5127 data_time: 0.0273 memory: 25725 grad_norm: 2.8811 loss: 1.5883 detection_loss_cls: 0.0509 detection_loss_reg: 0.3920 caption_loss_cls: 2.6795 grounding_loss_reg: 3.5663 semantic_segmentation_loss_cls: 0.0132 instance_segmentation_loss_cls: 0.0464 instance_segmentation_loss_reg: 0.3828 instance_segmentation_loss_poly: 1.0778 +2024/01/02 10:42:58 - mmengine - INFO - Saving checkpoint at 56000 iterations +2024/01/02 12:48:00 - mmengine - INFO - Iter(train) [ 56500/640000] base_lr: 1.9622e-04 lr: 1.9656e-05 eta: 9 days, 21:38:52 time: 1.5039 data_time: 0.0223 memory: 25721 grad_norm: 2.9124 loss: 1.5817 detection_loss_cls: 0.0510 detection_loss_reg: 0.3929 caption_loss_cls: 2.6683 grounding_loss_reg: 3.5612 semantic_segmentation_loss_cls: 0.0132 instance_segmentation_loss_cls: 0.0464 instance_segmentation_loss_reg: 0.3834 instance_segmentation_loss_poly: 1.0783 +2024/01/02 13:00:29 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240102_123251 +2024/01/02 13:00:29 - mmengine - INFO - Iter(train) [ 57000/640000] base_lr: 1.9615e-04 lr: 1.9650e-05 eta: 9 days, 23:53:19 time: 1.5054 data_time: 0.0219 memory: 25718 grad_norm: 2.9327 loss: 1.5805 detection_loss_cls: 0.0506 detection_loss_reg: 0.3908 caption_loss_cls: 2.6628 grounding_loss_reg: 3.5527 semantic_segmentation_loss_cls: 0.0131 instance_segmentation_loss_cls: 0.0463 instance_segmentation_loss_reg: 0.3829 instance_segmentation_loss_poly: 1.0762 +2024/01/02 13:12:40 - mmengine - INFO - Iter(train) [ 57500/640000] base_lr: 1.9608e-04 lr: 1.9644e-05 eta: 9 days, 22:40:51 time: 1.5094 data_time: 0.0213 memory: 25718 grad_norm: 2.9874 loss: 1.5773 detection_loss_cls: 0.0505 detection_loss_reg: 0.3909 caption_loss_cls: 2.6550 grounding_loss_reg: 3.5428 semantic_segmentation_loss_cls: 0.0132 instance_segmentation_loss_cls: 0.0461 instance_segmentation_loss_reg: 0.3814 instance_segmentation_loss_poly: 1.0724 +2024/01/02 13:24:46 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240102_123251 +2024/01/02 13:24:46 - mmengine - INFO - Iter(train) [ 58000/640000] base_lr: 1.9601e-04 lr: 1.9638e-05 eta: 9 days, 21:32:31 time: 1.5045 data_time: 0.0208 memory: 25718 grad_norm: 3.0390 loss: 1.5810 detection_loss_cls: 0.0503 detection_loss_reg: 0.3907 caption_loss_cls: 2.6514 grounding_loss_reg: 3.5427 semantic_segmentation_loss_cls: 0.0131 instance_segmentation_loss_cls: 0.0462 instance_segmentation_loss_reg: 0.3828 instance_segmentation_loss_poly: 1.0743 +2024/01/02 13:24:46 - mmengine - INFO - Saving checkpoint at 58000 iterations +2024/01/02 13:37:23 - mmengine - INFO - Iter(train) [ 58500/640000] base_lr: 1.9595e-04 lr: 1.9631e-05 eta: 9 days, 22:45:15 time: 1.5090 data_time: 0.0203 memory: 25718 grad_norm: 3.0619 loss: 1.5679 detection_loss_cls: 0.0503 detection_loss_reg: 0.3912 caption_loss_cls: 2.6437 grounding_loss_reg: 3.5348 semantic_segmentation_loss_cls: 0.0130 instance_segmentation_loss_cls: 0.0460 instance_segmentation_loss_reg: 0.3828 instance_segmentation_loss_poly: 1.0752 +2024/01/02 13:49:32 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240102_123251 +2024/01/02 13:49:32 - mmengine - INFO - Iter(train) [ 59000/640000] base_lr: 1.9588e-04 lr: 1.9625e-05 eta: 9 days, 22:01:41 time: 1.5003 data_time: 0.0196 memory: 25718 grad_norm: 3.0831 loss: 1.5715 detection_loss_cls: 0.0502 detection_loss_reg: 0.3913 caption_loss_cls: 2.6381 grounding_loss_reg: 3.5320 semantic_segmentation_loss_cls: 0.0130 instance_segmentation_loss_cls: 0.0459 instance_segmentation_loss_reg: 0.3832 instance_segmentation_loss_poly: 1.0746 +2024/01/02 14:01:29 - mmengine - INFO - Iter(train) [ 59500/640000] base_lr: 1.9581e-04 lr: 1.9619e-05 eta: 9 days, 20:52:16 time: 1.4901 data_time: 0.0191 memory: 25718 grad_norm: 3.1812 loss: 1.5724 detection_loss_cls: 0.0498 detection_loss_reg: 0.3912 caption_loss_cls: 2.6354 grounding_loss_reg: 3.5222 semantic_segmentation_loss_cls: 0.0131 instance_segmentation_loss_cls: 0.0457 instance_segmentation_loss_reg: 0.3826 instance_segmentation_loss_poly: 1.0739 +2024/01/02 14:13:56 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240102_123251 +2024/01/02 14:13:56 - mmengine - INFO - Iter(train) [ 60000/640000] base_lr: 1.9574e-04 lr: 1.9612e-05 eta: 9 days, 21:10:06 time: 1.4721 data_time: 0.0187 memory: 25718 grad_norm: 3.1790 loss: 1.5748 detection_loss_cls: 0.0496 detection_loss_reg: 0.3910 caption_loss_cls: 2.6341 grounding_loss_reg: 3.5158 semantic_segmentation_loss_cls: 0.0130 instance_segmentation_loss_cls: 0.0456 instance_segmentation_loss_reg: 0.3819 instance_segmentation_loss_poly: 1.0722 +2024/01/02 14:13:56 - mmengine - INFO - Saving checkpoint at 60000 iterations +2024/01/02 14:26:12 - mmengine - INFO - Evaluating bbox... +2024/01/02 14:27:07 - mmengine - INFO - bbox_mAP_copypaste: 0.373 0.562 0.417 0.249 0.427 0.466 +2024/01/02 14:27:07 - mmengine - INFO - Evaluating segm... +2024/01/02 14:28:19 - mmengine - INFO - segm_mAP_copypaste: 0.240 0.471 0.222 0.120 0.285 0.371 +2024/01/02 14:35:11 - mmengine - INFO - per class results: +2024/01/02 14:35:11 - mmengine - INFO - ++---------------------+-------+-------+ +| Class | IoU | Acc | ++---------------------+-------+-------+ +| wall | 76.42 | 88.29 | +| building | 82.06 | 89.63 | +| sky | 93.27 | 96.11 | +| floor | 81.58 | 87.32 | +| tree | 69.31 | 93.44 | +| ceiling | 84.64 | 92.04 | +| road | 81.5 | 91.06 | +| bed | 85.77 | 92.22 | +| windowpane | 61.58 | 79.92 | +| grass | 66.97 | 78.25 | +| cabinet | 58.35 | 75.96 | +| sidewalk | 60.69 | 72.46 | +| person | 80.07 | 89.1 | +| earth | 37.61 | 51.37 | +| door | 46.65 | 69.56 | +| table | 53.51 | 62.56 | +| mountain | 59.43 | 75.4 | +| plant | 48.53 | 61.63 | +| curtain | 67.55 | 84.49 | +| chair | 51.9 | 64.2 | +| car | 81.82 | 92.06 | +| water | 40.67 | 47.74 | +| painting | 69.48 | 82.19 | +| sofa | 62.23 | 85.49 | +| shelf | 40.85 | 57.3 | +| house | 45.34 | 70.54 | +| sea | 65.39 | 81.09 | +| mirror | 60.93 | 68.26 | +| rug | 69.32 | 77.36 | +| field | 26.5 | 41.3 | +| armchair | 33.11 | 47.73 | +| seat | 56.54 | 69.05 | +| fence | 40.47 | 51.14 | +| desk | 37.2 | 53.98 | +| rock | 43.4 | 59.13 | +| wardrobe | 48.38 | 57.59 | +| lamp | 53.94 | 75.95 | +| bathtub | 60.97 | 86.0 | +| railing | 32.29 | 49.27 | +| cushion | 52.7 | 66.57 | +| base | 26.58 | 52.07 | +| box | 18.53 | 22.83 | +| column | 48.47 | 71.07 | +| signboard | 34.68 | 47.67 | +| chest of drawers | 40.29 | 61.48 | +| counter | 16.92 | 18.48 | +| sand | 35.1 | 41.61 | +| sink | 62.13 | 73.55 | +| skyscraper | 58.28 | 81.35 | +| fireplace | 66.07 | 85.07 | +| refrigerator | 66.61 | 76.45 | +| grandstand | 48.03 | 63.49 | +| path | 21.06 | 40.83 | +| stairs | 27.3 | 32.24 | +| runway | 65.01 | 77.67 | +| case | 30.69 | 32.52 | +| pool table | 83.56 | 97.39 | +| pillow | 55.28 | 76.86 | +| screen door | 8.77 | 8.81 | +| stairway | 28.81 | 43.04 | +| river | 11.92 | 59.75 | +| bridge | 63.54 | 88.61 | +| bookcase | 36.84 | 54.03 | +| blind | 19.11 | 20.09 | +| coffee table | 51.39 | 86.3 | +| toilet | 81.96 | 85.66 | +| flower | 24.16 | 30.93 | +| book | 44.64 | 60.71 | +| hill | 11.74 | 13.65 | +| bench | 42.9 | 48.68 | +| countertop | 48.04 | 56.0 | +| stove | 66.56 | 75.78 | +| palm | 44.56 | 59.27 | +| kitchen island | 35.95 | 83.45 | +| computer | 69.92 | 84.05 | +| swivel chair | 37.13 | 54.47 | +| boat | 68.92 | 72.25 | +| bar | 37.87 | 61.31 | +| arcade machine | 60.28 | 84.17 | +| hovel | 22.53 | 25.86 | +| bus | 91.39 | 95.59 | +| towel | 47.41 | 50.88 | +| light | 46.69 | 69.88 | +| truck | 34.65 | 47.75 | +| tower | 22.15 | 43.12 | +| chandelier | 52.5 | 57.89 | +| awning | 27.62 | 33.88 | +| streetlight | 27.78 | 39.61 | +| booth | 38.52 | 42.93 | +| television receiver | 58.42 | 80.29 | +| airplane | 56.51 | 62.2 | +| dirt track | 0.14 | 0.22 | +| apparel | 17.19 | 24.01 | +| pole | 23.88 | 36.65 | +| land | 1.27 | 1.54 | +| bannister | 12.7 | 18.52 | +| escalator | 9.96 | 10.69 | +| ottoman | 44.24 | 65.77 | +| bottle | 19.82 | 25.32 | +| buffet | 40.01 | 63.86 | +| poster | 21.72 | 29.97 | +| stage | 6.81 | 11.04 | +| van | 24.37 | 28.53 | +| ship | 11.23 | 12.89 | +| fountain | 15.73 | 17.22 | +| conveyer belt | 58.05 | 89.02 | +| canopy | 26.01 | 50.04 | +| washer | 62.09 | 63.35 | +| plaything | 27.49 | 31.88 | +| swimming pool | 34.84 | 43.84 | +| stool | 39.87 | 63.7 | +| barrel | 7.63 | 64.88 | +| basket | 24.77 | 33.04 | +| waterfall | 61.01 | 69.84 | +| tent | 91.37 | 95.07 | +| bag | 7.33 | 7.86 | +| minibike | 59.74 | 88.08 | +| cradle | 63.98 | 81.7 | +| oven | 12.04 | 14.57 | +| ball | 45.6 | 68.76 | +| food | 37.55 | 39.63 | +| step | 10.52 | 13.72 | +| tank | 28.79 | 40.06 | +| trade name | 27.74 | 34.22 | +| microwave | 73.43 | 89.86 | +| pot | 43.93 | 54.58 | +| animal | 57.63 | 60.62 | +| bicycle | 56.82 | 72.0 | +| lake | 11.45 | 13.07 | +| dishwasher | 50.79 | 69.8 | +| screen | 67.76 | 85.55 | +| blanket | 10.49 | 15.92 | +| sculpture | 38.92 | 59.4 | +| hood | 48.82 | 59.87 | +| sconce | 27.58 | 39.51 | +| vase | 36.38 | 58.33 | +| traffic light | 28.34 | 57.57 | +| tray | 6.24 | 22.35 | +| ashcan | 30.18 | 63.68 | +| fan | 48.9 | 58.14 | +| pier | 38.14 | 60.89 | +| crt screen | 0.13 | 0.17 | +| plate | 44.0 | 56.88 | +| monitor | 35.66 | 53.29 | +| bulletin board | 11.61 | 11.95 | +| shower | 0.55 | 12.82 | +| radiator | 41.35 | 45.19 | +| glass | 12.94 | 14.12 | +| clock | 19.46 | 29.28 | +| flag | 28.56 | 30.98 | ++---------------------+-------+-------+ +2024/01/02 14:35:29 - mmengine - INFO - Iter(val) [209/209] coco/bbox_mAP: 0.3730 coco/bbox_mAP_50: 0.5620 coco/bbox_mAP_75: 0.4170 coco/bbox_mAP_s: 0.2490 coco/bbox_mAP_m: 0.4270 coco/bbox_mAP_l: 0.4660 coco/segm_mAP: 0.2400 coco/segm_mAP_50: 0.4710 coco/segm_mAP_75: 0.2220 coco/segm_mAP_s: 0.1200 coco/segm_mAP_m: 0.2850 coco/segm_mAP_l: 0.3710 Bleu_1: 0.6945 Bleu_2: 0.5212 Bleu_3: 0.3807 Bleu_4: 0.2775 METEOR: 0.2387 ROUGE_L: 0.5110 CIDEr: 0.8553 SPICE: 0.1695 aAcc: 81.2400 mIoU: 42.9400 mAcc: 55.8900 visual-grounding/miou: 0.6843 visual-grounding/acc: 0.7575 data_time: 0.0115 time: 1.3583 +2024/01/02 14:46:49 - mmengine - INFO - Iter(train) [ 60500/640000] base_lr: 1.9567e-04 lr: 1.9606e-05 eta: 9 days, 19:01:37 time: 1.4593 data_time: 0.0193 memory: 25721 grad_norm: 3.1978 loss: 1.5922 detection_loss_cls: 0.0494 detection_loss_reg: 0.3900 caption_loss_cls: 2.6289 grounding_loss_reg: 3.5096 semantic_segmentation_loss_cls: 0.0130 instance_segmentation_loss_cls: 0.0454 instance_segmentation_loss_reg: 0.3812 instance_segmentation_loss_poly: 1.0720 +2024/01/02 14:59:28 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240102_123251 +2024/01/02 14:59:28 - mmengine - INFO - Iter(train) [ 61000/640000] base_lr: 1.9560e-04 lr: 1.9600e-05 eta: 9 days, 19:45:39 time: 1.4620 data_time: 0.0195 memory: 25721 grad_norm: 3.1470 loss: 1.5716 detection_loss_cls: 0.0492 detection_loss_reg: 0.3896 caption_loss_cls: 2.6284 grounding_loss_reg: 3.5050 semantic_segmentation_loss_cls: 0.0129 instance_segmentation_loss_cls: 0.0452 instance_segmentation_loss_reg: 0.3803 instance_segmentation_loss_poly: 1.0698 +2024/01/02 15:11:37 - mmengine - INFO - Iter(train) [ 61500/640000] base_lr: 1.9552e-04 lr: 1.9593e-05 eta: 9 days, 19:26:44 time: 1.4615 data_time: 0.0198 memory: 25721 grad_norm: 3.1788 loss: 1.5790 detection_loss_cls: 0.0489 detection_loss_reg: 0.3873 caption_loss_cls: 2.6257 grounding_loss_reg: 3.4979 semantic_segmentation_loss_cls: 0.0129 instance_segmentation_loss_cls: 0.0448 instance_segmentation_loss_reg: 0.3787 instance_segmentation_loss_poly: 1.0672 +2024/01/02 15:23:42 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240102_123251 +2024/01/02 15:23:42 - mmengine - INFO - Iter(train) [ 62000/640000] base_lr: 1.9545e-04 lr: 1.9586e-05 eta: 9 days, 19:02:19 time: 1.4612 data_time: 0.0200 memory: 25721 grad_norm: 4.5980 loss: 1.5732 detection_loss_cls: 0.0488 detection_loss_reg: 0.3875 caption_loss_cls: 2.6197 grounding_loss_reg: 3.4938 semantic_segmentation_loss_cls: 0.0129 instance_segmentation_loss_cls: 0.0446 instance_segmentation_loss_reg: 0.3777 instance_segmentation_loss_poly: 1.0651 +2024/01/02 15:23:42 - mmengine - INFO - Saving checkpoint at 62000 iterations +2024/01/02 15:35:36 - mmengine - INFO - Iter(train) [ 62500/640000] base_lr: 1.9538e-04 lr: 1.9580e-05 eta: 9 days, 18:23:39 time: 1.4506 data_time: 0.0207 memory: 25721 grad_norm: 4.6614 loss: 1.5773 detection_loss_cls: 0.0488 detection_loss_reg: 0.3875 caption_loss_cls: 2.6171 grounding_loss_reg: 3.4848 semantic_segmentation_loss_cls: 0.0129 instance_segmentation_loss_cls: 0.0446 instance_segmentation_loss_reg: 0.3787 instance_segmentation_loss_poly: 1.0675 +2024/01/02 15:47:32 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240102_123251 +2024/01/02 15:47:32 - mmengine - INFO - Iter(train) [ 63000/640000] base_lr: 1.9530e-04 lr: 1.9573e-05 eta: 9 days, 17:51:43 time: 1.4473 data_time: 0.0208 memory: 25721 grad_norm: 4.6993 loss: 1.5692 detection_loss_cls: 0.0487 detection_loss_reg: 0.3868 caption_loss_cls: 2.6103 grounding_loss_reg: 3.4776 semantic_segmentation_loss_cls: 0.0128 instance_segmentation_loss_cls: 0.0445 instance_segmentation_loss_reg: 0.3773 instance_segmentation_loss_poly: 1.0642 +2024/01/02 15:59:49 - mmengine - INFO - Iter(train) [ 63500/640000] base_lr: 1.9523e-04 lr: 1.9566e-05 eta: 9 days, 17:49:02 time: 1.4523 data_time: 0.0212 memory: 25721 grad_norm: 4.5913 loss: 1.5757 detection_loss_cls: 0.0486 detection_loss_reg: 0.3870 caption_loss_cls: 2.6079 grounding_loss_reg: 3.4730 semantic_segmentation_loss_cls: 0.0128 instance_segmentation_loss_cls: 0.0443 instance_segmentation_loss_reg: 0.3771 instance_segmentation_loss_poly: 1.0639 +2024/01/02 16:11:55 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240102_123251 +2024/01/02 16:11:55 - mmengine - INFO - Iter(train) [ 64000/640000] base_lr: 1.9515e-04 lr: 1.9560e-05 eta: 9 days, 17:31:54 time: 1.4471 data_time: 0.0214 memory: 25721 grad_norm: 4.6896 loss: 1.5934 detection_loss_cls: 0.0485 detection_loss_reg: 0.3869 caption_loss_cls: 2.6080 grounding_loss_reg: 3.4618 semantic_segmentation_loss_cls: 0.0128 instance_segmentation_loss_cls: 0.0444 instance_segmentation_loss_reg: 0.3777 instance_segmentation_loss_poly: 1.0645 +2024/01/02 16:11:55 - mmengine - INFO - Saving checkpoint at 64000 iterations +2024/01/02 16:24:11 - mmengine - INFO - Iter(train) [ 64500/640000] base_lr: 1.9508e-04 lr: 1.9553e-05 eta: 9 days, 17:25:46 time: 1.4604 data_time: 0.0257 memory: 25721 grad_norm: 4.6491 loss: 1.5776 detection_loss_cls: 0.0484 detection_loss_reg: 0.3878 caption_loss_cls: 2.6046 grounding_loss_reg: 3.4571 semantic_segmentation_loss_cls: 0.0128 instance_segmentation_loss_cls: 0.0443 instance_segmentation_loss_reg: 0.3774 instance_segmentation_loss_poly: 1.0643 +2024/01/02 16:36:10 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240102_123251 +2024/01/02 16:36:10 - mmengine - INFO - Iter(train) [ 65000/640000] base_lr: 1.9500e-04 lr: 1.9546e-05 eta: 9 days, 17:02:35 time: 1.4505 data_time: 0.0255 memory: 25721 grad_norm: 4.7232 loss: 1.5847 detection_loss_cls: 0.0484 detection_loss_reg: 0.3876 caption_loss_cls: 2.5992 grounding_loss_reg: 3.4498 semantic_segmentation_loss_cls: 0.0127 instance_segmentation_loss_cls: 0.0442 instance_segmentation_loss_reg: 0.3776 instance_segmentation_loss_poly: 1.0641 +2024/01/02 16:49:12 - mmengine - INFO - Iter(train) [ 65500/640000] base_lr: 1.9493e-04 lr: 1.9539e-05 eta: 9 days, 17:42:41 time: 1.4636 data_time: 0.0257 memory: 25721 grad_norm: 4.6292 loss: 1.5704 detection_loss_cls: 0.0483 detection_loss_reg: 0.3872 caption_loss_cls: 2.5982 grounding_loss_reg: 3.4426 semantic_segmentation_loss_cls: 0.0127 instance_segmentation_loss_cls: 0.0440 instance_segmentation_loss_reg: 0.3770 instance_segmentation_loss_poly: 1.0625 +2024/01/02 17:01:15 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240102_123251 +2024/01/02 17:01:15 - mmengine - INFO - Iter(train) [ 66000/640000] base_lr: 1.9485e-04 lr: 1.9532e-05 eta: 9 days, 17:22:02 time: 1.4632 data_time: 0.0257 memory: 25721 grad_norm: 3.1954 loss: 1.5604 detection_loss_cls: 0.0481 detection_loss_reg: 0.3855 caption_loss_cls: 2.5946 grounding_loss_reg: 3.4340 semantic_segmentation_loss_cls: 0.0127 instance_segmentation_loss_cls: 0.0439 instance_segmentation_loss_reg: 0.3764 instance_segmentation_loss_poly: 1.0609 +2024/01/02 17:01:15 - mmengine - INFO - Saving checkpoint at 66000 iterations +2024/01/02 17:14:17 - mmengine - INFO - Iter(train) [ 66500/640000] base_lr: 1.9477e-04 lr: 1.9525e-05 eta: 9 days, 17:55:17 time: 1.4801 data_time: 0.0254 memory: 25721 grad_norm: 3.0741 loss: 1.5365 detection_loss_cls: 0.0480 detection_loss_reg: 0.3868 caption_loss_cls: 2.5875 grounding_loss_reg: 3.4313 semantic_segmentation_loss_cls: 0.0127 instance_segmentation_loss_cls: 0.0437 instance_segmentation_loss_reg: 0.3755 instance_segmentation_loss_poly: 1.0590 +2024/01/02 17:26:57 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240102_123251 +2024/01/02 17:26:57 - mmengine - INFO - Iter(train) [ 67000/640000] base_lr: 1.9469e-04 lr: 1.9518e-05 eta: 9 days, 18:04:59 time: 1.4909 data_time: 0.0256 memory: 25721 grad_norm: 2.9718 loss: 1.5281 detection_loss_cls: 0.0479 detection_loss_reg: 0.3863 caption_loss_cls: 2.5913 grounding_loss_reg: 3.4249 semantic_segmentation_loss_cls: 0.0127 instance_segmentation_loss_cls: 0.0436 instance_segmentation_loss_reg: 0.3763 instance_segmentation_loss_poly: 1.0599 +2024/01/02 17:39:03 - mmengine - INFO - Iter(train) [ 67500/640000] base_lr: 1.9462e-04 lr: 1.9510e-05 eta: 9 days, 17:44:47 time: 1.4881 data_time: 0.0254 memory: 25721 grad_norm: 2.9908 loss: 1.5264 detection_loss_cls: 0.0482 detection_loss_reg: 0.3873 caption_loss_cls: 2.5898 grounding_loss_reg: 3.4213 semantic_segmentation_loss_cls: 0.0127 instance_segmentation_loss_cls: 0.0436 instance_segmentation_loss_reg: 0.3762 instance_segmentation_loss_poly: 1.0602 +2024/01/02 17:50:14 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240102_123251 +2024/01/02 17:50:14 - mmengine - INFO - Iter(train) [ 68000/640000] base_lr: 1.9454e-04 lr: 1.9503e-05 eta: 9 days, 16:42:13 time: 1.4746 data_time: 0.0251 memory: 25721 grad_norm: 2.9585 loss: 1.5169 detection_loss_cls: 0.0481 detection_loss_reg: 0.3873 caption_loss_cls: 2.5834 grounding_loss_reg: 3.4165 semantic_segmentation_loss_cls: 0.0126 instance_segmentation_loss_cls: 0.0436 instance_segmentation_loss_reg: 0.3758 instance_segmentation_loss_poly: 1.0595 +2024/01/02 17:50:14 - mmengine - INFO - Saving checkpoint at 68000 iterations +2024/01/02 18:02:50 - mmengine - INFO - Iter(train) [ 68500/640000] base_lr: 1.9446e-04 lr: 1.9496e-05 eta: 9 days, 16:48:09 time: 1.4798 data_time: 0.0253 memory: 25721 grad_norm: 3.0095 loss: 1.5233 detection_loss_cls: 0.0479 detection_loss_reg: 0.3864 caption_loss_cls: 2.5828 grounding_loss_reg: 3.4117 semantic_segmentation_loss_cls: 0.0126 instance_segmentation_loss_cls: 0.0435 instance_segmentation_loss_reg: 0.3756 instance_segmentation_loss_poly: 1.0585 +2024/01/02 18:14:21 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240102_123251 +2024/01/02 18:14:21 - mmengine - INFO - Iter(train) [ 69000/640000] base_lr: 1.9438e-04 lr: 1.9489e-05 eta: 9 days, 16:04:36 time: 1.4725 data_time: 0.0253 memory: 25721 grad_norm: 2.9637 loss: 1.5264 detection_loss_cls: 0.0477 detection_loss_reg: 0.3836 caption_loss_cls: 2.5799 grounding_loss_reg: 3.4074 semantic_segmentation_loss_cls: 0.0126 instance_segmentation_loss_cls: 0.0434 instance_segmentation_loss_reg: 0.3750 instance_segmentation_loss_poly: 1.0572 +2024/01/02 18:26:23 - mmengine - INFO - Iter(train) [ 69500/640000] base_lr: 1.9429e-04 lr: 1.9481e-05 eta: 9 days, 15:45:23 time: 1.4575 data_time: 0.0252 memory: 25721 grad_norm: 2.9825 loss: 1.5451 detection_loss_cls: 0.0476 detection_loss_reg: 0.3833 caption_loss_cls: 2.5823 grounding_loss_reg: 3.4027 semantic_segmentation_loss_cls: 0.0125 instance_segmentation_loss_cls: 0.0432 instance_segmentation_loss_reg: 0.3740 instance_segmentation_loss_poly: 1.0549 +2024/01/02 18:38:48 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240102_123251 +2024/01/02 18:38:48 - mmengine - INFO - Iter(train) [ 70000/640000] base_lr: 1.9421e-04 lr: 1.9474e-05 eta: 9 days, 15:43:04 time: 1.4631 data_time: 0.0254 memory: 25721 grad_norm: 2.9767 loss: 1.5452 detection_loss_cls: 0.0476 detection_loss_reg: 0.3837 caption_loss_cls: 2.5770 grounding_loss_reg: 3.3965 semantic_segmentation_loss_cls: 0.0125 instance_segmentation_loss_cls: 0.0430 instance_segmentation_loss_reg: 0.3724 instance_segmentation_loss_poly: 1.0512 +2024/01/02 18:38:48 - mmengine - INFO - Saving checkpoint at 70000 iterations +2024/01/02 18:50:50 - mmengine - INFO - Iter(train) [ 70500/640000] base_lr: 1.9413e-04 lr: 1.9466e-05 eta: 9 days, 15:24:02 time: 1.4480 data_time: 0.0254 memory: 25721 grad_norm: 3.0270 loss: 1.5699 detection_loss_cls: 0.0475 detection_loss_reg: 0.3836 caption_loss_cls: 2.5718 grounding_loss_reg: 3.3903 semantic_segmentation_loss_cls: 0.0125 instance_segmentation_loss_cls: 0.0430 instance_segmentation_loss_reg: 0.3727 instance_segmentation_loss_poly: 1.0518 +2024/01/02 19:02:43 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240102_123251 +2024/01/02 19:02:43 - mmengine - INFO - Iter(train) [ 71000/640000] base_lr: 1.9405e-04 lr: 1.9459e-05 eta: 9 days, 14:59:59 time: 1.4363 data_time: 0.0253 memory: 25721 grad_norm: 3.0747 loss: 1.5775 detection_loss_cls: 0.0472 detection_loss_reg: 0.3826 caption_loss_cls: 2.5715 grounding_loss_reg: 3.3856 semantic_segmentation_loss_cls: 0.0125 instance_segmentation_loss_cls: 0.0432 instance_segmentation_loss_reg: 0.3740 instance_segmentation_loss_poly: 1.0530 +2024/01/02 19:14:51 - mmengine - INFO - Iter(train) [ 71500/640000] base_lr: 1.9396e-04 lr: 1.9451e-05 eta: 9 days, 14:46:29 time: 1.4370 data_time: 0.0253 memory: 25721 grad_norm: 3.0995 loss: 1.5732 detection_loss_cls: 0.0470 detection_loss_reg: 0.3819 caption_loss_cls: 2.5689 grounding_loss_reg: 3.3789 semantic_segmentation_loss_cls: 0.0125 instance_segmentation_loss_cls: 0.0433 instance_segmentation_loss_reg: 0.3739 instance_segmentation_loss_poly: 1.0516 +2024/01/02 19:27:02 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240102_123251 +2024/01/02 19:27:02 - mmengine - INFO - Iter(train) [ 72000/640000] base_lr: 1.9388e-04 lr: 1.9444e-05 eta: 9 days, 14:34:23 time: 1.4518 data_time: 0.0255 memory: 25721 grad_norm: 3.0453 loss: 1.5682 detection_loss_cls: 0.0469 detection_loss_reg: 0.3812 caption_loss_cls: 2.5612 grounding_loss_reg: 3.3713 semantic_segmentation_loss_cls: 0.0124 instance_segmentation_loss_cls: 0.0433 instance_segmentation_loss_reg: 0.3741 instance_segmentation_loss_poly: 1.0519 +2024/01/02 19:27:02 - mmengine - INFO - Saving checkpoint at 72000 iterations +2024/01/02 19:39:16 - mmengine - INFO - Iter(train) [ 72500/640000] base_lr: 1.9380e-04 lr: 1.9436e-05 eta: 9 days, 14:24:16 time: 1.4464 data_time: 0.0249 memory: 25721 grad_norm: 2.9829 loss: 1.5570 detection_loss_cls: 0.0469 detection_loss_reg: 0.3821 caption_loss_cls: 2.5588 grounding_loss_reg: 3.3681 semantic_segmentation_loss_cls: 0.0124 instance_segmentation_loss_cls: 0.0433 instance_segmentation_loss_reg: 0.3741 instance_segmentation_loss_poly: 1.0516 +2024/01/02 19:52:17 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240102_123251 +2024/01/02 19:52:17 - mmengine - INFO - Iter(train) [ 73000/640000] base_lr: 1.9371e-04 lr: 1.9428e-05 eta: 9 days, 14:39:38 time: 1.4688 data_time: 0.0252 memory: 25721 grad_norm: 2.9351 loss: 1.5478 detection_loss_cls: 0.0467 detection_loss_reg: 0.3810 caption_loss_cls: 2.5587 grounding_loss_reg: 3.3616 semantic_segmentation_loss_cls: 0.0124 instance_segmentation_loss_cls: 0.0433 instance_segmentation_loss_reg: 0.3750 instance_segmentation_loss_poly: 1.0532 +2024/01/02 20:04:33 - mmengine - INFO - Iter(train) [ 73500/640000] base_lr: 1.9363e-04 lr: 1.9421e-05 eta: 9 days, 14:29:38 time: 1.4725 data_time: 0.0250 memory: 25721 grad_norm: 2.9181 loss: 1.5415 detection_loss_cls: 0.0468 detection_loss_reg: 0.3807 caption_loss_cls: 2.5518 grounding_loss_reg: 3.3576 semantic_segmentation_loss_cls: 0.0124 instance_segmentation_loss_cls: 0.0432 instance_segmentation_loss_reg: 0.3744 instance_segmentation_loss_poly: 1.0514 +2024/01/02 20:16:18 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240102_123251 +2024/01/02 20:16:18 - mmengine - INFO - Iter(train) [ 74000/640000] base_lr: 1.9354e-04 lr: 1.9413e-05 eta: 9 days, 14:02:52 time: 1.4622 data_time: 0.0248 memory: 25721 grad_norm: 2.9199 loss: 1.5514 detection_loss_cls: 0.0468 detection_loss_reg: 0.3811 caption_loss_cls: 2.5467 grounding_loss_reg: 3.3525 semantic_segmentation_loss_cls: 0.0124 instance_segmentation_loss_cls: 0.0432 instance_segmentation_loss_reg: 0.3738 instance_segmentation_loss_poly: 1.0504 +2024/01/02 20:16:18 - mmengine - INFO - Saving checkpoint at 74000 iterations +2024/01/02 20:28:13 - mmengine - INFO - Iter(train) [ 74500/640000] base_lr: 1.9345e-04 lr: 1.9405e-05 eta: 9 days, 13:42:11 time: 1.4606 data_time: 0.0241 memory: 25721 grad_norm: 2.9659 loss: 1.5516 detection_loss_cls: 0.0468 detection_loss_reg: 0.3808 caption_loss_cls: 2.5464 grounding_loss_reg: 3.3485 semantic_segmentation_loss_cls: 0.0124 instance_segmentation_loss_cls: 0.0431 instance_segmentation_loss_reg: 0.3732 instance_segmentation_loss_poly: 1.0487 +2024/01/02 20:40:59 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240102_123251 +2024/01/02 20:40:59 - mmengine - INFO - Iter(train) [ 75000/640000] base_lr: 1.9337e-04 lr: 1.9397e-05 eta: 9 days, 13:47:10 time: 1.4739 data_time: 0.0241 memory: 25721 grad_norm: 2.9364 loss: 1.5455 detection_loss_cls: 0.0466 detection_loss_reg: 0.3788 caption_loss_cls: 2.5459 grounding_loss_reg: 3.3445 semantic_segmentation_loss_cls: 0.0124 instance_segmentation_loss_cls: 0.0430 instance_segmentation_loss_reg: 0.3722 instance_segmentation_loss_poly: 1.0463 +2024/01/02 20:54:10 - mmengine - INFO - Iter(train) [ 75500/640000] base_lr: 1.9328e-04 lr: 1.9389e-05 eta: 9 days, 14:03:24 time: 1.4895 data_time: 0.0240 memory: 25721 grad_norm: 2.8551 loss: 1.5243 detection_loss_cls: 0.0462 detection_loss_reg: 0.3766 caption_loss_cls: 2.5413 grounding_loss_reg: 3.3385 semantic_segmentation_loss_cls: 0.0124 instance_segmentation_loss_cls: 0.0427 instance_segmentation_loss_reg: 0.3699 instance_segmentation_loss_poly: 1.0410 +2024/01/02 21:06:22 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240102_123251 +2024/01/02 21:06:22 - mmengine - INFO - Iter(train) [ 76000/640000] base_lr: 1.9319e-04 lr: 1.9381e-05 eta: 9 days, 13:50:28 time: 1.4898 data_time: 0.0241 memory: 25721 grad_norm: 2.8526 loss: 1.5379 detection_loss_cls: 0.0464 detection_loss_reg: 0.3793 caption_loss_cls: 2.5428 grounding_loss_reg: 3.3377 semantic_segmentation_loss_cls: 0.0124 instance_segmentation_loss_cls: 0.0427 instance_segmentation_loss_reg: 0.3702 instance_segmentation_loss_poly: 1.0417 +2024/01/02 21:06:22 - mmengine - INFO - Saving checkpoint at 76000 iterations +2024/01/02 21:19:15 - mmengine - INFO - Iter(train) [ 76500/640000] base_lr: 1.9310e-04 lr: 1.9373e-05 eta: 9 days, 13:56:14 time: 1.4995 data_time: 0.0239 memory: 25721 grad_norm: 2.8279 loss: 1.5282 detection_loss_cls: 0.0463 detection_loss_reg: 0.3785 caption_loss_cls: 2.5393 grounding_loss_reg: 3.3352 semantic_segmentation_loss_cls: 0.0124 instance_segmentation_loss_cls: 0.0426 instance_segmentation_loss_reg: 0.3700 instance_segmentation_loss_poly: 1.0406 +2024/01/02 21:31:14 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240102_123251 +2024/01/02 21:31:14 - mmengine - INFO - Iter(train) [ 77000/640000] base_lr: 1.9301e-04 lr: 1.9365e-05 eta: 9 days, 13:37:16 time: 1.4842 data_time: 0.0236 memory: 25721 grad_norm: 2.8631 loss: 1.5349 detection_loss_cls: 0.0464 detection_loss_reg: 0.3791 caption_loss_cls: 2.5345 grounding_loss_reg: 3.3297 semantic_segmentation_loss_cls: 0.0124 instance_segmentation_loss_cls: 0.0426 instance_segmentation_loss_reg: 0.3704 instance_segmentation_loss_poly: 1.0417 +2024/01/02 21:43:42 - mmengine - INFO - Iter(train) [ 77500/640000] base_lr: 1.9292e-04 lr: 1.9357e-05 eta: 9 days, 13:30:43 time: 1.4870 data_time: 0.0236 memory: 25721 grad_norm: 2.8624 loss: 1.5373 detection_loss_cls: 0.0463 detection_loss_reg: 0.3776 caption_loss_cls: 2.5345 grounding_loss_reg: 3.3268 semantic_segmentation_loss_cls: 0.0123 instance_segmentation_loss_cls: 0.0424 instance_segmentation_loss_reg: 0.3686 instance_segmentation_loss_poly: 1.0391 +2024/01/02 21:56:31 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240102_123251 +2024/01/02 21:56:31 - mmengine - INFO - Iter(train) [ 78000/640000] base_lr: 1.9283e-04 lr: 1.9348e-05 eta: 9 days, 13:33:18 time: 1.5031 data_time: 0.0237 memory: 25721 grad_norm: 2.8387 loss: 1.5127 detection_loss_cls: 0.0464 detection_loss_reg: 0.3772 caption_loss_cls: 2.5355 grounding_loss_reg: 3.3229 semantic_segmentation_loss_cls: 0.0123 instance_segmentation_loss_cls: 0.0422 instance_segmentation_loss_reg: 0.3679 instance_segmentation_loss_poly: 1.0375 +2024/01/02 21:56:31 - mmengine - INFO - Saving checkpoint at 78000 iterations +2024/01/02 22:09:05 - mmengine - INFO - Iter(train) [ 78500/640000] base_lr: 1.9274e-04 lr: 1.9340e-05 eta: 9 days, 13:28:41 time: 1.5128 data_time: 0.0238 memory: 25721 grad_norm: 2.7951 loss: 1.5025 detection_loss_cls: 0.0462 detection_loss_reg: 0.3756 caption_loss_cls: 2.5356 grounding_loss_reg: 3.3162 semantic_segmentation_loss_cls: 0.0123 instance_segmentation_loss_cls: 0.0421 instance_segmentation_loss_reg: 0.3678 instance_segmentation_loss_poly: 1.0373 +2024/01/02 22:20:53 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240102_123251 +2024/01/02 22:20:53 - mmengine - INFO - Iter(train) [ 79000/640000] base_lr: 1.9265e-04 lr: 1.9332e-05 eta: 9 days, 13:05:13 time: 1.4984 data_time: 0.0236 memory: 25721 grad_norm: 2.8027 loss: 1.5014 detection_loss_cls: 0.0462 detection_loss_reg: 0.3742 caption_loss_cls: 2.5390 grounding_loss_reg: 3.3104 semantic_segmentation_loss_cls: 0.0122 instance_segmentation_loss_cls: 0.0420 instance_segmentation_loss_reg: 0.3664 instance_segmentation_loss_poly: 1.0335 +2024/01/02 22:32:46 - mmengine - INFO - Iter(train) [ 79500/640000] base_lr: 1.9256e-04 lr: 1.9323e-05 eta: 9 days, 12:44:17 time: 1.4789 data_time: 0.0233 memory: 25721 grad_norm: 2.8277 loss: 1.5176 detection_loss_cls: 0.0461 detection_loss_reg: 0.3732 caption_loss_cls: 2.5435 grounding_loss_reg: 3.3063 semantic_segmentation_loss_cls: 0.0122 instance_segmentation_loss_cls: 0.0419 instance_segmentation_loss_reg: 0.3650 instance_segmentation_loss_poly: 1.0305 +2024/01/02 22:44:16 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240102_123251 +2024/01/02 22:44:16 - mmengine - INFO - Iter(train) [ 80000/640000] base_lr: 1.9246e-04 lr: 1.9315e-05 eta: 9 days, 12:14:41 time: 1.4684 data_time: 0.0231 memory: 25721 grad_norm: 2.8240 loss: 1.5133 detection_loss_cls: 0.0461 detection_loss_reg: 0.3739 caption_loss_cls: 2.5427 grounding_loss_reg: 3.3051 semantic_segmentation_loss_cls: 0.0122 instance_segmentation_loss_cls: 0.0418 instance_segmentation_loss_reg: 0.3645 instance_segmentation_loss_poly: 1.0280 +2024/01/02 22:44:16 - mmengine - INFO - Saving checkpoint at 80000 iterations +2024/01/02 22:56:38 - mmengine - INFO - Evaluating bbox... +2024/01/02 22:57:33 - mmengine - INFO - bbox_mAP_copypaste: 0.407 0.590 0.450 0.268 0.463 0.517 +2024/01/02 22:57:33 - mmengine - INFO - Evaluating segm... +2024/01/02 22:58:44 - mmengine - INFO - segm_mAP_copypaste: 0.262 0.511 0.245 0.138 0.308 0.401 +2024/01/02 23:05:34 - mmengine - INFO - per class results: +2024/01/02 23:05:34 - mmengine - INFO - ++---------------------+-------+-------+ +| Class | IoU | Acc | ++---------------------+-------+-------+ +| wall | 76.34 | 91.72 | +| building | 82.98 | 92.18 | +| sky | 93.35 | 97.19 | +| floor | 77.21 | 93.26 | +| tree | 72.98 | 84.43 | +| ceiling | 82.52 | 88.33 | +| road | 80.25 | 87.76 | +| bed | 86.37 | 94.26 | +| windowpane | 60.35 | 71.67 | +| grass | 64.23 | 79.54 | +| cabinet | 51.79 | 57.72 | +| sidewalk | 63.21 | 83.97 | +| person | 79.37 | 86.96 | +| earth | 33.56 | 42.5 | +| door | 39.68 | 46.47 | +| table | 51.29 | 58.36 | +| mountain | 60.17 | 71.09 | +| plant | 51.7 | 62.4 | +| curtain | 68.67 | 82.38 | +| chair | 51.05 | 58.67 | +| car | 82.12 | 90.12 | +| water | 31.89 | 35.91 | +| painting | 68.25 | 83.38 | +| sofa | 55.6 | 93.51 | +| shelf | 40.72 | 71.6 | +| house | 41.35 | 50.33 | +| sea | 45.39 | 70.42 | +| mirror | 62.31 | 67.6 | +| rug | 54.32 | 57.3 | +| field | 33.26 | 58.68 | +| armchair | 24.78 | 31.74 | +| seat | 62.57 | 74.73 | +| fence | 40.48 | 71.94 | +| desk | 39.47 | 56.66 | +| rock | 42.2 | 66.47 | +| wardrobe | 49.29 | 54.29 | +| lamp | 57.23 | 66.48 | +| bathtub | 73.56 | 84.41 | +| railing | 32.13 | 52.9 | +| cushion | 44.78 | 49.37 | +| base | 21.55 | 51.12 | +| box | 22.06 | 27.27 | +| column | 33.86 | 35.96 | +| signboard | 36.46 | 46.48 | +| chest of drawers | 20.85 | 85.95 | +| counter | 33.34 | 59.6 | +| sand | 33.11 | 53.16 | +| sink | 64.88 | 72.24 | +| skyscraper | 62.22 | 88.93 | +| fireplace | 70.65 | 89.2 | +| refrigerator | 69.36 | 88.14 | +| grandstand | 46.64 | 72.9 | +| path | 17.57 | 25.84 | +| stairs | 24.18 | 30.02 | +| runway | 66.81 | 82.34 | +| case | 4.06 | 4.13 | +| pool table | 75.06 | 97.75 | +| pillow | 46.07 | 52.29 | +| screen door | 43.57 | 48.66 | +| stairway | 27.24 | 44.76 | +| river | 16.48 | 37.38 | +| bridge | 73.21 | 88.86 | +| bookcase | 36.5 | 61.36 | +| blind | 27.75 | 30.31 | +| coffee table | 45.15 | 82.13 | +| toilet | 82.93 | 85.44 | +| flower | 28.3 | 35.28 | +| book | 40.52 | 50.96 | +| hill | 4.4 | 5.46 | +| bench | 47.54 | 70.65 | +| countertop | 54.46 | 80.05 | +| stove | 68.69 | 73.45 | +| palm | 51.15 | 73.1 | +| kitchen island | 37.44 | 85.86 | +| computer | 56.7 | 60.8 | +| swivel chair | 34.6 | 41.11 | +| boat | 73.04 | 88.38 | +| bar | 42.95 | 65.28 | +| arcade machine | 41.94 | 43.42 | +| hovel | 30.78 | 47.08 | +| bus | 90.68 | 95.99 | +| towel | 60.57 | 72.05 | +| light | 33.14 | 35.44 | +| truck | 32.41 | 53.89 | +| tower | 25.66 | 37.67 | +| chandelier | 59.25 | 75.67 | +| awning | 32.33 | 47.65 | +| streetlight | 27.95 | 39.84 | +| booth | 30.33 | 52.23 | +| television receiver | 56.78 | 82.8 | +| airplane | 57.53 | 68.33 | +| dirt track | 0.0 | 0.0 | +| apparel | 26.87 | 36.89 | +| pole | 26.09 | 38.12 | +| land | 5.74 | 9.75 | +| bannister | 0.0 | 0.0 | +| escalator | 11.88 | 11.93 | +| ottoman | 49.85 | 60.09 | +| bottle | 17.18 | 20.3 | +| buffet | 41.66 | 63.02 | +| poster | 5.15 | 5.89 | +| stage | 5.56 | 7.68 | +| van | 44.71 | 66.12 | +| ship | 6.22 | 6.29 | +| fountain | 7.71 | 7.74 | +| conveyer belt | 62.77 | 73.2 | +| canopy | 32.06 | 53.29 | +| washer | 61.63 | 67.89 | +| plaything | 25.94 | 45.01 | +| swimming pool | 39.29 | 80.37 | +| stool | 40.8 | 46.34 | +| barrel | 9.81 | 64.72 | +| basket | 25.15 | 31.02 | +| waterfall | 57.04 | 73.14 | +| tent | 70.27 | 71.63 | +| bag | 7.84 | 8.58 | +| minibike | 67.37 | 82.05 | +| cradle | 54.75 | 95.45 | +| oven | 43.35 | 60.49 | +| ball | 30.73 | 35.8 | +| food | 23.22 | 24.58 | +| step | 13.15 | 18.66 | +| tank | 43.81 | 55.32 | +| trade name | 23.24 | 28.55 | +| microwave | 73.02 | 80.48 | +| pot | 38.86 | 44.1 | +| animal | 62.31 | 68.48 | +| bicycle | 55.49 | 73.3 | +| lake | 23.11 | 93.46 | +| dishwasher | 57.81 | 71.24 | +| screen | 62.78 | 66.1 | +| blanket | 9.18 | 10.56 | +| sculpture | 45.47 | 49.58 | +| hood | 47.42 | 50.95 | +| sconce | 30.81 | 38.37 | +| vase | 39.14 | 54.98 | +| traffic light | 27.91 | 37.77 | +| tray | 5.21 | 7.15 | +| ashcan | 34.42 | 43.35 | +| fan | 50.11 | 58.42 | +| pier | 44.17 | 66.21 | +| crt screen | 12.02 | 33.19 | +| plate | 44.71 | 52.25 | +| monitor | 29.5 | 39.62 | +| bulletin board | 17.4 | 19.2 | +| shower | 0.0 | 0.0 | +| radiator | 44.23 | 54.23 | +| glass | 10.28 | 10.61 | +| clock | 20.22 | 29.11 | +| flag | 29.48 | 32.04 | ++---------------------+-------+-------+ +2024/01/02 23:05:51 - mmengine - INFO - Iter(val) [209/209] coco/bbox_mAP: 0.4070 coco/bbox_mAP_50: 0.5900 coco/bbox_mAP_75: 0.4500 coco/bbox_mAP_s: 0.2680 coco/bbox_mAP_m: 0.4630 coco/bbox_mAP_l: 0.5170 coco/segm_mAP: 0.2620 coco/segm_mAP_50: 0.5110 coco/segm_mAP_75: 0.2450 coco/segm_mAP_s: 0.1380 coco/segm_mAP_m: 0.3080 coco/segm_mAP_l: 0.4010 Bleu_1: 0.7035 Bleu_2: 0.5290 Bleu_3: 0.3857 Bleu_4: 0.2783 METEOR: 0.2404 ROUGE_L: 0.5153 CIDEr: 0.8808 SPICE: 0.1724 aAcc: 80.8700 mIoU: 42.8400 mAcc: 55.8500 visual-grounding/miou: 0.7141 visual-grounding/acc: 0.7870 data_time: 0.0042 time: 1.3505 +2024/01/02 23:17:56 - mmengine - INFO - Iter(train) [ 80500/640000] base_lr: 1.9237e-04 lr: 1.9306e-05 eta: 9 days, 11:59:50 time: 1.4569 data_time: 0.0193 memory: 25721 grad_norm: 2.8784 loss: 1.5337 detection_loss_cls: 0.0462 detection_loss_reg: 0.3744 caption_loss_cls: 2.5411 grounding_loss_reg: 3.2986 semantic_segmentation_loss_cls: 0.0122 instance_segmentation_loss_cls: 0.0420 instance_segmentation_loss_reg: 0.3663 instance_segmentation_loss_poly: 1.0310 +2024/01/02 23:30:36 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240102_123251 +2024/01/02 23:30:36 - mmengine - INFO - Iter(train) [ 81000/640000] base_lr: 1.9228e-04 lr: 1.9298e-05 eta: 9 days, 11:57:28 time: 1.4670 data_time: 0.0195 memory: 25721 grad_norm: 2.8583 loss: 1.5245 detection_loss_cls: 0.0464 detection_loss_reg: 0.3758 caption_loss_cls: 2.5434 grounding_loss_reg: 3.2972 semantic_segmentation_loss_cls: 0.0122 instance_segmentation_loss_cls: 0.0420 instance_segmentation_loss_reg: 0.3660 instance_segmentation_loss_poly: 1.0296 +2024/01/02 23:43:18 - mmengine - INFO - Iter(train) [ 81500/640000] base_lr: 1.9218e-04 lr: 1.9289e-05 eta: 9 days, 11:55:33 time: 1.4708 data_time: 0.0195 memory: 25721 grad_norm: 2.8443 loss: 1.5152 detection_loss_cls: 0.0464 detection_loss_reg: 0.3769 caption_loss_cls: 2.5432 grounding_loss_reg: 3.2923 semantic_segmentation_loss_cls: 0.0122 instance_segmentation_loss_cls: 0.0422 instance_segmentation_loss_reg: 0.3666 instance_segmentation_loss_poly: 1.0302 +2024/01/02 23:55:55 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240102_123251 +2024/01/02 23:55:55 - mmengine - INFO - Iter(train) [ 82000/640000] base_lr: 1.9209e-04 lr: 1.9281e-05 eta: 9 days, 11:51:21 time: 1.4677 data_time: 0.0196 memory: 25721 grad_norm: 2.8267 loss: 1.5332 detection_loss_cls: 0.0462 detection_loss_reg: 0.3754 caption_loss_cls: 2.5453 grounding_loss_reg: 3.2878 semantic_segmentation_loss_cls: 0.0122 instance_segmentation_loss_cls: 0.0423 instance_segmentation_loss_reg: 0.3673 instance_segmentation_loss_poly: 1.0323 +2024/01/02 23:55:55 - mmengine - INFO - Saving checkpoint at 82000 iterations +2024/01/03 00:08:52 - mmengine - INFO - Iter(train) [ 82500/640000] base_lr: 1.9199e-04 lr: 1.9272e-05 eta: 9 days, 11:53:33 time: 1.4734 data_time: 0.0197 memory: 25721 grad_norm: 2.7818 loss: 1.5246 detection_loss_cls: 0.0460 detection_loss_reg: 0.3737 caption_loss_cls: 2.5472 grounding_loss_reg: 3.2899 semantic_segmentation_loss_cls: 0.0121 instance_segmentation_loss_cls: 0.0420 instance_segmentation_loss_reg: 0.3649 instance_segmentation_loss_poly: 1.0271 +2024/01/03 00:21:35 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240102_123251 +2024/01/03 00:21:35 - mmengine - INFO - Iter(train) [ 83000/640000] base_lr: 1.9190e-04 lr: 1.9263e-05 eta: 9 days, 11:50:40 time: 1.4871 data_time: 0.0198 memory: 25721 grad_norm: 2.7509 loss: 1.5138 detection_loss_cls: 0.0458 detection_loss_reg: 0.3731 caption_loss_cls: 2.5490 grounding_loss_reg: 3.2851 semantic_segmentation_loss_cls: 0.0121 instance_segmentation_loss_cls: 0.0419 instance_segmentation_loss_reg: 0.3641 instance_segmentation_loss_poly: 1.0246 +2024/01/03 00:34:55 - mmengine - INFO - Iter(train) [ 83500/640000] base_lr: 1.9180e-04 lr: 1.9255e-05 eta: 9 days, 11:59:58 time: 1.5089 data_time: 0.0202 memory: 25721 grad_norm: 2.7217 loss: 1.5042 detection_loss_cls: 0.0457 detection_loss_reg: 0.3720 caption_loss_cls: 2.5512 grounding_loss_reg: 3.2839 semantic_segmentation_loss_cls: 0.0121 instance_segmentation_loss_cls: 0.0418 instance_segmentation_loss_reg: 0.3628 instance_segmentation_loss_poly: 1.0218 +2024/01/03 00:46:48 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240102_123251 +2024/01/03 00:46:48 - mmengine - INFO - Iter(train) [ 84000/640000] base_lr: 1.9170e-04 lr: 1.9246e-05 eta: 9 days, 11:39:26 time: 1.5146 data_time: 0.0203 memory: 25721 grad_norm: 2.7119 loss: 1.4983 detection_loss_cls: 0.0455 detection_loss_reg: 0.3708 caption_loss_cls: 2.5464 grounding_loss_reg: 3.2797 semantic_segmentation_loss_cls: 0.0121 instance_segmentation_loss_cls: 0.0416 instance_segmentation_loss_reg: 0.3619 instance_segmentation_loss_poly: 1.0194 +2024/01/03 00:46:48 - mmengine - INFO - Saving checkpoint at 84000 iterations +2024/01/03 00:59:09 - mmengine - INFO - Iter(train) [ 84500/640000] base_lr: 1.9161e-04 lr: 1.9237e-05 eta: 9 days, 11:28:27 time: 1.5181 data_time: 0.0242 memory: 25721 grad_norm: 2.6819 loss: 1.4968 detection_loss_cls: 0.0456 detection_loss_reg: 0.3711 caption_loss_cls: 2.5448 grounding_loss_reg: 3.2788 semantic_segmentation_loss_cls: 0.0121 instance_segmentation_loss_cls: 0.0417 instance_segmentation_loss_reg: 0.3631 instance_segmentation_loss_poly: 1.0210 +2024/01/03 01:11:39 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240102_123251 +2024/01/03 01:11:39 - mmengine - INFO - Iter(train) [ 85000/640000] base_lr: 1.9151e-04 lr: 1.9228e-05 eta: 9 days, 11:20:07 time: 1.5155 data_time: 0.0241 memory: 25721 grad_norm: 2.6968 loss: 1.4951 detection_loss_cls: 0.0455 detection_loss_reg: 0.3699 caption_loss_cls: 2.5436 grounding_loss_reg: 3.2769 semantic_segmentation_loss_cls: 0.0121 instance_segmentation_loss_cls: 0.0416 instance_segmentation_loss_reg: 0.3629 instance_segmentation_loss_poly: 1.0205 +2024/01/03 01:23:45 - mmengine - INFO - Iter(train) [ 85500/640000] base_lr: 1.9141e-04 lr: 1.9219e-05 eta: 9 days, 11:04:21 time: 1.5065 data_time: 0.0239 memory: 25721 grad_norm: 2.7065 loss: 1.5015 detection_loss_cls: 0.0455 detection_loss_reg: 0.3699 caption_loss_cls: 2.5408 grounding_loss_reg: 3.2728 semantic_segmentation_loss_cls: 0.0121 instance_segmentation_loss_cls: 0.0416 instance_segmentation_loss_reg: 0.3621 instance_segmentation_loss_poly: 1.0184 +2024/01/03 01:35:39 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240102_123251 +2024/01/03 01:35:39 - mmengine - INFO - Iter(train) [ 86000/640000] base_lr: 1.9131e-04 lr: 1.9210e-05 eta: 9 days, 10:45:04 time: 1.4958 data_time: 0.0237 memory: 25721 grad_norm: 2.7199 loss: 1.4934 detection_loss_cls: 0.0453 detection_loss_reg: 0.3688 caption_loss_cls: 2.5416 grounding_loss_reg: 3.2705 semantic_segmentation_loss_cls: 0.0120 instance_segmentation_loss_cls: 0.0415 instance_segmentation_loss_reg: 0.3616 instance_segmentation_loss_poly: 1.0168 +2024/01/03 01:35:39 - mmengine - INFO - Saving checkpoint at 86000 iterations +2024/01/03 01:48:33 - mmengine - INFO - Iter(train) [ 86500/640000] base_lr: 1.9121e-04 lr: 1.9201e-05 eta: 9 days, 10:44:02 time: 1.4952 data_time: 0.0236 memory: 25721 grad_norm: 2.7450 loss: 1.4932 detection_loss_cls: 0.0453 detection_loss_reg: 0.3696 caption_loss_cls: 2.5363 grounding_loss_reg: 3.2667 semantic_segmentation_loss_cls: 0.0120 instance_segmentation_loss_cls: 0.0414 instance_segmentation_loss_reg: 0.3608 instance_segmentation_loss_poly: 1.0147 +2024/01/03 02:00:08 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240102_123251 +2024/01/03 02:00:08 - mmengine - INFO - Iter(train) [ 87000/640000] base_lr: 1.9111e-04 lr: 1.9192e-05 eta: 9 days, 10:18:57 time: 1.4780 data_time: 0.0235 memory: 25721 grad_norm: 2.8053 loss: 1.5206 detection_loss_cls: 0.0453 detection_loss_reg: 0.3690 caption_loss_cls: 2.5324 grounding_loss_reg: 3.2620 semantic_segmentation_loss_cls: 0.0120 instance_segmentation_loss_cls: 0.0416 instance_segmentation_loss_reg: 0.3621 instance_segmentation_loss_poly: 1.0179 +2024/01/03 02:12:07 - mmengine - INFO - Iter(train) [ 87500/640000] base_lr: 1.9101e-04 lr: 1.9183e-05 eta: 9 days, 10:01:27 time: 1.4577 data_time: 0.0233 memory: 25721 grad_norm: 2.8529 loss: 1.5196 detection_loss_cls: 0.0450 detection_loss_reg: 0.3682 caption_loss_cls: 2.5307 grounding_loss_reg: 3.2530 semantic_segmentation_loss_cls: 0.0120 instance_segmentation_loss_cls: 0.0415 instance_segmentation_loss_reg: 0.3614 instance_segmentation_loss_poly: 1.0155 +2024/01/03 02:23:46 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240102_123251 +2024/01/03 02:23:46 - mmengine - INFO - Iter(train) [ 88000/640000] base_lr: 1.9091e-04 lr: 1.9173e-05 eta: 9 days, 9:38:30 time: 1.4543 data_time: 0.0231 memory: 25721 grad_norm: 2.8829 loss: 1.5102 detection_loss_cls: 0.0450 detection_loss_reg: 0.3685 caption_loss_cls: 2.5243 grounding_loss_reg: 3.2485 semantic_segmentation_loss_cls: 0.0119 instance_segmentation_loss_cls: 0.0414 instance_segmentation_loss_reg: 0.3605 instance_segmentation_loss_poly: 1.0137 +2024/01/03 02:23:46 - mmengine - INFO - Saving checkpoint at 88000 iterations +2024/01/03 02:35:38 - mmengine - INFO - Iter(train) [ 88500/640000] base_lr: 1.9080e-04 lr: 1.9164e-05 eta: 9 days, 9:19:21 time: 1.4469 data_time: 0.0227 memory: 25721 grad_norm: 2.9057 loss: 1.5007 detection_loss_cls: 0.0448 detection_loss_reg: 0.3673 caption_loss_cls: 2.5270 grounding_loss_reg: 3.2405 semantic_segmentation_loss_cls: 0.0119 instance_segmentation_loss_cls: 0.0414 instance_segmentation_loss_reg: 0.3603 instance_segmentation_loss_poly: 1.0138 +2024/01/03 02:47:30 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240102_123251 +2024/01/03 02:47:30 - mmengine - INFO - Iter(train) [ 89000/640000] base_lr: 1.9070e-04 lr: 1.9155e-05 eta: 9 days, 9:00:42 time: 1.4377 data_time: 0.0226 memory: 25721 grad_norm: 2.9405 loss: 1.5043 detection_loss_cls: 0.0447 detection_loss_reg: 0.3673 caption_loss_cls: 2.5240 grounding_loss_reg: 3.2347 semantic_segmentation_loss_cls: 0.0119 instance_segmentation_loss_cls: 0.0412 instance_segmentation_loss_reg: 0.3587 instance_segmentation_loss_poly: 1.0107 +2024/01/03 02:59:28 - mmengine - INFO - Iter(train) [ 89500/640000] base_lr: 1.9060e-04 lr: 1.9145e-05 eta: 9 days, 8:43:47 time: 1.4356 data_time: 0.0226 memory: 25721 grad_norm: 3.0086 loss: 1.5081 detection_loss_cls: 0.0447 detection_loss_reg: 0.3676 caption_loss_cls: 2.5264 grounding_loss_reg: 3.2342 semantic_segmentation_loss_cls: 0.0119 instance_segmentation_loss_cls: 0.0413 instance_segmentation_loss_reg: 0.3595 instance_segmentation_loss_poly: 1.0119 +2024/01/03 03:11:42 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240102_123251 +2024/01/03 03:11:42 - mmengine - INFO - Iter(train) [ 90000/640000] base_lr: 1.9050e-04 lr: 1.9136e-05 eta: 9 days, 8:31:21 time: 1.4406 data_time: 0.0227 memory: 25721 grad_norm: 3.0235 loss: 1.5060 detection_loss_cls: 0.0447 detection_loss_reg: 0.3673 caption_loss_cls: 2.5280 grounding_loss_reg: 3.2318 semantic_segmentation_loss_cls: 0.0119 instance_segmentation_loss_cls: 0.0413 instance_segmentation_loss_reg: 0.3598 instance_segmentation_loss_poly: 1.0120 +2024/01/03 03:11:42 - mmengine - INFO - Saving checkpoint at 90000 iterations +2024/01/03 03:24:05 - mmengine - INFO - Iter(train) [ 90500/640000] base_lr: 1.9039e-04 lr: 1.9126e-05 eta: 9 days, 8:21:07 time: 1.4327 data_time: 0.0226 memory: 25721 grad_norm: 3.0014 loss: 1.5075 detection_loss_cls: 0.0447 detection_loss_reg: 0.3672 caption_loss_cls: 2.5248 grounding_loss_reg: 3.2286 semantic_segmentation_loss_cls: 0.0118 instance_segmentation_loss_cls: 0.0414 instance_segmentation_loss_reg: 0.3602 instance_segmentation_loss_poly: 1.0119 +2024/01/03 03:36:32 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240102_123251 +2024/01/03 03:36:32 - mmengine - INFO - Iter(train) [ 91000/640000] base_lr: 1.9029e-04 lr: 1.9117e-05 eta: 9 days, 8:11:59 time: 1.4458 data_time: 0.0227 memory: 25721 grad_norm: 2.9762 loss: 1.4962 detection_loss_cls: 0.0449 detection_loss_reg: 0.3679 caption_loss_cls: 2.5247 grounding_loss_reg: 3.2239 semantic_segmentation_loss_cls: 0.0118 instance_segmentation_loss_cls: 0.0412 instance_segmentation_loss_reg: 0.3601 instance_segmentation_loss_poly: 1.0128 +2024/01/03 03:49:55 - mmengine - INFO - Iter(train) [ 91500/640000] base_lr: 1.9018e-04 lr: 1.9107e-05 eta: 9 days, 8:17:19 time: 1.4669 data_time: 0.0231 memory: 25721 grad_norm: 2.9194 loss: 1.4956 detection_loss_cls: 0.0450 detection_loss_reg: 0.3679 caption_loss_cls: 2.5222 grounding_loss_reg: 3.2244 semantic_segmentation_loss_cls: 0.0118 instance_segmentation_loss_cls: 0.0411 instance_segmentation_loss_reg: 0.3598 instance_segmentation_loss_poly: 1.0130 +2024/01/03 04:02:44 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240102_123251 +2024/01/03 04:02:44 - mmengine - INFO - Iter(train) [ 92000/640000] base_lr: 1.9008e-04 lr: 1.9098e-05 eta: 9 days, 8:13:16 time: 1.4843 data_time: 0.0234 memory: 25721 grad_norm: 2.8499 loss: 1.4901 detection_loss_cls: 0.0448 detection_loss_reg: 0.3677 caption_loss_cls: 2.5225 grounding_loss_reg: 3.2212 semantic_segmentation_loss_cls: 0.0118 instance_segmentation_loss_cls: 0.0410 instance_segmentation_loss_reg: 0.3590 instance_segmentation_loss_poly: 1.0110 +2024/01/03 04:02:44 - mmengine - INFO - Saving checkpoint at 92000 iterations +2024/01/03 04:14:39 - mmengine - INFO - Iter(train) [ 92500/640000] base_lr: 1.8997e-04 lr: 1.9088e-05 eta: 9 days, 7:55:44 time: 1.4853 data_time: 0.0235 memory: 25721 grad_norm: 2.8210 loss: 1.4990 detection_loss_cls: 0.0447 detection_loss_reg: 0.3671 caption_loss_cls: 2.5234 grounding_loss_reg: 3.2205 semantic_segmentation_loss_cls: 0.0118 instance_segmentation_loss_cls: 0.0409 instance_segmentation_loss_reg: 0.3581 instance_segmentation_loss_poly: 1.0084 +2024/01/03 04:26:36 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240102_123251 +2024/01/03 04:26:36 - mmengine - INFO - Iter(train) [ 93000/640000] base_lr: 1.8986e-04 lr: 1.9078e-05 eta: 9 days, 7:38:35 time: 1.4863 data_time: 0.0236 memory: 25721 grad_norm: 2.8013 loss: 1.5085 detection_loss_cls: 0.0446 detection_loss_reg: 0.3668 caption_loss_cls: 2.5236 grounding_loss_reg: 3.2197 semantic_segmentation_loss_cls: 0.0118 instance_segmentation_loss_cls: 0.0409 instance_segmentation_loss_reg: 0.3587 instance_segmentation_loss_poly: 1.0089 +2024/01/03 04:39:04 - mmengine - INFO - Iter(train) [ 93500/640000] base_lr: 1.8975e-04 lr: 1.9069e-05 eta: 9 days, 7:29:18 time: 1.4938 data_time: 0.0238 memory: 25721 grad_norm: 2.7290 loss: 1.5042 detection_loss_cls: 0.0444 detection_loss_reg: 0.3659 caption_loss_cls: 2.5287 grounding_loss_reg: 3.2184 semantic_segmentation_loss_cls: 0.0117 instance_segmentation_loss_cls: 0.0408 instance_segmentation_loss_reg: 0.3583 instance_segmentation_loss_poly: 1.0071 +2024/01/03 04:51:06 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240102_123251 +2024/01/03 04:51:06 - mmengine - INFO - Iter(train) [ 94000/640000] base_lr: 1.8965e-04 lr: 1.9059e-05 eta: 9 days, 7:13:40 time: 1.4908 data_time: 0.0238 memory: 25721 grad_norm: 2.7280 loss: 1.5189 detection_loss_cls: 0.0443 detection_loss_reg: 0.3647 caption_loss_cls: 2.5295 grounding_loss_reg: 3.2176 semantic_segmentation_loss_cls: 0.0117 instance_segmentation_loss_cls: 0.0408 instance_segmentation_loss_reg: 0.3578 instance_segmentation_loss_poly: 1.0059 +2024/01/03 04:51:06 - mmengine - INFO - Saving checkpoint at 94000 iterations +2024/01/03 05:04:12 - mmengine - INFO - Iter(train) [ 94500/640000] base_lr: 1.8954e-04 lr: 1.9049e-05 eta: 9 days, 7:13:01 time: 1.5015 data_time: 0.0239 memory: 25721 grad_norm: 2.7206 loss: 1.5126 detection_loss_cls: 0.0441 detection_loss_reg: 0.3645 caption_loss_cls: 2.5295 grounding_loss_reg: 3.2178 semantic_segmentation_loss_cls: 0.0117 instance_segmentation_loss_cls: 0.0406 instance_segmentation_loss_reg: 0.3572 instance_segmentation_loss_poly: 1.0047 +2024/01/03 05:16:28 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240102_123251 +2024/01/03 05:16:28 - mmengine - INFO - Iter(train) [ 95000/640000] base_lr: 1.8943e-04 lr: 1.9039e-05 eta: 9 days, 7:00:37 time: 1.4988 data_time: 0.0239 memory: 25721 grad_norm: 2.7247 loss: 1.5087 detection_loss_cls: 0.0440 detection_loss_reg: 0.3638 caption_loss_cls: 2.5281 grounding_loss_reg: 3.2122 semantic_segmentation_loss_cls: 0.0116 instance_segmentation_loss_cls: 0.0405 instance_segmentation_loss_reg: 0.3566 instance_segmentation_loss_poly: 1.0027 +2024/01/03 05:28:45 - mmengine - INFO - Iter(train) [ 95500/640000] base_lr: 1.8932e-04 lr: 1.9029e-05 eta: 9 days, 6:48:24 time: 1.4821 data_time: 0.0235 memory: 25721 grad_norm: 2.7594 loss: 1.5028 detection_loss_cls: 0.0442 detection_loss_reg: 0.3655 caption_loss_cls: 2.5258 grounding_loss_reg: 3.2079 semantic_segmentation_loss_cls: 0.0117 instance_segmentation_loss_cls: 0.0405 instance_segmentation_loss_reg: 0.3575 instance_segmentation_loss_poly: 1.0052 +2024/01/03 05:41:22 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240102_123251 +2024/01/03 05:41:22 - mmengine - INFO - Iter(train) [ 96000/640000] base_lr: 1.8921e-04 lr: 1.9019e-05 eta: 9 days, 6:40:53 time: 1.4794 data_time: 0.0234 memory: 25721 grad_norm: 2.7597 loss: 1.4960 detection_loss_cls: 0.0440 detection_loss_reg: 0.3644 caption_loss_cls: 2.5264 grounding_loss_reg: 3.2039 semantic_segmentation_loss_cls: 0.0116 instance_segmentation_loss_cls: 0.0403 instance_segmentation_loss_reg: 0.3558 instance_segmentation_loss_poly: 1.0007 +2024/01/03 05:41:22 - mmengine - INFO - Saving checkpoint at 96000 iterations +2024/01/03 05:54:17 - mmengine - INFO - Iter(train) [ 96500/640000] base_lr: 1.8910e-04 lr: 1.9009e-05 eta: 9 days, 6:37:05 time: 1.4942 data_time: 0.0237 memory: 25721 grad_norm: 2.7520 loss: 1.4866 detection_loss_cls: 0.0440 detection_loss_reg: 0.3644 caption_loss_cls: 2.5319 grounding_loss_reg: 3.1981 semantic_segmentation_loss_cls: 0.0116 instance_segmentation_loss_cls: 0.0405 instance_segmentation_loss_reg: 0.3579 instance_segmentation_loss_poly: 1.0046 +2024/01/03 06:06:55 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240102_123251 +2024/01/03 06:06:55 - mmengine - INFO - Iter(train) [ 97000/640000] base_lr: 1.8899e-04 lr: 1.8999e-05 eta: 9 days, 6:29:23 time: 1.5046 data_time: 0.0238 memory: 25721 grad_norm: 2.7016 loss: 1.4637 detection_loss_cls: 0.0438 detection_loss_reg: 0.3633 caption_loss_cls: 2.5286 grounding_loss_reg: 3.1916 semantic_segmentation_loss_cls: 0.0116 instance_segmentation_loss_cls: 0.0405 instance_segmentation_loss_reg: 0.3577 instance_segmentation_loss_poly: 1.0037 +2024/01/03 06:19:08 - mmengine - INFO - Iter(train) [ 97500/640000] base_lr: 1.8888e-04 lr: 1.8989e-05 eta: 9 days, 6:15:59 time: 1.5007 data_time: 0.0238 memory: 25721 grad_norm: 2.7387 loss: 1.4680 detection_loss_cls: 0.0439 detection_loss_reg: 0.3642 caption_loss_cls: 2.5274 grounding_loss_reg: 3.1896 semantic_segmentation_loss_cls: 0.0116 instance_segmentation_loss_cls: 0.0404 instance_segmentation_loss_reg: 0.3579 instance_segmentation_loss_poly: 1.0031 +2024/01/03 06:31:25 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240102_123251 +2024/01/03 06:31:25 - mmengine - INFO - Iter(train) [ 98000/640000] base_lr: 1.8876e-04 lr: 1.8979e-05 eta: 9 days, 6:03:32 time: 1.5044 data_time: 0.0238 memory: 25721 grad_norm: 2.7310 loss: 1.4524 detection_loss_cls: 0.0440 detection_loss_reg: 0.3654 caption_loss_cls: 2.5251 grounding_loss_reg: 3.1862 semantic_segmentation_loss_cls: 0.0116 instance_segmentation_loss_cls: 0.0405 instance_segmentation_loss_reg: 0.3585 instance_segmentation_loss_poly: 1.0044 +2024/01/03 06:31:25 - mmengine - INFO - Saving checkpoint at 98000 iterations +2024/01/03 06:44:12 - mmengine - INFO - Iter(train) [ 98500/640000] base_lr: 1.8865e-04 lr: 1.8968e-05 eta: 9 days, 5:57:36 time: 1.4999 data_time: 0.0238 memory: 25721 grad_norm: 2.7751 loss: 1.4611 detection_loss_cls: 0.0439 detection_loss_reg: 0.3657 caption_loss_cls: 2.5246 grounding_loss_reg: 3.1852 semantic_segmentation_loss_cls: 0.0116 instance_segmentation_loss_cls: 0.0407 instance_segmentation_loss_reg: 0.3596 instance_segmentation_loss_poly: 1.0070 +2024/01/03 06:56:19 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240102_123251 +2024/01/03 06:56:19 - mmengine - INFO - Iter(train) [ 99000/640000] base_lr: 1.8854e-04 lr: 1.8958e-05 eta: 9 days, 5:43:02 time: 1.4977 data_time: 0.0238 memory: 25721 grad_norm: 2.7951 loss: 1.4643 detection_loss_cls: 0.0438 detection_loss_reg: 0.3651 caption_loss_cls: 2.5187 grounding_loss_reg: 3.1832 semantic_segmentation_loss_cls: 0.0116 instance_segmentation_loss_cls: 0.0407 instance_segmentation_loss_reg: 0.3600 instance_segmentation_loss_poly: 1.0088 +2024/01/03 07:08:53 - mmengine - INFO - Iter(train) [ 99500/640000] base_lr: 1.8842e-04 lr: 1.8948e-05 eta: 9 days, 5:34:03 time: 1.5019 data_time: 0.0239 memory: 25721 grad_norm: 2.8039 loss: 1.4711 detection_loss_cls: 0.0439 detection_loss_reg: 0.3667 caption_loss_cls: 2.5161 grounding_loss_reg: 3.1809 semantic_segmentation_loss_cls: 0.0116 instance_segmentation_loss_cls: 0.0407 instance_segmentation_loss_reg: 0.3596 instance_segmentation_loss_poly: 1.0070 +2024/01/03 07:20:36 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240102_123251 +2024/01/03 07:20:36 - mmengine - INFO - Iter(train) [100000/640000] base_lr: 1.8831e-04 lr: 1.8937e-05 eta: 9 days, 5:14:39 time: 1.4883 data_time: 0.0238 memory: 25721 grad_norm: 2.8756 loss: 1.4995 detection_loss_cls: 0.0440 detection_loss_reg: 0.3673 caption_loss_cls: 2.5084 grounding_loss_reg: 3.1792 semantic_segmentation_loss_cls: 0.0116 instance_segmentation_loss_cls: 0.0406 instance_segmentation_loss_reg: 0.3588 instance_segmentation_loss_poly: 1.0066 +2024/01/03 07:20:36 - mmengine - INFO - Saving checkpoint at 100000 iterations +2024/01/03 07:33:10 - mmengine - INFO - Evaluating bbox... +2024/01/03 07:34:05 - mmengine - INFO - bbox_mAP_copypaste: 0.416 0.601 0.459 0.263 0.467 0.535 +2024/01/03 07:34:05 - mmengine - INFO - Evaluating segm... +2024/01/03 07:35:14 - mmengine - INFO - segm_mAP_copypaste: 0.236 0.477 0.210 0.102 0.274 0.396 +2024/01/03 07:41:44 - mmengine - INFO - per class results: +2024/01/03 07:41:44 - mmengine - INFO - ++---------------------+-------+-------+ +| Class | IoU | Acc | ++---------------------+-------+-------+ +| wall | 75.03 | 92.25 | +| building | 81.86 | 90.2 | +| sky | 93.24 | 96.41 | +| floor | 80.31 | 91.28 | +| tree | 71.31 | 91.81 | +| ceiling | 83.63 | 89.2 | +| road | 81.58 | 86.28 | +| bed | 86.08 | 94.08 | +| windowpane | 59.82 | 74.46 | +| grass | 66.73 | 77.59 | +| cabinet | 58.12 | 83.42 | +| sidewalk | 61.77 | 80.97 | +| person | 79.69 | 89.1 | +| earth | 43.97 | 66.1 | +| door | 28.68 | 29.79 | +| table | 59.82 | 76.31 | +| mountain | 52.03 | 61.93 | +| plant | 46.38 | 55.96 | +| curtain | 71.54 | 80.78 | +| chair | 56.58 | 70.15 | +| car | 82.49 | 92.18 | +| water | 39.85 | 48.82 | +| painting | 72.3 | 84.3 | +| sofa | 67.29 | 85.87 | +| shelf | 41.23 | 71.9 | +| house | 49.52 | 69.17 | +| sea | 55.87 | 78.21 | +| mirror | 52.84 | 55.06 | +| rug | 59.72 | 62.57 | +| field | 25.65 | 41.83 | +| armchair | 40.49 | 51.58 | +| seat | 60.22 | 78.68 | +| fence | 25.3 | 31.04 | +| desk | 47.98 | 67.83 | +| rock | 45.17 | 62.36 | +| wardrobe | 48.44 | 57.35 | +| lamp | 58.24 | 73.74 | +| bathtub | 70.98 | 74.37 | +| railing | 30.51 | 39.69 | +| cushion | 54.44 | 64.74 | +| base | 26.98 | 37.57 | +| box | 17.72 | 20.02 | +| column | 46.4 | 54.18 | +| signboard | 31.8 | 40.08 | +| chest of drawers | 34.08 | 39.35 | +| counter | 38.68 | 42.74 | +| sand | 38.93 | 42.54 | +| sink | 64.91 | 75.11 | +| skyscraper | 51.19 | 66.44 | +| fireplace | 61.46 | 69.34 | +| refrigerator | 69.39 | 75.24 | +| grandstand | 52.73 | 73.78 | +| path | 19.76 | 25.95 | +| stairs | 33.99 | 42.56 | +| runway | 81.04 | 88.78 | +| case | 21.62 | 22.06 | +| pool table | 91.21 | 95.62 | +| pillow | 50.87 | 58.61 | +| screen door | 57.15 | 91.53 | +| stairway | 29.46 | 31.53 | +| river | 12.49 | 49.42 | +| bridge | 58.9 | 83.96 | +| bookcase | 39.4 | 48.6 | +| blind | 41.58 | 44.77 | +| coffee table | 59.92 | 72.1 | +| toilet | 84.63 | 88.68 | +| flower | 30.76 | 40.49 | +| book | 46.43 | 66.37 | +| hill | 14.21 | 18.3 | +| bench | 51.04 | 63.96 | +| countertop | 0.0 | 0.0 | +| stove | 64.59 | 73.22 | +| palm | 45.71 | 64.97 | +| kitchen island | 33.5 | 46.87 | +| computer | 58.24 | 66.06 | +| swivel chair | 32.06 | 39.56 | +| boat | 66.11 | 74.71 | +| bar | 37.11 | 48.25 | +| arcade machine | 54.4 | 57.27 | +| hovel | 45.32 | 74.78 | +| bus | 90.19 | 95.63 | +| towel | 57.93 | 63.01 | +| light | 49.99 | 62.98 | +| truck | 36.0 | 48.38 | +| tower | 23.71 | 35.45 | +| chandelier | 58.87 | 72.34 | +| awning | 27.67 | 36.93 | +| streetlight | 27.65 | 46.94 | +| booth | 23.89 | 85.34 | +| television receiver | 64.43 | 71.93 | +| airplane | 57.9 | 63.37 | +| dirt track | 0.0 | 0.0 | +| apparel | 26.15 | 34.22 | +| pole | 22.27 | 31.01 | +| land | 5.32 | 9.49 | +| bannister | 1.79 | 1.97 | +| escalator | 15.26 | 17.2 | +| ottoman | 42.97 | 70.91 | +| bottle | 15.58 | 17.26 | +| buffet | 39.53 | 61.81 | +| poster | 12.76 | 15.06 | +| stage | 10.48 | 16.61 | +| van | 28.76 | 34.87 | +| ship | 73.23 | 83.87 | +| fountain | 6.0 | 6.04 | +| conveyer belt | 63.08 | 92.95 | +| canopy | 31.74 | 35.69 | +| washer | 45.05 | 45.23 | +| plaything | 12.85 | 14.55 | +| swimming pool | 32.15 | 55.65 | +| stool | 40.38 | 59.75 | +| barrel | 13.36 | 64.57 | +| basket | 27.42 | 30.85 | +| waterfall | 62.09 | 73.27 | +| tent | 89.73 | 94.64 | +| bag | 15.43 | 17.45 | +| minibike | 69.64 | 81.99 | +| cradle | 60.51 | 79.27 | +| oven | 26.87 | 60.37 | +| ball | 37.21 | 41.54 | +| food | 40.78 | 47.17 | +| step | 0.0 | 0.0 | +| tank | 26.8 | 27.89 | +| trade name | 5.01 | 5.02 | +| microwave | 54.43 | 56.82 | +| pot | 42.55 | 49.51 | +| animal | 65.57 | 71.5 | +| bicycle | 57.9 | 71.8 | +| lake | 0.0 | 0.0 | +| dishwasher | 46.88 | 47.51 | +| screen | 67.45 | 81.99 | +| blanket | 12.54 | 14.97 | +| sculpture | 49.26 | 52.44 | +| hood | 52.41 | 55.39 | +| sconce | 22.76 | 24.78 | +| vase | 39.79 | 50.24 | +| traffic light | 28.77 | 40.49 | +| tray | 5.96 | 7.09 | +| ashcan | 32.26 | 42.48 | +| fan | 45.25 | 49.34 | +| pier | 20.52 | 27.63 | +| crt screen | 0.0 | 0.0 | +| plate | 50.64 | 58.73 | +| monitor | 45.64 | 51.33 | +| bulletin board | 29.51 | 33.43 | +| shower | 0.0 | 0.0 | +| radiator | 39.84 | 40.6 | +| glass | 11.06 | 11.54 | +| clock | 18.2 | 20.55 | +| flag | 32.21 | 37.35 | ++---------------------+-------+-------+ +2024/01/03 07:42:00 - mmengine - INFO - Iter(val) [209/209] coco/bbox_mAP: 0.4160 coco/bbox_mAP_50: 0.6010 coco/bbox_mAP_75: 0.4590 coco/bbox_mAP_s: 0.2630 coco/bbox_mAP_m: 0.4670 coco/bbox_mAP_l: 0.5350 coco/segm_mAP: 0.2360 coco/segm_mAP_50: 0.4770 coco/segm_mAP_75: 0.2100 coco/segm_mAP_s: 0.1020 coco/segm_mAP_m: 0.2740 coco/segm_mAP_l: 0.3960 Bleu_1: 0.7185 Bleu_2: 0.5450 Bleu_3: 0.4002 Bleu_4: 0.2891 METEOR: 0.2434 ROUGE_L: 0.5243 CIDEr: 0.9181 SPICE: 0.1787 aAcc: 81.5200 mIoU: 43.6800 mAcc: 53.9500 visual-grounding/miou: 0.7310 visual-grounding/acc: 0.8074 data_time: 0.0045 time: 1.3505 +2024/01/03 07:55:22 - mmengine - INFO - Iter(train) [100500/640000] base_lr: 1.8820e-04 lr: 1.8927e-05 eta: 9 days, 5:15:40 time: 1.4955 data_time: 0.0203 memory: 25721 grad_norm: 2.8291 loss: 1.4887 detection_loss_cls: 0.0438 detection_loss_reg: 0.3670 caption_loss_cls: 2.5071 grounding_loss_reg: 3.1757 semantic_segmentation_loss_cls: 0.0115 instance_segmentation_loss_cls: 0.0406 instance_segmentation_loss_reg: 0.3593 instance_segmentation_loss_poly: 1.0076 +2024/01/03 08:08:15 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240102_123251 +2024/01/03 08:08:15 - mmengine - INFO - Iter(train) [101000/640000] base_lr: 1.8808e-04 lr: 1.8916e-05 eta: 9 days, 5:10:27 time: 1.4994 data_time: 0.0204 memory: 25721 grad_norm: 2.8358 loss: 1.4975 detection_loss_cls: 0.0437 detection_loss_reg: 0.3661 caption_loss_cls: 2.5091 grounding_loss_reg: 3.1754 semantic_segmentation_loss_cls: 0.0115 instance_segmentation_loss_cls: 0.0404 instance_segmentation_loss_reg: 0.3581 instance_segmentation_loss_poly: 1.0041 +2024/01/03 08:20:26 - mmengine - INFO - Iter(train) [101500/640000] base_lr: 1.8796e-04 lr: 1.8906e-05 eta: 9 days, 4:56:28 time: 1.4988 data_time: 0.0205 memory: 25721 grad_norm: 2.8147 loss: 1.4967 detection_loss_cls: 0.0436 detection_loss_reg: 0.3651 caption_loss_cls: 2.5055 grounding_loss_reg: 3.1724 semantic_segmentation_loss_cls: 0.0115 instance_segmentation_loss_cls: 0.0406 instance_segmentation_loss_reg: 0.3593 instance_segmentation_loss_poly: 1.0059 +2024/01/03 08:32:54 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240102_123251 +2024/01/03 08:32:54 - mmengine - INFO - Iter(train) [102000/640000] base_lr: 1.8785e-04 lr: 1.8895e-05 eta: 9 days, 4:46:02 time: 1.5016 data_time: 0.0205 memory: 25721 grad_norm: 2.8076 loss: 1.5042 detection_loss_cls: 0.0436 detection_loss_reg: 0.3647 caption_loss_cls: 2.5048 grounding_loss_reg: 3.1729 semantic_segmentation_loss_cls: 0.0115 instance_segmentation_loss_cls: 0.0406 instance_segmentation_loss_reg: 0.3595 instance_segmentation_loss_poly: 1.0067 +2024/01/03 08:32:54 - mmengine - INFO - Saving checkpoint at 102000 iterations +2024/01/03 08:45:06 - mmengine - INFO - Iter(train) [102500/640000] base_lr: 1.8773e-04 lr: 1.8885e-05 eta: 9 days, 4:32:30 time: 1.4929 data_time: 0.0204 memory: 25721 grad_norm: 2.8354 loss: 1.5115 detection_loss_cls: 0.0438 detection_loss_reg: 0.3658 caption_loss_cls: 2.5081 grounding_loss_reg: 3.1734 semantic_segmentation_loss_cls: 0.0115 instance_segmentation_loss_cls: 0.0406 instance_segmentation_loss_reg: 0.3604 instance_segmentation_loss_poly: 1.0091 +2024/01/03 08:57:50 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240102_123251 +2024/01/03 08:57:50 - mmengine - INFO - Iter(train) [103000/640000] base_lr: 1.8761e-04 lr: 1.8874e-05 eta: 9 days, 4:24:55 time: 1.5019 data_time: 0.0205 memory: 25721 grad_norm: 2.7786 loss: 1.5037 detection_loss_cls: 0.0439 detection_loss_reg: 0.3669 caption_loss_cls: 2.5034 grounding_loss_reg: 3.1705 semantic_segmentation_loss_cls: 0.0115 instance_segmentation_loss_cls: 0.0408 instance_segmentation_loss_reg: 0.3619 instance_segmentation_loss_poly: 1.0124 +2024/01/03 09:09:39 - mmengine - INFO - Iter(train) [103500/640000] base_lr: 1.8750e-04 lr: 1.8863e-05 eta: 9 days, 4:06:59 time: 1.4908 data_time: 0.0203 memory: 25721 grad_norm: 2.7596 loss: 1.5077 detection_loss_cls: 0.0441 detection_loss_reg: 0.3688 caption_loss_cls: 2.4966 grounding_loss_reg: 3.1678 semantic_segmentation_loss_cls: 0.0115 instance_segmentation_loss_cls: 0.0409 instance_segmentation_loss_reg: 0.3619 instance_segmentation_loss_poly: 1.0119 +2024/01/03 09:21:41 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240102_123251 +2024/01/03 09:21:41 - mmengine - INFO - Iter(train) [104000/640000] base_lr: 1.8738e-04 lr: 1.8852e-05 eta: 9 days, 3:51:40 time: 1.4956 data_time: 0.0204 memory: 25721 grad_norm: 2.7047 loss: 1.4986 detection_loss_cls: 0.0444 detection_loss_reg: 0.3699 caption_loss_cls: 2.4959 grounding_loss_reg: 3.1614 semantic_segmentation_loss_cls: 0.0114 instance_segmentation_loss_cls: 0.0410 instance_segmentation_loss_reg: 0.3626 instance_segmentation_loss_poly: 1.0127 +2024/01/03 09:21:41 - mmengine - INFO - Saving checkpoint at 104000 iterations +2024/01/03 09:34:11 - mmengine - INFO - Iter(train) [104500/640000] base_lr: 1.8726e-04 lr: 1.8842e-05 eta: 9 days, 3:41:20 time: 1.4820 data_time: 0.0239 memory: 25721 grad_norm: 2.7331 loss: 1.5096 detection_loss_cls: 0.0445 detection_loss_reg: 0.3703 caption_loss_cls: 2.4995 grounding_loss_reg: 3.1594 semantic_segmentation_loss_cls: 0.0114 instance_segmentation_loss_cls: 0.0410 instance_segmentation_loss_reg: 0.3623 instance_segmentation_loss_poly: 1.0126 +2024/01/03 09:46:54 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240102_123251 +2024/01/03 09:46:54 - mmengine - INFO - Iter(train) [105000/640000] base_lr: 1.8714e-04 lr: 1.8831e-05 eta: 9 days, 3:33:35 time: 1.4795 data_time: 0.0240 memory: 25721 grad_norm: 2.7493 loss: 1.5167 detection_loss_cls: 0.0444 detection_loss_reg: 0.3705 caption_loss_cls: 2.5022 grounding_loss_reg: 3.1512 semantic_segmentation_loss_cls: 0.0114 instance_segmentation_loss_cls: 0.0412 instance_segmentation_loss_reg: 0.3640 instance_segmentation_loss_poly: 1.0158 +2024/01/03 09:59:25 - mmengine - INFO - Iter(train) [105500/640000] base_lr: 1.8702e-04 lr: 1.8820e-05 eta: 9 days, 3:23:29 time: 1.4847 data_time: 0.0240 memory: 25721 grad_norm: 2.7366 loss: 1.5080 detection_loss_cls: 0.0443 detection_loss_reg: 0.3701 caption_loss_cls: 2.5036 grounding_loss_reg: 3.1478 semantic_segmentation_loss_cls: 0.0114 instance_segmentation_loss_cls: 0.0413 instance_segmentation_loss_reg: 0.3651 instance_segmentation_loss_poly: 1.0183 +2024/01/03 10:11:43 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240102_123251 +2024/01/03 10:11:43 - mmengine - INFO - Iter(train) [106000/640000] base_lr: 1.8690e-04 lr: 1.8809e-05 eta: 9 days, 3:10:57 time: 1.4820 data_time: 0.0239 memory: 25721 grad_norm: 2.7256 loss: 1.4998 detection_loss_cls: 0.0443 detection_loss_reg: 0.3713 caption_loss_cls: 2.5027 grounding_loss_reg: 3.1500 semantic_segmentation_loss_cls: 0.0113 instance_segmentation_loss_cls: 0.0413 instance_segmentation_loss_reg: 0.3657 instance_segmentation_loss_poly: 1.0199 +2024/01/03 10:11:43 - mmengine - INFO - Saving checkpoint at 106000 iterations +2024/01/03 10:24:12 - mmengine - INFO - Iter(train) [106500/640000] base_lr: 1.8678e-04 lr: 1.8798e-05 eta: 9 days, 3:00:28 time: 1.4863 data_time: 0.0240 memory: 25721 grad_norm: 2.6617 loss: 1.4860 detection_loss_cls: 0.0444 detection_loss_reg: 0.3726 caption_loss_cls: 2.5050 grounding_loss_reg: 3.1474 semantic_segmentation_loss_cls: 0.0113 instance_segmentation_loss_cls: 0.0413 instance_segmentation_loss_reg: 0.3653 instance_segmentation_loss_poly: 1.0191 +2024/01/03 10:36:23 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240102_123251 +2024/01/03 10:36:23 - mmengine - INFO - Iter(train) [107000/640000] base_lr: 1.8666e-04 lr: 1.8787e-05 eta: 9 days, 2:46:43 time: 1.4781 data_time: 0.0240 memory: 25721 grad_norm: 2.6678 loss: 1.4913 detection_loss_cls: 0.0443 detection_loss_reg: 0.3723 caption_loss_cls: 2.5009 grounding_loss_reg: 3.1497 semantic_segmentation_loss_cls: 0.0113 instance_segmentation_loss_cls: 0.0412 instance_segmentation_loss_reg: 0.3653 instance_segmentation_loss_poly: 1.0198 +2024/01/03 10:48:19 - mmengine - INFO - Iter(train) [107500/640000] base_lr: 1.8653e-04 lr: 1.8776e-05 eta: 9 days, 2:30:24 time: 1.4797 data_time: 0.0240 memory: 25721 grad_norm: 2.6735 loss: 1.4879 detection_loss_cls: 0.0443 detection_loss_reg: 0.3723 caption_loss_cls: 2.5028 grounding_loss_reg: 3.1458 semantic_segmentation_loss_cls: 0.0113 instance_segmentation_loss_cls: 0.0412 instance_segmentation_loss_reg: 0.3664 instance_segmentation_loss_poly: 1.0225 +2024/01/03 11:00:28 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240102_123251 +2024/01/03 11:00:28 - mmengine - INFO - Iter(train) [108000/640000] base_lr: 1.8641e-04 lr: 1.8765e-05 eta: 9 days, 2:16:25 time: 1.4814 data_time: 0.0239 memory: 25721 grad_norm: 2.6769 loss: 1.4843 detection_loss_cls: 0.0445 detection_loss_reg: 0.3740 caption_loss_cls: 2.5072 grounding_loss_reg: 3.1459 semantic_segmentation_loss_cls: 0.0113 instance_segmentation_loss_cls: 0.0411 instance_segmentation_loss_reg: 0.3666 instance_segmentation_loss_poly: 1.0230 +2024/01/03 11:00:28 - mmengine - INFO - Saving checkpoint at 108000 iterations +2024/01/03 11:13:15 - mmengine - INFO - Iter(train) [108500/640000] base_lr: 1.8629e-04 lr: 1.8753e-05 eta: 9 days, 2:08:52 time: 1.4858 data_time: 0.0239 memory: 25721 grad_norm: 2.6809 loss: 1.4798 detection_loss_cls: 0.0446 detection_loss_reg: 0.3750 caption_loss_cls: 2.5049 grounding_loss_reg: 3.1453 semantic_segmentation_loss_cls: 0.0113 instance_segmentation_loss_cls: 0.0412 instance_segmentation_loss_reg: 0.3677 instance_segmentation_loss_poly: 1.0249 +2024/01/03 11:25:39 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240102_123251 +2024/01/03 11:25:39 - mmengine - INFO - Iter(train) [109000/640000] base_lr: 1.8616e-04 lr: 1.8742e-05 eta: 9 days, 1:57:33 time: 1.4811 data_time: 0.0238 memory: 25721 grad_norm: 2.6882 loss: 1.4824 detection_loss_cls: 0.0447 detection_loss_reg: 0.3764 caption_loss_cls: 2.5048 grounding_loss_reg: 3.1463 semantic_segmentation_loss_cls: 0.0113 instance_segmentation_loss_cls: 0.0412 instance_segmentation_loss_reg: 0.3684 instance_segmentation_loss_poly: 1.0256 +2024/01/03 11:37:32 - mmengine - INFO - Iter(train) [109500/640000] base_lr: 1.8604e-04 lr: 1.8731e-05 eta: 9 days, 1:40:53 time: 1.4715 data_time: 0.0235 memory: 25721 grad_norm: 2.6776 loss: 1.4805 detection_loss_cls: 0.0448 detection_loss_reg: 0.3771 caption_loss_cls: 2.5055 grounding_loss_reg: 3.1506 semantic_segmentation_loss_cls: 0.0112 instance_segmentation_loss_cls: 0.0413 instance_segmentation_loss_reg: 0.3693 instance_segmentation_loss_poly: 1.0265 +2024/01/03 11:49:57 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240102_123251 +2024/01/03 11:49:57 - mmengine - INFO - Iter(train) [110000/640000] base_lr: 1.8592e-04 lr: 1.8720e-05 eta: 9 days, 1:29:39 time: 1.4734 data_time: 0.0236 memory: 25721 grad_norm: 2.6714 loss: 1.4938 detection_loss_cls: 0.0448 detection_loss_reg: 0.3779 caption_loss_cls: 2.5060 grounding_loss_reg: 3.1490 semantic_segmentation_loss_cls: 0.0112 instance_segmentation_loss_cls: 0.0413 instance_segmentation_loss_reg: 0.3696 instance_segmentation_loss_poly: 1.0281 +2024/01/03 11:49:57 - mmengine - INFO - Saving checkpoint at 110000 iterations +2024/01/03 12:02:09 - mmengine - INFO - Iter(train) [110500/640000] base_lr: 1.8579e-04 lr: 1.8708e-05 eta: 9 days, 1:16:12 time: 1.4690 data_time: 0.0237 memory: 25721 grad_norm: 2.6813 loss: 1.5070 detection_loss_cls: 0.0447 detection_loss_reg: 0.3767 caption_loss_cls: 2.5089 grounding_loss_reg: 3.1463 semantic_segmentation_loss_cls: 0.0112 instance_segmentation_loss_cls: 0.0413 instance_segmentation_loss_reg: 0.3696 instance_segmentation_loss_poly: 1.0281 +2024/01/03 12:14:55 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240102_123251 +2024/01/03 12:14:55 - mmengine - INFO - Iter(train) [111000/640000] base_lr: 1.8566e-04 lr: 1.8697e-05 eta: 9 days, 1:08:14 time: 1.4777 data_time: 0.0238 memory: 25721 grad_norm: 2.7010 loss: 1.5022 detection_loss_cls: 0.0447 detection_loss_reg: 0.3777 caption_loss_cls: 2.5087 grounding_loss_reg: 3.1459 semantic_segmentation_loss_cls: 0.0112 instance_segmentation_loss_cls: 0.0413 instance_segmentation_loss_reg: 0.3700 instance_segmentation_loss_poly: 1.0283 +2024/01/03 12:27:35 - mmengine - INFO - Iter(train) [111500/640000] base_lr: 1.8554e-04 lr: 1.8685e-05 eta: 9 days, 0:59:21 time: 1.4889 data_time: 0.0241 memory: 25721 grad_norm: 2.7334 loss: 1.5055 detection_loss_cls: 0.0447 detection_loss_reg: 0.3780 caption_loss_cls: 2.5095 grounding_loss_reg: 3.1454 semantic_segmentation_loss_cls: 0.0112 instance_segmentation_loss_cls: 0.0413 instance_segmentation_loss_reg: 0.3709 instance_segmentation_loss_poly: 1.0303 +2024/01/03 14:12:31 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240103_132037 +2024/01/03 14:12:31 - mmengine - INFO - Iter(train) [112000/640000] base_lr: 1.8541e-04 lr: 1.8674e-05 eta: 8 days, 23:08:29 time: 1.4757 data_time: 0.0191 memory: 25718 grad_norm: 2.6593 loss: 1.4880 detection_loss_cls: 0.0445 detection_loss_reg: 0.3770 caption_loss_cls: 2.5010 grounding_loss_reg: 3.1407 semantic_segmentation_loss_cls: 0.0112 instance_segmentation_loss_cls: 0.0413 instance_segmentation_loss_reg: 0.3698 instance_segmentation_loss_poly: 1.0260 +2024/01/03 14:12:31 - mmengine - INFO - Saving checkpoint at 112000 iterations +2024/01/03 14:25:10 - mmengine - INFO - Iter(train) [112500/640000] base_lr: 1.8528e-04 lr: 1.8662e-05 eta: 9 days, 0:26:30 time: 1.4738 data_time: 0.0195 memory: 25718 grad_norm: 2.6563 loss: 1.4822 detection_loss_cls: 0.0443 detection_loss_reg: 0.3757 caption_loss_cls: 2.4930 grounding_loss_reg: 3.1374 semantic_segmentation_loss_cls: 0.0112 instance_segmentation_loss_cls: 0.0412 instance_segmentation_loss_reg: 0.3684 instance_segmentation_loss_poly: 1.0230 +2024/01/03 14:37:13 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240103_132037 +2024/01/03 14:37:13 - mmengine - INFO - Iter(train) [113000/640000] base_lr: 1.8516e-04 lr: 1.8651e-05 eta: 8 days, 23:28:43 time: 1.4684 data_time: 0.0194 memory: 25718 grad_norm: 2.6428 loss: 1.4764 detection_loss_cls: 0.0442 detection_loss_reg: 0.3748 caption_loss_cls: 2.4891 grounding_loss_reg: 3.1370 semantic_segmentation_loss_cls: 0.0112 instance_segmentation_loss_cls: 0.0411 instance_segmentation_loss_reg: 0.3687 instance_segmentation_loss_poly: 1.0239 +2024/01/03 14:49:13 - mmengine - INFO - Iter(train) [113500/640000] base_lr: 1.8503e-04 lr: 1.8639e-05 eta: 8 days, 22:35:40 time: 1.4702 data_time: 0.0195 memory: 25718 grad_norm: 2.6512 loss: 1.4770 detection_loss_cls: 0.0443 detection_loss_reg: 0.3765 caption_loss_cls: 2.4829 grounding_loss_reg: 3.1337 semantic_segmentation_loss_cls: 0.0112 instance_segmentation_loss_cls: 0.0408 instance_segmentation_loss_reg: 0.3682 instance_segmentation_loss_poly: 1.0226 +2024/01/03 15:01:46 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240103_132037 +2024/01/03 15:01:46 - mmengine - INFO - Iter(train) [114000/640000] base_lr: 1.8490e-04 lr: 1.8627e-05 eta: 8 days, 23:05:11 time: 1.4721 data_time: 0.0195 memory: 25718 grad_norm: 2.6422 loss: 1.4602 detection_loss_cls: 0.0442 detection_loss_reg: 0.3764 caption_loss_cls: 2.4790 grounding_loss_reg: 3.1324 semantic_segmentation_loss_cls: 0.0112 instance_segmentation_loss_cls: 0.0408 instance_segmentation_loss_reg: 0.3680 instance_segmentation_loss_poly: 1.0225 +2024/01/03 15:01:46 - mmengine - INFO - Saving checkpoint at 114000 iterations +2024/01/03 15:13:30 - mmengine - INFO - Iter(train) [114500/640000] base_lr: 1.8477e-04 lr: 1.8616e-05 eta: 8 days, 21:51:24 time: 1.4649 data_time: 0.0238 memory: 25718 grad_norm: 2.7062 loss: 1.4750 detection_loss_cls: 0.0442 detection_loss_reg: 0.3761 caption_loss_cls: 2.4779 grounding_loss_reg: 3.1285 semantic_segmentation_loss_cls: 0.0112 instance_segmentation_loss_cls: 0.0407 instance_segmentation_loss_reg: 0.3683 instance_segmentation_loss_poly: 1.0226 +2024/01/03 15:26:17 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240103_132037 +2024/01/03 15:26:17 - mmengine - INFO - Iter(train) [115000/640000] base_lr: 1.8464e-04 lr: 1.8604e-05 eta: 8 days, 22:39:09 time: 1.4710 data_time: 0.0240 memory: 25718 grad_norm: 2.6728 loss: 1.4608 detection_loss_cls: 0.0443 detection_loss_reg: 0.3771 caption_loss_cls: 2.4749 grounding_loss_reg: 3.1258 semantic_segmentation_loss_cls: 0.0112 instance_segmentation_loss_cls: 0.0408 instance_segmentation_loss_reg: 0.3690 instance_segmentation_loss_poly: 1.0236 +2024/01/03 15:38:31 - mmengine - INFO - Iter(train) [115500/640000] base_lr: 1.8451e-04 lr: 1.8592e-05 eta: 8 days, 22:23:38 time: 1.4720 data_time: 0.0242 memory: 25718 grad_norm: 2.6970 loss: 1.4690 detection_loss_cls: 0.0444 detection_loss_reg: 0.3777 caption_loss_cls: 2.4747 grounding_loss_reg: 3.1246 semantic_segmentation_loss_cls: 0.0112 instance_segmentation_loss_cls: 0.0408 instance_segmentation_loss_reg: 0.3697 instance_segmentation_loss_poly: 1.0247 +2024/01/03 15:50:45 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240103_132037 +2024/01/03 15:50:45 - mmengine - INFO - Iter(train) [116000/640000] base_lr: 1.8438e-04 lr: 1.8580e-05 eta: 8 days, 22:08:25 time: 1.4734 data_time: 0.0243 memory: 25718 grad_norm: 2.7216 loss: 1.4716 detection_loss_cls: 0.0441 detection_loss_reg: 0.3763 caption_loss_cls: 2.4782 grounding_loss_reg: 3.1218 semantic_segmentation_loss_cls: 0.0112 instance_segmentation_loss_cls: 0.0408 instance_segmentation_loss_reg: 0.3692 instance_segmentation_loss_poly: 1.0239 +2024/01/03 15:50:45 - mmengine - INFO - Saving checkpoint at 116000 iterations +2024/01/03 16:02:42 - mmengine - INFO - Iter(train) [116500/640000] base_lr: 1.8425e-04 lr: 1.8568e-05 eta: 8 days, 21:31:23 time: 1.4629 data_time: 0.0239 memory: 25718 grad_norm: 2.7501 loss: 1.4750 detection_loss_cls: 0.0439 detection_loss_reg: 0.3749 caption_loss_cls: 2.4725 grounding_loss_reg: 3.1219 semantic_segmentation_loss_cls: 0.0111 instance_segmentation_loss_cls: 0.0406 instance_segmentation_loss_reg: 0.3674 instance_segmentation_loss_poly: 1.0202 +2024/01/03 16:14:51 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240103_132037 +2024/01/03 16:14:51 - mmengine - INFO - Iter(train) [117000/640000] base_lr: 1.8412e-04 lr: 1.8556e-05 eta: 8 days, 21:12:06 time: 1.4642 data_time: 0.0238 memory: 25718 grad_norm: 2.7601 loss: 1.4675 detection_loss_cls: 0.0439 detection_loss_reg: 0.3752 caption_loss_cls: 2.4734 grounding_loss_reg: 3.1198 semantic_segmentation_loss_cls: 0.0111 instance_segmentation_loss_cls: 0.0404 instance_segmentation_loss_reg: 0.3661 instance_segmentation_loss_poly: 1.0171 +2024/01/03 16:27:18 - mmengine - INFO - Iter(train) [117500/640000] base_lr: 1.8398e-04 lr: 1.8544e-05 eta: 8 days, 21:14:52 time: 1.4710 data_time: 0.0240 memory: 25718 grad_norm: 2.7599 loss: 1.4640 detection_loss_cls: 0.0439 detection_loss_reg: 0.3750 caption_loss_cls: 2.4720 grounding_loss_reg: 3.1155 semantic_segmentation_loss_cls: 0.0111 instance_segmentation_loss_cls: 0.0402 instance_segmentation_loss_reg: 0.3652 instance_segmentation_loss_poly: 1.0147 +2024/01/03 16:39:33 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240103_132037 +2024/01/03 16:39:33 - mmengine - INFO - Iter(train) [118000/640000] base_lr: 1.8385e-04 lr: 1.8532e-05 eta: 8 days, 21:02:30 time: 1.4664 data_time: 0.0239 memory: 25718 grad_norm: 2.8014 loss: 1.4744 detection_loss_cls: 0.0439 detection_loss_reg: 0.3744 caption_loss_cls: 2.4679 grounding_loss_reg: 3.1137 semantic_segmentation_loss_cls: 0.0111 instance_segmentation_loss_cls: 0.0402 instance_segmentation_loss_reg: 0.3648 instance_segmentation_loss_poly: 1.0138 +2024/01/03 16:39:33 - mmengine - INFO - Saving checkpoint at 118000 iterations +2024/01/03 16:51:56 - mmengine - INFO - Iter(train) [118500/640000] base_lr: 1.8372e-04 lr: 1.8520e-05 eta: 8 days, 20:58:36 time: 1.4760 data_time: 0.0241 memory: 25718 grad_norm: 2.7750 loss: 1.4646 detection_loss_cls: 0.0437 detection_loss_reg: 0.3731 caption_loss_cls: 2.4701 grounding_loss_reg: 3.1127 semantic_segmentation_loss_cls: 0.0111 instance_segmentation_loss_cls: 0.0400 instance_segmentation_loss_reg: 0.3642 instance_segmentation_loss_poly: 1.0114 +2024/01/03 17:04:01 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240103_132037 +2024/01/03 17:04:01 - mmengine - INFO - Iter(train) [119000/640000] base_lr: 1.8358e-04 lr: 1.8508e-05 eta: 8 days, 20:37:14 time: 1.4657 data_time: 0.0238 memory: 25718 grad_norm: 2.8165 loss: 1.4680 detection_loss_cls: 0.0436 detection_loss_reg: 0.3722 caption_loss_cls: 2.4693 grounding_loss_reg: 3.1113 semantic_segmentation_loss_cls: 0.0111 instance_segmentation_loss_cls: 0.0400 instance_segmentation_loss_reg: 0.3633 instance_segmentation_loss_poly: 1.0094 +2024/01/03 17:17:13 - mmengine - INFO - Iter(train) [119500/640000] base_lr: 1.8345e-04 lr: 1.8496e-05 eta: 8 days, 21:16:32 time: 1.4800 data_time: 0.0239 memory: 25718 grad_norm: 2.7740 loss: 1.4467 detection_loss_cls: 0.0435 detection_loss_reg: 0.3712 caption_loss_cls: 2.4680 grounding_loss_reg: 3.1100 semantic_segmentation_loss_cls: 0.0111 instance_segmentation_loss_cls: 0.0398 instance_segmentation_loss_reg: 0.3629 instance_segmentation_loss_poly: 1.0098 +2024/01/03 17:29:26 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240103_132037 +2024/01/03 17:29:26 - mmengine - INFO - Iter(train) [120000/640000] base_lr: 1.8332e-04 lr: 1.8483e-05 eta: 8 days, 21:00:59 time: 1.4800 data_time: 0.0238 memory: 25718 grad_norm: 2.7696 loss: 1.4368 detection_loss_cls: 0.0433 detection_loss_reg: 0.3693 caption_loss_cls: 2.4690 grounding_loss_reg: 3.1062 semantic_segmentation_loss_cls: 0.0111 instance_segmentation_loss_cls: 0.0395 instance_segmentation_loss_reg: 0.3611 instance_segmentation_loss_poly: 1.0051 +2024/01/03 17:29:26 - mmengine - INFO - Saving checkpoint at 120000 iterations +2024/01/03 17:41:47 - mmengine - INFO - Evaluating bbox... +2024/01/03 17:42:44 - mmengine - INFO - bbox_mAP_copypaste: 0.433 0.613 0.475 0.283 0.485 0.554 +2024/01/03 17:42:44 - mmengine - INFO - Evaluating segm... +2024/01/03 17:43:58 - mmengine - INFO - segm_mAP_copypaste: 0.281 0.524 0.268 0.144 0.319 0.433 +2024/01/03 17:49:58 - mmengine - INFO - per class results: +2024/01/03 17:49:58 - mmengine - INFO - ++---------------------+-------+-------+ +| Class | IoU | Acc | ++---------------------+-------+-------+ +| wall | 76.03 | 87.11 | +| building | 79.9 | 90.76 | +| sky | 93.08 | 97.32 | +| floor | 81.41 | 89.04 | +| tree | 74.01 | 87.22 | +| ceiling | 83.92 | 93.59 | +| road | 80.49 | 91.02 | +| bed | 87.06 | 93.23 | +| windowpane | 61.56 | 77.8 | +| grass | 64.42 | 82.08 | +| cabinet | 59.68 | 73.22 | +| sidewalk | 62.08 | 74.76 | +| person | 79.64 | 89.61 | +| earth | 37.29 | 50.27 | +| door | 45.77 | 58.06 | +| table | 56.03 | 71.05 | +| mountain | 56.02 | 68.91 | +| plant | 50.99 | 67.36 | +| curtain | 73.04 | 89.97 | +| chair | 54.9 | 70.36 | +| car | 81.58 | 92.03 | +| water | 29.21 | 33.01 | +| painting | 66.06 | 87.41 | +| sofa | 68.71 | 85.03 | +| shelf | 44.53 | 69.08 | +| house | 44.28 | 75.06 | +| sea | 51.46 | 91.23 | +| mirror | 64.68 | 75.79 | +| rug | 65.05 | 69.33 | +| field | 29.59 | 52.61 | +| armchair | 40.67 | 61.33 | +| seat | 63.72 | 81.13 | +| fence | 42.85 | 56.81 | +| desk | 37.86 | 66.76 | +| rock | 41.78 | 59.75 | +| wardrobe | 45.32 | 58.77 | +| lamp | 57.21 | 67.26 | +| bathtub | 78.61 | 83.18 | +| railing | 33.4 | 43.56 | +| cushion | 52.83 | 68.91 | +| base | 23.84 | 31.28 | +| box | 24.5 | 41.05 | +| column | 49.44 | 55.76 | +| signboard | 33.55 | 39.9 | +| chest of drawers | 34.88 | 60.11 | +| counter | 23.17 | 23.93 | +| sand | 37.67 | 43.97 | +| sink | 67.26 | 76.74 | +| skyscraper | 48.29 | 61.52 | +| fireplace | 65.74 | 84.01 | +| refrigerator | 73.18 | 83.66 | +| grandstand | 51.37 | 79.32 | +| path | 21.59 | 32.55 | +| stairs | 28.67 | 37.0 | +| runway | 66.79 | 78.23 | +| case | 51.85 | 68.97 | +| pool table | 90.14 | 94.57 | +| pillow | 49.16 | 55.32 | +| screen door | 6.63 | 6.64 | +| stairway | 31.16 | 40.96 | +| river | 16.64 | 37.72 | +| bridge | 70.27 | 85.71 | +| bookcase | 32.98 | 38.91 | +| blind | 45.35 | 54.73 | +| coffee table | 60.37 | 75.38 | +| toilet | 84.82 | 90.06 | +| flower | 24.53 | 32.22 | +| book | 41.99 | 68.31 | +| hill | 9.54 | 18.22 | +| bench | 50.19 | 56.63 | +| countertop | 48.39 | 71.67 | +| stove | 71.0 | 75.45 | +| palm | 42.94 | 80.1 | +| kitchen island | 36.96 | 52.33 | +| computer | 67.36 | 78.07 | +| swivel chair | 36.64 | 45.18 | +| boat | 51.09 | 59.14 | +| bar | 26.41 | 33.44 | +| arcade machine | 43.62 | 45.1 | +| hovel | 11.09 | 11.69 | +| bus | 91.75 | 95.06 | +| towel | 60.05 | 81.26 | +| light | 44.61 | 49.6 | +| truck | 34.61 | 58.45 | +| tower | 17.25 | 27.98 | +| chandelier | 54.77 | 66.82 | +| awning | 29.06 | 41.81 | +| streetlight | 25.21 | 31.85 | +| booth | 38.19 | 39.05 | +| television receiver | 61.72 | 81.48 | +| airplane | 60.24 | 72.71 | +| dirt track | 3.66 | 7.12 | +| apparel | 21.58 | 41.48 | +| pole | 24.35 | 32.37 | +| land | 4.71 | 10.59 | +| bannister | 10.91 | 12.74 | +| escalator | 58.48 | 69.08 | +| ottoman | 48.72 | 66.29 | +| bottle | 18.83 | 22.87 | +| buffet | 30.64 | 31.35 | +| poster | 18.81 | 19.95 | +| stage | 9.23 | 19.03 | +| van | 6.94 | 7.4 | +| ship | 19.42 | 26.56 | +| fountain | 17.61 | 17.78 | +| conveyer belt | 60.25 | 86.67 | +| canopy | 23.84 | 30.31 | +| washer | 64.37 | 70.93 | +| plaything | 19.66 | 25.3 | +| swimming pool | 26.3 | 37.76 | +| stool | 29.07 | 34.09 | +| barrel | 11.02 | 68.51 | +| basket | 34.21 | 43.38 | +| waterfall | 54.64 | 66.44 | +| tent | 80.6 | 90.11 | +| bag | 23.02 | 31.16 | +| minibike | 72.25 | 83.52 | +| cradle | 66.15 | 88.19 | +| oven | 41.67 | 56.52 | +| ball | 47.39 | 70.08 | +| food | 49.76 | 55.46 | +| step | 10.93 | 12.55 | +| tank | 32.92 | 41.62 | +| trade name | 27.15 | 36.84 | +| microwave | 75.77 | 87.69 | +| pot | 40.64 | 46.75 | +| animal | 67.41 | 71.77 | +| bicycle | 54.34 | 67.94 | +| lake | 25.6 | 76.39 | +| dishwasher | 52.01 | 61.84 | +| screen | 55.65 | 80.63 | +| blanket | 17.87 | 23.9 | +| sculpture | 41.8 | 62.41 | +| hood | 55.39 | 62.87 | +| sconce | 36.52 | 55.66 | +| vase | 38.78 | 51.05 | +| traffic light | 33.09 | 43.63 | +| tray | 10.06 | 23.5 | +| ashcan | 29.61 | 39.48 | +| fan | 56.13 | 70.6 | +| pier | 50.55 | 59.05 | +| crt screen | 5.28 | 14.44 | +| plate | 49.07 | 62.91 | +| monitor | 42.57 | 48.13 | +| bulletin board | 36.92 | 56.91 | +| shower | 0.73 | 15.15 | +| radiator | 52.06 | 69.21 | +| glass | 14.12 | 15.16 | +| clock | 26.95 | 37.48 | +| flag | 25.29 | 26.6 | ++---------------------+-------+-------+ +2024/01/03 17:50:16 - mmengine - INFO - Iter(val) [209/209] coco/bbox_mAP: 0.4330 coco/bbox_mAP_50: 0.6130 coco/bbox_mAP_75: 0.4750 coco/bbox_mAP_s: 0.2830 coco/bbox_mAP_m: 0.4850 coco/bbox_mAP_l: 0.5540 coco/segm_mAP: 0.2810 coco/segm_mAP_50: 0.5240 coco/segm_mAP_75: 0.2680 coco/segm_mAP_s: 0.1440 coco/segm_mAP_m: 0.3190 coco/segm_mAP_l: 0.4330 Bleu_1: 0.7052 Bleu_2: 0.5316 Bleu_3: 0.3883 Bleu_4: 0.2805 METEOR: 0.2452 ROUGE_L: 0.5225 CIDEr: 0.9156 SPICE: 0.1790 aAcc: 81.5300 mIoU: 44.8600 mAcc: 57.1800 visual-grounding/miou: 0.7473 visual-grounding/acc: 0.8234 data_time: 0.0119 time: 1.3860 +2024/01/03 18:02:58 - mmengine - INFO - Iter(train) [120500/640000] base_lr: 1.8318e-04 lr: 1.8471e-05 eta: 8 days, 21:10:04 time: 1.4916 data_time: 0.0202 memory: 25719 grad_norm: 2.7237 loss: 1.4107 detection_loss_cls: 0.0431 detection_loss_reg: 0.3679 caption_loss_cls: 2.4622 grounding_loss_reg: 3.1000 semantic_segmentation_loss_cls: 0.0111 instance_segmentation_loss_cls: 0.0393 instance_segmentation_loss_reg: 0.3596 instance_segmentation_loss_poly: 1.0014 +2024/01/03 18:15:38 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240103_132037 +2024/01/03 18:15:38 - mmengine - INFO - Iter(train) [121000/640000] base_lr: 1.8304e-04 lr: 1.8459e-05 eta: 8 days, 21:14:23 time: 1.4994 data_time: 0.0205 memory: 25719 grad_norm: 2.7415 loss: 1.4042 detection_loss_cls: 0.0432 detection_loss_reg: 0.3682 caption_loss_cls: 2.4624 grounding_loss_reg: 3.0992 semantic_segmentation_loss_cls: 0.0111 instance_segmentation_loss_cls: 0.0392 instance_segmentation_loss_reg: 0.3590 instance_segmentation_loss_poly: 1.0002 +2024/01/03 18:27:46 - mmengine - INFO - Iter(train) [121500/640000] base_lr: 1.8291e-04 lr: 1.8446e-05 eta: 8 days, 20:53:20 time: 1.4947 data_time: 0.0205 memory: 25719 grad_norm: 2.7863 loss: 1.4093 detection_loss_cls: 0.0430 detection_loss_reg: 0.3678 caption_loss_cls: 2.4626 grounding_loss_reg: 3.0964 semantic_segmentation_loss_cls: 0.0111 instance_segmentation_loss_cls: 0.0392 instance_segmentation_loss_reg: 0.3596 instance_segmentation_loss_poly: 1.0016 +2024/01/03 18:39:00 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240103_132037 +2024/01/03 18:39:00 - mmengine - INFO - Iter(train) [122000/640000] base_lr: 1.8277e-04 lr: 1.8434e-05 eta: 8 days, 19:54:02 time: 1.4795 data_time: 0.0204 memory: 25719 grad_norm: 2.8661 loss: 1.4133 detection_loss_cls: 0.0430 detection_loss_reg: 0.3685 caption_loss_cls: 2.4631 grounding_loss_reg: 3.0917 semantic_segmentation_loss_cls: 0.0111 instance_segmentation_loss_cls: 0.0390 instance_segmentation_loss_reg: 0.3583 instance_segmentation_loss_poly: 0.9989 +2024/01/03 18:39:00 - mmengine - INFO - Saving checkpoint at 122000 iterations +2024/01/03 18:51:37 - mmengine - INFO - Iter(train) [122500/640000] base_lr: 1.8263e-04 lr: 1.8421e-05 eta: 8 days, 19:56:09 time: 1.4831 data_time: 0.0213 memory: 25719 grad_norm: 2.8904 loss: 1.4149 detection_loss_cls: 0.0430 detection_loss_reg: 0.3687 caption_loss_cls: 2.4590 grounding_loss_reg: 3.0906 semantic_segmentation_loss_cls: 0.0111 instance_segmentation_loss_cls: 0.0390 instance_segmentation_loss_reg: 0.3584 instance_segmentation_loss_poly: 0.9982 +2024/01/03 19:03:02 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240103_132037 +2024/01/03 19:03:02 - mmengine - INFO - Iter(train) [123000/640000] base_lr: 1.8250e-04 lr: 1.8409e-05 eta: 8 days, 19:09:29 time: 1.4730 data_time: 0.0214 memory: 25719 grad_norm: 2.9124 loss: 1.4188 detection_loss_cls: 0.0430 detection_loss_reg: 0.3695 caption_loss_cls: 2.4535 grounding_loss_reg: 3.0835 semantic_segmentation_loss_cls: 0.0110 instance_segmentation_loss_cls: 0.0391 instance_segmentation_loss_reg: 0.3598 instance_segmentation_loss_poly: 1.0017 +2024/01/03 19:15:03 - mmengine - INFO - Iter(train) [123500/640000] base_lr: 1.8236e-04 lr: 1.8396e-05 eta: 8 days, 18:47:40 time: 1.4553 data_time: 0.0217 memory: 25719 grad_norm: 2.9559 loss: 1.4434 detection_loss_cls: 0.0429 detection_loss_reg: 0.3691 caption_loss_cls: 2.4579 grounding_loss_reg: 3.0793 semantic_segmentation_loss_cls: 0.0110 instance_segmentation_loss_cls: 0.0389 instance_segmentation_loss_reg: 0.3591 instance_segmentation_loss_poly: 0.9996 +2024/01/03 19:27:31 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240103_132037 +2024/01/03 19:27:31 - mmengine - INFO - Iter(train) [124000/640000] base_lr: 1.8222e-04 lr: 1.8384e-05 eta: 8 days, 18:44:02 time: 1.4590 data_time: 0.0220 memory: 25719 grad_norm: 2.9644 loss: 1.4455 detection_loss_cls: 0.0425 detection_loss_reg: 0.3676 caption_loss_cls: 2.4545 grounding_loss_reg: 3.0781 semantic_segmentation_loss_cls: 0.0110 instance_segmentation_loss_cls: 0.0386 instance_segmentation_loss_reg: 0.3576 instance_segmentation_loss_poly: 0.9959 +2024/01/03 19:27:31 - mmengine - INFO - Saving checkpoint at 124000 iterations +2024/01/03 19:39:39 - mmengine - INFO - Iter(train) [124500/640000] base_lr: 1.8208e-04 lr: 1.8371e-05 eta: 8 days, 18:27:22 time: 1.4501 data_time: 0.0261 memory: 25719 grad_norm: 3.0324 loss: 1.4771 detection_loss_cls: 0.0421 detection_loss_reg: 0.3650 caption_loss_cls: 2.4560 grounding_loss_reg: 3.0740 semantic_segmentation_loss_cls: 0.0110 instance_segmentation_loss_cls: 0.0383 instance_segmentation_loss_reg: 0.3551 instance_segmentation_loss_poly: 0.9915 +2024/01/03 19:51:35 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240103_132037 +2024/01/03 19:51:35 - mmengine - INFO - Iter(train) [125000/640000] base_lr: 1.8194e-04 lr: 1.8358e-05 eta: 8 days, 18:03:50 time: 1.4390 data_time: 0.0261 memory: 25719 grad_norm: 3.0015 loss: 1.4875 detection_loss_cls: 0.0418 detection_loss_reg: 0.3639 caption_loss_cls: 2.4526 grounding_loss_reg: 3.0767 semantic_segmentation_loss_cls: 0.0110 instance_segmentation_loss_cls: 0.0383 instance_segmentation_loss_reg: 0.3546 instance_segmentation_loss_poly: 0.9893 +2024/01/03 20:03:47 - mmengine - INFO - Iter(train) [125500/640000] base_lr: 1.8180e-04 lr: 1.8346e-05 eta: 8 days, 17:50:44 time: 1.4401 data_time: 0.0262 memory: 25719 grad_norm: 3.0076 loss: 1.4948 detection_loss_cls: 0.0418 detection_loss_reg: 0.3636 caption_loss_cls: 2.4528 grounding_loss_reg: 3.0775 semantic_segmentation_loss_cls: 0.0110 instance_segmentation_loss_cls: 0.0383 instance_segmentation_loss_reg: 0.3549 instance_segmentation_loss_poly: 0.9887 +2024/01/03 20:16:01 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240103_132037 +2024/01/03 20:16:01 - mmengine - INFO - Iter(train) [126000/640000] base_lr: 1.8166e-04 lr: 1.8333e-05 eta: 8 days, 17:38:09 time: 1.4551 data_time: 0.0264 memory: 25719 grad_norm: 2.9194 loss: 1.4824 detection_loss_cls: 0.0418 detection_loss_reg: 0.3634 caption_loss_cls: 2.4511 grounding_loss_reg: 3.0755 semantic_segmentation_loss_cls: 0.0110 instance_segmentation_loss_cls: 0.0384 instance_segmentation_loss_reg: 0.3545 instance_segmentation_loss_poly: 0.9877 +2024/01/03 20:16:01 - mmengine - INFO - Saving checkpoint at 126000 iterations +2024/01/03 20:28:15 - mmengine - INFO - Iter(train) [126500/640000] base_lr: 1.8152e-04 lr: 1.8320e-05 eta: 8 days, 17:25:43 time: 1.4492 data_time: 0.0259 memory: 25719 grad_norm: 2.8890 loss: 1.4750 detection_loss_cls: 0.0418 detection_loss_reg: 0.3632 caption_loss_cls: 2.4513 grounding_loss_reg: 3.0731 semantic_segmentation_loss_cls: 0.0110 instance_segmentation_loss_cls: 0.0384 instance_segmentation_loss_reg: 0.3543 instance_segmentation_loss_poly: 0.9878 +2024/01/03 20:41:18 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240103_132037 +2024/01/03 20:41:18 - mmengine - INFO - Iter(train) [127000/640000] base_lr: 1.8138e-04 lr: 1.8307e-05 eta: 8 days, 17:38:02 time: 1.4736 data_time: 0.0263 memory: 25719 grad_norm: 2.8319 loss: 1.4665 detection_loss_cls: 0.0417 detection_loss_reg: 0.3623 caption_loss_cls: 2.4507 grounding_loss_reg: 3.0706 semantic_segmentation_loss_cls: 0.0110 instance_segmentation_loss_cls: 0.0383 instance_segmentation_loss_reg: 0.3544 instance_segmentation_loss_poly: 0.9874 +2024/01/03 20:53:37 - mmengine - INFO - Iter(train) [127500/640000] base_lr: 1.8124e-04 lr: 1.8294e-05 eta: 8 days, 17:27:10 time: 1.4782 data_time: 0.0262 memory: 25719 grad_norm: 2.8493 loss: 1.4666 detection_loss_cls: 0.0417 detection_loss_reg: 0.3631 caption_loss_cls: 2.4523 grounding_loss_reg: 3.0678 semantic_segmentation_loss_cls: 0.0110 instance_segmentation_loss_cls: 0.0383 instance_segmentation_loss_reg: 0.3541 instance_segmentation_loss_poly: 0.9851 +2024/01/03 21:05:19 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240103_132037 +2024/01/03 21:05:19 - mmengine - INFO - Iter(train) [128000/640000] base_lr: 1.8109e-04 lr: 1.8281e-05 eta: 8 days, 16:58:52 time: 1.4665 data_time: 0.0261 memory: 25719 grad_norm: 2.8403 loss: 1.4719 detection_loss_cls: 0.0416 detection_loss_reg: 0.3617 caption_loss_cls: 2.4505 grounding_loss_reg: 3.0668 semantic_segmentation_loss_cls: 0.0110 instance_segmentation_loss_cls: 0.0383 instance_segmentation_loss_reg: 0.3538 instance_segmentation_loss_poly: 0.9838 +2024/01/03 21:05:19 - mmengine - INFO - Saving checkpoint at 128000 iterations +2024/01/03 21:17:16 - mmengine - INFO - Iter(train) [128500/640000] base_lr: 1.8095e-04 lr: 1.8268e-05 eta: 8 days, 16:38:38 time: 1.4639 data_time: 0.0263 memory: 25719 grad_norm: 2.8478 loss: 1.4754 detection_loss_cls: 0.0416 detection_loss_reg: 0.3614 caption_loss_cls: 2.4504 grounding_loss_reg: 3.0616 semantic_segmentation_loss_cls: 0.0110 instance_segmentation_loss_cls: 0.0384 instance_segmentation_loss_reg: 0.3539 instance_segmentation_loss_poly: 0.9841 +2024/01/03 21:30:06 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240103_132037 +2024/01/03 21:30:06 - mmengine - INFO - Iter(train) [129000/640000] base_lr: 1.8081e-04 lr: 1.8255e-05 eta: 8 days, 16:42:13 time: 1.4775 data_time: 0.0264 memory: 25719 grad_norm: 2.8398 loss: 1.4669 detection_loss_cls: 0.0416 detection_loss_reg: 0.3609 caption_loss_cls: 2.4483 grounding_loss_reg: 3.0561 semantic_segmentation_loss_cls: 0.0110 instance_segmentation_loss_cls: 0.0383 instance_segmentation_loss_reg: 0.3534 instance_segmentation_loss_poly: 0.9827 +2024/01/03 21:43:18 - mmengine - INFO - Iter(train) [129500/640000] base_lr: 1.8066e-04 lr: 1.8242e-05 eta: 8 days, 16:54:54 time: 1.4924 data_time: 0.0266 memory: 25719 grad_norm: 2.7650 loss: 1.4485 detection_loss_cls: 0.0416 detection_loss_reg: 0.3605 caption_loss_cls: 2.4454 grounding_loss_reg: 3.0498 semantic_segmentation_loss_cls: 0.0110 instance_segmentation_loss_cls: 0.0382 instance_segmentation_loss_reg: 0.3524 instance_segmentation_loss_poly: 0.9807 +2024/01/03 21:55:28 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240103_132037 +2024/01/03 21:55:28 - mmengine - INFO - Iter(train) [130000/640000] base_lr: 1.8052e-04 lr: 1.8229e-05 eta: 8 days, 16:39:50 time: 1.4915 data_time: 0.0268 memory: 25719 grad_norm: 2.7623 loss: 1.4640 detection_loss_cls: 0.0416 detection_loss_reg: 0.3607 caption_loss_cls: 2.4435 grounding_loss_reg: 3.0508 semantic_segmentation_loss_cls: 0.0110 instance_segmentation_loss_cls: 0.0381 instance_segmentation_loss_reg: 0.3525 instance_segmentation_loss_poly: 0.9811 +2024/01/03 21:55:28 - mmengine - INFO - Saving checkpoint at 130000 iterations +2024/01/03 22:08:21 - mmengine - INFO - Iter(train) [130500/640000] base_lr: 1.8037e-04 lr: 1.8216e-05 eta: 8 days, 16:42:16 time: 1.5011 data_time: 0.0271 memory: 25719 grad_norm: 2.9271 loss: 1.4557 detection_loss_cls: 0.0417 detection_loss_reg: 0.3608 caption_loss_cls: 2.4387 grounding_loss_reg: 3.0478 semantic_segmentation_loss_cls: 0.0109 instance_segmentation_loss_cls: 0.0381 instance_segmentation_loss_reg: 0.3514 instance_segmentation_loss_poly: 0.9786 +2024/01/03 22:20:16 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240103_132037 +2024/01/03 22:20:16 - mmengine - INFO - Iter(train) [131000/640000] base_lr: 1.8023e-04 lr: 1.8202e-05 eta: 8 days, 16:21:12 time: 1.4843 data_time: 0.0268 memory: 25719 grad_norm: 3.0379 loss: 1.4677 detection_loss_cls: 0.0419 detection_loss_reg: 0.3619 caption_loss_cls: 2.4378 grounding_loss_reg: 3.0474 semantic_segmentation_loss_cls: 0.0109 instance_segmentation_loss_cls: 0.0382 instance_segmentation_loss_reg: 0.3525 instance_segmentation_loss_poly: 0.9805 +2024/01/03 22:32:43 - mmengine - INFO - Iter(train) [131500/640000] base_lr: 1.8008e-04 lr: 1.8189e-05 eta: 8 days, 16:12:45 time: 1.4863 data_time: 0.0268 memory: 25719 grad_norm: 3.0570 loss: 1.4551 detection_loss_cls: 0.0419 detection_loss_reg: 0.3611 caption_loss_cls: 2.4376 grounding_loss_reg: 3.0454 semantic_segmentation_loss_cls: 0.0109 instance_segmentation_loss_cls: 0.0381 instance_segmentation_loss_reg: 0.3512 instance_segmentation_loss_poly: 0.9777 +2024/01/03 22:45:35 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240103_132037 +2024/01/03 22:45:35 - mmengine - INFO - Iter(train) [132000/640000] base_lr: 1.7994e-04 lr: 1.8176e-05 eta: 8 days, 16:13:58 time: 1.5039 data_time: 0.0271 memory: 25719 grad_norm: 3.0100 loss: 1.4388 detection_loss_cls: 0.0419 detection_loss_reg: 0.3609 caption_loss_cls: 2.4393 grounding_loss_reg: 3.0431 semantic_segmentation_loss_cls: 0.0109 instance_segmentation_loss_cls: 0.0380 instance_segmentation_loss_reg: 0.3505 instance_segmentation_loss_poly: 0.9765 +2024/01/03 22:45:35 - mmengine - INFO - Saving checkpoint at 132000 iterations +2024/01/03 22:58:10 - mmengine - INFO - Iter(train) [132500/640000] base_lr: 1.7979e-04 lr: 1.8163e-05 eta: 8 days, 16:08:03 time: 1.5132 data_time: 0.0271 memory: 25719 grad_norm: 2.9815 loss: 1.4337 detection_loss_cls: 0.0418 detection_loss_reg: 0.3597 caption_loss_cls: 2.4419 grounding_loss_reg: 3.0447 semantic_segmentation_loss_cls: 0.0108 instance_segmentation_loss_cls: 0.0380 instance_segmentation_loss_reg: 0.3501 instance_segmentation_loss_poly: 0.9748 +2024/01/03 23:10:02 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240103_132037 +2024/01/03 23:10:02 - mmengine - INFO - Iter(train) [133000/640000] base_lr: 1.7964e-04 lr: 1.8149e-05 eta: 8 days, 15:45:50 time: 1.4987 data_time: 0.0269 memory: 25719 grad_norm: 2.9942 loss: 1.4346 detection_loss_cls: 0.0417 detection_loss_reg: 0.3595 caption_loss_cls: 2.4434 grounding_loss_reg: 3.0418 semantic_segmentation_loss_cls: 0.0108 instance_segmentation_loss_cls: 0.0380 instance_segmentation_loss_reg: 0.3510 instance_segmentation_loss_poly: 0.9766 +2024/01/03 23:21:55 - mmengine - INFO - Iter(train) [133500/640000] base_lr: 1.7949e-04 lr: 1.8136e-05 eta: 8 days, 15:24:42 time: 1.4788 data_time: 0.0265 memory: 25719 grad_norm: 3.0364 loss: 1.4405 detection_loss_cls: 0.0417 detection_loss_reg: 0.3583 caption_loss_cls: 2.4469 grounding_loss_reg: 3.0393 semantic_segmentation_loss_cls: 0.0108 instance_segmentation_loss_cls: 0.0380 instance_segmentation_loss_reg: 0.3500 instance_segmentation_loss_poly: 0.9742 +2024/01/03 23:33:25 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240103_132037 +2024/01/03 23:33:25 - mmengine - INFO - Iter(train) [134000/640000] base_lr: 1.7934e-04 lr: 1.8122e-05 eta: 8 days, 14:55:57 time: 1.4689 data_time: 0.0262 memory: 25719 grad_norm: 3.0431 loss: 1.4296 detection_loss_cls: 0.0416 detection_loss_reg: 0.3581 caption_loss_cls: 2.4473 grounding_loss_reg: 3.0338 semantic_segmentation_loss_cls: 0.0108 instance_segmentation_loss_cls: 0.0380 instance_segmentation_loss_reg: 0.3493 instance_segmentation_loss_poly: 0.9732 +2024/01/03 23:33:25 - mmengine - INFO - Saving checkpoint at 134000 iterations +2024/01/03 23:45:47 - mmengine - INFO - Iter(train) [134500/640000] base_lr: 1.7920e-04 lr: 1.8109e-05 eta: 8 days, 14:45:35 time: 1.4613 data_time: 0.0260 memory: 25719 grad_norm: 2.8796 loss: 1.4442 detection_loss_cls: 0.0417 detection_loss_reg: 0.3584 caption_loss_cls: 2.4467 grounding_loss_reg: 3.0310 semantic_segmentation_loss_cls: 0.0108 instance_segmentation_loss_cls: 0.0381 instance_segmentation_loss_reg: 0.3497 instance_segmentation_loss_poly: 0.9736 +2024/01/03 23:58:27 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240103_132037 +2024/01/03 23:58:27 - mmengine - INFO - Iter(train) [135000/640000] base_lr: 1.7905e-04 lr: 1.8095e-05 eta: 8 days, 14:41:11 time: 1.4723 data_time: 0.0262 memory: 25719 grad_norm: 2.7659 loss: 1.4300 detection_loss_cls: 0.0415 detection_loss_reg: 0.3571 caption_loss_cls: 2.4449 grounding_loss_reg: 3.0278 semantic_segmentation_loss_cls: 0.0108 instance_segmentation_loss_cls: 0.0381 instance_segmentation_loss_reg: 0.3495 instance_segmentation_loss_poly: 0.9735 +2024/01/04 00:11:10 - mmengine - INFO - Iter(train) [135500/640000] base_lr: 1.7890e-04 lr: 1.8082e-05 eta: 8 days, 14:37:40 time: 1.4765 data_time: 0.0262 memory: 25719 grad_norm: 2.7022 loss: 1.4258 detection_loss_cls: 0.0414 detection_loss_reg: 0.3566 caption_loss_cls: 2.4407 grounding_loss_reg: 3.0269 semantic_segmentation_loss_cls: 0.0108 instance_segmentation_loss_cls: 0.0381 instance_segmentation_loss_reg: 0.3491 instance_segmentation_loss_poly: 0.9733 +2024/01/04 00:23:50 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240103_132037 +2024/01/04 00:23:50 - mmengine - INFO - Iter(train) [136000/640000] base_lr: 1.7875e-04 lr: 1.8068e-05 eta: 8 days, 14:32:40 time: 1.4734 data_time: 0.0262 memory: 25719 grad_norm: 2.7256 loss: 1.4366 detection_loss_cls: 0.0412 detection_loss_reg: 0.3564 caption_loss_cls: 2.4427 grounding_loss_reg: 3.0273 semantic_segmentation_loss_cls: 0.0107 instance_segmentation_loss_cls: 0.0379 instance_segmentation_loss_reg: 0.3485 instance_segmentation_loss_poly: 0.9712 +2024/01/04 00:23:50 - mmengine - INFO - Saving checkpoint at 136000 iterations +2024/01/04 00:36:52 - mmengine - INFO - Iter(train) [136500/640000] base_lr: 1.7860e-04 lr: 1.8054e-05 eta: 8 days, 14:34:18 time: 1.4801 data_time: 0.0264 memory: 25719 grad_norm: 2.6829 loss: 1.4236 detection_loss_cls: 0.0413 detection_loss_reg: 0.3573 caption_loss_cls: 2.4404 grounding_loss_reg: 3.0256 semantic_segmentation_loss_cls: 0.0107 instance_segmentation_loss_cls: 0.0380 instance_segmentation_loss_reg: 0.3493 instance_segmentation_loss_poly: 0.9729 +2024/01/04 00:49:33 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240103_132037 +2024/01/04 00:49:33 - mmengine - INFO - Iter(train) [137000/640000] base_lr: 1.7844e-04 lr: 1.8040e-05 eta: 8 days, 14:28:57 time: 1.4925 data_time: 0.0268 memory: 25719 grad_norm: 2.6521 loss: 1.4189 detection_loss_cls: 0.0414 detection_loss_reg: 0.3586 caption_loss_cls: 2.4417 grounding_loss_reg: 3.0234 semantic_segmentation_loss_cls: 0.0107 instance_segmentation_loss_cls: 0.0381 instance_segmentation_loss_reg: 0.3501 instance_segmentation_loss_poly: 0.9747 +2024/01/04 01:02:56 - mmengine - INFO - Iter(train) [137500/640000] base_lr: 1.7829e-04 lr: 1.8027e-05 eta: 8 days, 14:36:05 time: 1.5150 data_time: 0.0272 memory: 25719 grad_norm: 2.6010 loss: 1.4144 detection_loss_cls: 0.0413 detection_loss_reg: 0.3587 caption_loss_cls: 2.4459 grounding_loss_reg: 3.0261 semantic_segmentation_loss_cls: 0.0107 instance_segmentation_loss_cls: 0.0380 instance_segmentation_loss_reg: 0.3505 instance_segmentation_loss_poly: 0.9757 +2024/01/04 01:14:47 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240103_132037 +2024/01/04 01:14:47 - mmengine - INFO - Iter(train) [138000/640000] base_lr: 1.7814e-04 lr: 1.8013e-05 eta: 8 days, 14:15:10 time: 1.5202 data_time: 0.0274 memory: 25719 grad_norm: 2.5954 loss: 1.4144 detection_loss_cls: 0.0411 detection_loss_reg: 0.3578 caption_loss_cls: 2.4474 grounding_loss_reg: 3.0262 semantic_segmentation_loss_cls: 0.0106 instance_segmentation_loss_cls: 0.0379 instance_segmentation_loss_reg: 0.3504 instance_segmentation_loss_poly: 0.9751 +2024/01/04 01:14:47 - mmengine - INFO - Saving checkpoint at 138000 iterations +2024/01/04 01:27:15 - mmengine - INFO - Iter(train) [138500/640000] base_lr: 1.7799e-04 lr: 1.7999e-05 eta: 8 days, 14:05:19 time: 1.5218 data_time: 0.0275 memory: 25719 grad_norm: 2.6046 loss: 1.4095 detection_loss_cls: 0.0410 detection_loss_reg: 0.3570 caption_loss_cls: 2.4444 grounding_loss_reg: 3.0227 semantic_segmentation_loss_cls: 0.0106 instance_segmentation_loss_cls: 0.0378 instance_segmentation_loss_reg: 0.3499 instance_segmentation_loss_poly: 0.9743 +2024/01/04 01:39:44 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240103_132037 +2024/01/04 01:39:44 - mmengine - INFO - Iter(train) [139000/640000] base_lr: 1.7784e-04 lr: 1.7985e-05 eta: 8 days, 13:55:32 time: 1.5191 data_time: 0.0274 memory: 25719 grad_norm: 2.6630 loss: 1.4011 detection_loss_cls: 0.0408 detection_loss_reg: 0.3569 caption_loss_cls: 2.4395 grounding_loss_reg: 3.0169 semantic_segmentation_loss_cls: 0.0106 instance_segmentation_loss_cls: 0.0377 instance_segmentation_loss_reg: 0.3494 instance_segmentation_loss_poly: 0.9725 +2024/01/04 01:51:47 - mmengine - INFO - Iter(train) [139500/640000] base_lr: 1.7768e-04 lr: 1.7971e-05 eta: 8 days, 13:38:15 time: 1.5088 data_time: 0.0273 memory: 25719 grad_norm: 2.7224 loss: 1.4151 detection_loss_cls: 0.0410 detection_loss_reg: 0.3580 caption_loss_cls: 2.4425 grounding_loss_reg: 3.0145 semantic_segmentation_loss_cls: 0.0106 instance_segmentation_loss_cls: 0.0378 instance_segmentation_loss_reg: 0.3497 instance_segmentation_loss_poly: 0.9724 +2024/01/04 02:03:44 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240103_132037 +2024/01/04 02:03:44 - mmengine - INFO - Iter(train) [140000/640000] base_lr: 1.7753e-04 lr: 1.7957e-05 eta: 8 days, 13:19:41 time: 1.4982 data_time: 0.0273 memory: 25719 grad_norm: 2.7294 loss: 1.4254 detection_loss_cls: 0.0412 detection_loss_reg: 0.3598 caption_loss_cls: 2.4426 grounding_loss_reg: 3.0148 semantic_segmentation_loss_cls: 0.0106 instance_segmentation_loss_cls: 0.0380 instance_segmentation_loss_reg: 0.3525 instance_segmentation_loss_poly: 0.9787 +2024/01/04 02:03:44 - mmengine - INFO - Saving checkpoint at 140000 iterations +2024/01/04 02:16:26 - mmengine - INFO - Evaluating bbox... +2024/01/04 02:17:23 - mmengine - INFO - bbox_mAP_copypaste: 0.447 0.627 0.491 0.288 0.504 0.575 +2024/01/04 02:17:23 - mmengine - INFO - Evaluating segm... +2024/01/04 02:18:35 - mmengine - INFO - segm_mAP_copypaste: 0.290 0.539 0.278 0.149 0.338 0.454 +2024/01/04 02:24:56 - mmengine - INFO - per class results: +2024/01/04 02:24:56 - mmengine - INFO - ++---------------------+-------+-------+ +| Class | IoU | Acc | ++---------------------+-------+-------+ +| wall | 76.53 | 88.29 | +| building | 80.84 | 88.49 | +| sky | 92.8 | 97.94 | +| floor | 79.93 | 90.07 | +| tree | 72.56 | 86.17 | +| ceiling | 82.85 | 94.43 | +| road | 82.13 | 86.68 | +| bed | 87.58 | 94.54 | +| windowpane | 62.26 | 77.96 | +| grass | 66.2 | 84.11 | +| cabinet | 56.7 | 64.74 | +| sidewalk | 62.4 | 78.1 | +| person | 78.6 | 88.37 | +| earth | 39.95 | 57.82 | +| door | 51.19 | 65.08 | +| table | 60.18 | 76.05 | +| mountain | 61.6 | 81.76 | +| plant | 48.17 | 56.65 | +| curtain | 70.54 | 87.1 | +| chair | 58.07 | 75.94 | +| car | 81.87 | 87.9 | +| water | 54.46 | 66.47 | +| painting | 72.43 | 86.72 | +| sofa | 69.17 | 84.12 | +| shelf | 46.11 | 72.1 | +| house | 48.65 | 68.04 | +| sea | 57.8 | 82.04 | +| mirror | 62.09 | 80.68 | +| rug | 63.86 | 68.02 | +| field | 27.29 | 40.98 | +| armchair | 43.65 | 56.84 | +| seat | 59.3 | 86.16 | +| fence | 45.35 | 67.87 | +| desk | 39.13 | 46.23 | +| rock | 37.41 | 47.57 | +| wardrobe | 45.53 | 55.85 | +| lamp | 57.09 | 74.79 | +| bathtub | 77.49 | 84.5 | +| railing | 32.6 | 48.58 | +| cushion | 51.07 | 59.96 | +| base | 26.82 | 33.78 | +| box | 25.08 | 31.04 | +| column | 48.15 | 58.7 | +| signboard | 36.8 | 56.13 | +| chest of drawers | 41.02 | 75.61 | +| counter | 35.31 | 42.36 | +| sand | 37.16 | 53.52 | +| sink | 66.72 | 80.82 | +| skyscraper | 57.67 | 83.26 | +| fireplace | 70.05 | 83.16 | +| refrigerator | 75.25 | 84.25 | +| grandstand | 27.34 | 87.14 | +| path | 19.92 | 33.06 | +| stairs | 32.93 | 43.41 | +| runway | 74.37 | 75.55 | +| case | 54.01 | 72.12 | +| pool table | 89.51 | 94.75 | +| pillow | 55.81 | 74.01 | +| screen door | 77.02 | 87.65 | +| stairway | 30.14 | 40.6 | +| river | 18.32 | 28.6 | +| bridge | 69.31 | 83.57 | +| bookcase | 33.53 | 44.6 | +| blind | 29.21 | 30.5 | +| coffee table | 60.57 | 69.85 | +| toilet | 76.26 | 88.89 | +| flower | 33.36 | 46.19 | +| book | 44.28 | 77.2 | +| hill | 7.58 | 11.36 | +| bench | 51.13 | 56.99 | +| countertop | 45.82 | 69.93 | +| stove | 67.2 | 74.91 | +| palm | 41.68 | 61.1 | +| kitchen island | 34.97 | 85.31 | +| computer | 70.76 | 86.45 | +| swivel chair | 46.19 | 64.6 | +| boat | 50.99 | 53.73 | +| bar | 38.04 | 46.19 | +| arcade machine | 62.54 | 75.57 | +| hovel | 41.06 | 51.56 | +| bus | 84.84 | 94.08 | +| towel | 54.26 | 70.45 | +| light | 44.28 | 51.03 | +| truck | 26.95 | 38.77 | +| tower | 26.58 | 47.72 | +| chandelier | 60.22 | 77.92 | +| awning | 36.34 | 51.53 | +| streetlight | 27.02 | 37.35 | +| booth | 23.72 | 23.8 | +| television receiver | 66.78 | 79.54 | +| airplane | 49.13 | 67.36 | +| dirt track | 1.94 | 6.18 | +| apparel | 30.64 | 40.99 | +| pole | 25.03 | 38.13 | +| land | 1.75 | 2.76 | +| bannister | 13.08 | 18.05 | +| escalator | 23.28 | 23.97 | +| ottoman | 50.01 | 68.33 | +| bottle | 21.68 | 29.48 | +| buffet | 39.47 | 47.83 | +| poster | 25.32 | 34.47 | +| stage | 5.7 | 7.51 | +| van | 38.18 | 44.44 | +| ship | 40.98 | 60.46 | +| fountain | 1.96 | 1.97 | +| conveyer belt | 70.65 | 92.25 | +| canopy | 21.09 | 22.34 | +| washer | 61.39 | 72.62 | +| plaything | 33.04 | 57.95 | +| swimming pool | 38.4 | 88.62 | +| stool | 43.75 | 58.45 | +| barrel | 27.91 | 53.84 | +| basket | 30.76 | 51.01 | +| waterfall | 63.94 | 86.21 | +| tent | 82.79 | 87.87 | +| bag | 17.12 | 19.55 | +| minibike | 68.51 | 74.18 | +| cradle | 63.77 | 77.19 | +| oven | 35.71 | 57.32 | +| ball | 42.64 | 67.16 | +| food | 51.95 | 56.58 | +| step | 10.59 | 12.19 | +| tank | 34.86 | 38.89 | +| trade name | 10.49 | 11.24 | +| microwave | 60.57 | 68.52 | +| pot | 48.1 | 55.48 | +| animal | 68.67 | 74.64 | +| bicycle | 52.69 | 80.55 | +| lake | 62.17 | 62.32 | +| dishwasher | 60.92 | 76.85 | +| screen | 61.95 | 80.23 | +| blanket | 7.26 | 8.18 | +| sculpture | 37.81 | 62.04 | +| hood | 47.73 | 59.02 | +| sconce | 33.98 | 48.76 | +| vase | 36.96 | 61.23 | +| traffic light | 34.72 | 52.83 | +| tray | 3.06 | 4.64 | +| ashcan | 38.2 | 56.53 | +| fan | 40.59 | 44.56 | +| pier | 27.93 | 33.95 | +| crt screen | 9.54 | 21.31 | +| plate | 51.31 | 69.97 | +| monitor | 26.34 | 34.32 | +| bulletin board | 28.99 | 44.45 | +| shower | 1.18 | 2.91 | +| radiator | 57.8 | 64.61 | +| glass | 15.54 | 17.79 | +| clock | 22.02 | 31.99 | +| flag | 30.24 | 37.01 | ++---------------------+-------+-------+ +2024/01/04 02:25:13 - mmengine - INFO - Iter(val) [209/209] coco/bbox_mAP: 0.4470 coco/bbox_mAP_50: 0.6270 coco/bbox_mAP_75: 0.4910 coco/bbox_mAP_s: 0.2880 coco/bbox_mAP_m: 0.5040 coco/bbox_mAP_l: 0.5750 coco/segm_mAP: 0.2900 coco/segm_mAP_50: 0.5390 coco/segm_mAP_75: 0.2780 coco/segm_mAP_s: 0.1490 coco/segm_mAP_m: 0.3380 coco/segm_mAP_l: 0.4540 Bleu_1: 0.7116 Bleu_2: 0.5403 Bleu_3: 0.3968 Bleu_4: 0.2895 METEOR: 0.2447 ROUGE_L: 0.5203 CIDEr: 0.9270 SPICE: 0.1807 aAcc: 82.1600 mIoU: 46.2800 mAcc: 59.2500 visual-grounding/miou: 0.7436 visual-grounding/acc: 0.8201 data_time: 0.0036 time: 1.3598 +2024/01/04 02:37:55 - mmengine - INFO - Iter(train) [140500/640000] base_lr: 1.7737e-04 lr: 1.7943e-05 eta: 8 days, 13:14:11 time: 1.4938 data_time: 0.0230 memory: 25719 grad_norm: 2.7436 loss: 1.4334 detection_loss_cls: 0.0412 detection_loss_reg: 0.3607 caption_loss_cls: 2.4436 grounding_loss_reg: 3.0119 semantic_segmentation_loss_cls: 0.0106 instance_segmentation_loss_cls: 0.0381 instance_segmentation_loss_reg: 0.3540 instance_segmentation_loss_poly: 0.9817 +2024/01/04 02:49:28 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240103_132037 +2024/01/04 02:49:28 - mmengine - INFO - Iter(train) [141000/640000] base_lr: 1.7722e-04 lr: 1.7929e-05 eta: 8 days, 12:49:11 time: 1.4766 data_time: 0.0226 memory: 25719 grad_norm: 2.7743 loss: 1.4517 detection_loss_cls: 0.0412 detection_loss_reg: 0.3616 caption_loss_cls: 2.4459 grounding_loss_reg: 3.0103 semantic_segmentation_loss_cls: 0.0106 instance_segmentation_loss_cls: 0.0381 instance_segmentation_loss_reg: 0.3542 instance_segmentation_loss_poly: 0.9819 +2024/01/04 03:01:28 - mmengine - INFO - Iter(train) [141500/640000] base_lr: 1.7706e-04 lr: 1.7915e-05 eta: 8 days, 12:32:04 time: 1.4561 data_time: 0.0222 memory: 25719 grad_norm: 2.8058 loss: 1.4592 detection_loss_cls: 0.0413 detection_loss_reg: 0.3624 caption_loss_cls: 2.4468 grounding_loss_reg: 3.0109 semantic_segmentation_loss_cls: 0.0106 instance_segmentation_loss_cls: 0.0380 instance_segmentation_loss_reg: 0.3536 instance_segmentation_loss_poly: 0.9809 +2024/01/04 03:13:07 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240103_132037 +2024/01/04 03:13:07 - mmengine - INFO - Iter(train) [142000/640000] base_lr: 1.7691e-04 lr: 1.7901e-05 eta: 8 days, 12:09:25 time: 1.4529 data_time: 0.0222 memory: 25719 grad_norm: 2.8341 loss: 1.4702 detection_loss_cls: 0.0414 detection_loss_reg: 0.3631 caption_loss_cls: 2.4458 grounding_loss_reg: 3.0120 semantic_segmentation_loss_cls: 0.0106 instance_segmentation_loss_cls: 0.0382 instance_segmentation_loss_reg: 0.3553 instance_segmentation_loss_poly: 0.9836 +2024/01/04 03:13:07 - mmengine - INFO - Saving checkpoint at 142000 iterations +2024/01/04 03:24:59 - mmengine - INFO - Iter(train) [142500/640000] base_lr: 1.7675e-04 lr: 1.7887e-05 eta: 8 days, 11:50:19 time: 1.4438 data_time: 0.0220 memory: 25719 grad_norm: 2.8316 loss: 1.4721 detection_loss_cls: 0.0412 detection_loss_reg: 0.3622 caption_loss_cls: 2.4491 grounding_loss_reg: 3.0081 semantic_segmentation_loss_cls: 0.0106 instance_segmentation_loss_cls: 0.0383 instance_segmentation_loss_reg: 0.3558 instance_segmentation_loss_poly: 0.9848 +2024/01/04 03:36:54 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240103_132037 +2024/01/04 03:36:54 - mmengine - INFO - Iter(train) [143000/640000] base_lr: 1.7660e-04 lr: 1.7872e-05 eta: 8 days, 11:32:19 time: 1.4353 data_time: 0.0218 memory: 25719 grad_norm: 2.8240 loss: 1.4876 detection_loss_cls: 0.0409 detection_loss_reg: 0.3607 caption_loss_cls: 2.4464 grounding_loss_reg: 3.0084 semantic_segmentation_loss_cls: 0.0106 instance_segmentation_loss_cls: 0.0380 instance_segmentation_loss_reg: 0.3535 instance_segmentation_loss_poly: 0.9791 +2024/01/04 03:48:58 - mmengine - INFO - Iter(train) [143500/640000] base_lr: 1.7644e-04 lr: 1.7858e-05 eta: 8 days, 11:16:49 time: 1.4358 data_time: 0.0218 memory: 25719 grad_norm: 2.7752 loss: 1.4772 detection_loss_cls: 0.0411 detection_loss_reg: 0.3620 caption_loss_cls: 2.4395 grounding_loss_reg: 3.0041 semantic_segmentation_loss_cls: 0.0106 instance_segmentation_loss_cls: 0.0379 instance_segmentation_loss_reg: 0.3533 instance_segmentation_loss_poly: 0.9788 +2024/01/04 04:01:15 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240103_132037 +2024/01/04 04:01:15 - mmengine - INFO - Iter(train) [144000/640000] base_lr: 1.7628e-04 lr: 1.7844e-05 eta: 8 days, 11:04:35 time: 1.4408 data_time: 0.0217 memory: 25719 grad_norm: 2.7434 loss: 1.4621 detection_loss_cls: 0.0412 detection_loss_reg: 0.3626 caption_loss_cls: 2.4389 grounding_loss_reg: 3.0049 semantic_segmentation_loss_cls: 0.0106 instance_segmentation_loss_cls: 0.0381 instance_segmentation_loss_reg: 0.3548 instance_segmentation_loss_poly: 0.9825 +2024/01/04 04:01:15 - mmengine - INFO - Saving checkpoint at 144000 iterations +2024/01/04 04:13:43 - mmengine - INFO - Iter(train) [144500/640000] base_lr: 1.7612e-04 lr: 1.7829e-05 eta: 8 days, 10:54:48 time: 1.4366 data_time: 0.0257 memory: 25719 grad_norm: 2.7272 loss: 1.4562 detection_loss_cls: 0.0413 detection_loss_reg: 0.3643 caption_loss_cls: 2.4323 grounding_loss_reg: 3.0046 semantic_segmentation_loss_cls: 0.0106 instance_segmentation_loss_cls: 0.0381 instance_segmentation_loss_reg: 0.3553 instance_segmentation_loss_poly: 0.9824 +2024/01/04 04:26:09 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240103_132037 +2024/01/04 04:26:09 - mmengine - INFO - Iter(train) [145000/640000] base_lr: 1.7596e-04 lr: 1.7815e-05 eta: 8 days, 10:44:33 time: 1.4500 data_time: 0.0260 memory: 25719 grad_norm: 2.7265 loss: 1.4420 detection_loss_cls: 0.0413 detection_loss_reg: 0.3638 caption_loss_cls: 2.4299 grounding_loss_reg: 3.0007 semantic_segmentation_loss_cls: 0.0105 instance_segmentation_loss_cls: 0.0382 instance_segmentation_loss_reg: 0.3559 instance_segmentation_loss_poly: 0.9836 +2024/01/04 04:39:33 - mmengine - INFO - Iter(train) [145500/640000] base_lr: 1.7581e-04 lr: 1.7800e-05 eta: 8 days, 10:47:51 time: 1.4709 data_time: 0.0266 memory: 25719 grad_norm: 2.6816 loss: 1.4368 detection_loss_cls: 0.0413 detection_loss_reg: 0.3630 caption_loss_cls: 2.4285 grounding_loss_reg: 2.9972 semantic_segmentation_loss_cls: 0.0105 instance_segmentation_loss_cls: 0.0381 instance_segmentation_loss_reg: 0.3564 instance_segmentation_loss_poly: 0.9844 +2024/01/04 04:52:20 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240103_132037 +2024/01/04 04:52:20 - mmengine - INFO - Iter(train) [146000/640000] base_lr: 1.7565e-04 lr: 1.7786e-05 eta: 8 days, 10:42:02 time: 1.4879 data_time: 0.0266 memory: 25719 grad_norm: 2.6037 loss: 1.4080 detection_loss_cls: 0.0412 detection_loss_reg: 0.3631 caption_loss_cls: 2.4269 grounding_loss_reg: 2.9960 semantic_segmentation_loss_cls: 0.0105 instance_segmentation_loss_cls: 0.0381 instance_segmentation_loss_reg: 0.3560 instance_segmentation_loss_poly: 0.9833 +2024/01/04 04:52:20 - mmengine - INFO - Saving checkpoint at 146000 iterations +2024/01/04 05:04:20 - mmengine - INFO - Iter(train) [146500/640000] base_lr: 1.7549e-04 lr: 1.7771e-05 eta: 8 days, 10:25:27 time: 1.4900 data_time: 0.0267 memory: 25719 grad_norm: 2.6005 loss: 1.4091 detection_loss_cls: 0.0412 detection_loss_reg: 0.3631 caption_loss_cls: 2.4268 grounding_loss_reg: 2.9921 semantic_segmentation_loss_cls: 0.0105 instance_segmentation_loss_cls: 0.0380 instance_segmentation_loss_reg: 0.3558 instance_segmentation_loss_poly: 0.9822 +2024/01/04 05:16:14 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240103_132037 +2024/01/04 05:16:14 - mmengine - INFO - Iter(train) [147000/640000] base_lr: 1.7533e-04 lr: 1.7757e-05 eta: 8 days, 10:07:46 time: 1.4898 data_time: 0.0268 memory: 25719 grad_norm: 2.6008 loss: 1.4109 detection_loss_cls: 0.0409 detection_loss_reg: 0.3609 caption_loss_cls: 2.4233 grounding_loss_reg: 2.9899 semantic_segmentation_loss_cls: 0.0105 instance_segmentation_loss_cls: 0.0380 instance_segmentation_loss_reg: 0.3558 instance_segmentation_loss_poly: 0.9827 +2024/01/04 05:28:45 - mmengine - INFO - Iter(train) [147500/640000] base_lr: 1.7516e-04 lr: 1.7742e-05 eta: 8 days, 9:58:16 time: 1.4964 data_time: 0.0269 memory: 25719 grad_norm: 2.6079 loss: 1.4040 detection_loss_cls: 0.0408 detection_loss_reg: 0.3600 caption_loss_cls: 2.4193 grounding_loss_reg: 2.9855 semantic_segmentation_loss_cls: 0.0105 instance_segmentation_loss_cls: 0.0378 instance_segmentation_loss_reg: 0.3538 instance_segmentation_loss_poly: 0.9783 +2024/01/04 05:40:50 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240103_132037 +2024/01/04 05:40:50 - mmengine - INFO - Iter(train) [148000/640000] base_lr: 1.7500e-04 lr: 1.7728e-05 eta: 8 days, 9:43:01 time: 1.4933 data_time: 0.0269 memory: 25719 grad_norm: 2.6300 loss: 1.4205 detection_loss_cls: 0.0409 detection_loss_reg: 0.3607 caption_loss_cls: 2.4228 grounding_loss_reg: 2.9839 semantic_segmentation_loss_cls: 0.0105 instance_segmentation_loss_cls: 0.0379 instance_segmentation_loss_reg: 0.3546 instance_segmentation_loss_poly: 0.9800 +2024/01/04 05:40:50 - mmengine - INFO - Saving checkpoint at 148000 iterations +2024/01/04 05:53:58 - mmengine - INFO - Iter(train) [148500/640000] base_lr: 1.7484e-04 lr: 1.7713e-05 eta: 8 days, 9:41:28 time: 1.5036 data_time: 0.0271 memory: 25719 grad_norm: 2.6280 loss: 1.4151 detection_loss_cls: 0.0407 detection_loss_reg: 0.3590 caption_loss_cls: 2.4216 grounding_loss_reg: 2.9837 semantic_segmentation_loss_cls: 0.0104 instance_segmentation_loss_cls: 0.0379 instance_segmentation_loss_reg: 0.3546 instance_segmentation_loss_poly: 0.9798 +2024/01/04 06:06:13 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240103_132037 +2024/01/04 06:06:13 - mmengine - INFO - Iter(train) [149000/640000] base_lr: 1.7468e-04 lr: 1.7698e-05 eta: 8 days, 9:28:20 time: 1.5008 data_time: 0.0270 memory: 25719 grad_norm: 2.6422 loss: 1.4140 detection_loss_cls: 0.0404 detection_loss_reg: 0.3572 caption_loss_cls: 2.4152 grounding_loss_reg: 2.9838 semantic_segmentation_loss_cls: 0.0104 instance_segmentation_loss_cls: 0.0376 instance_segmentation_loss_reg: 0.3525 instance_segmentation_loss_poly: 0.9746 +2024/01/04 06:18:33 - mmengine - INFO - Iter(train) [149500/640000] base_lr: 1.7452e-04 lr: 1.7683e-05 eta: 8 days, 9:16:16 time: 1.4846 data_time: 0.0264 memory: 25719 grad_norm: 2.7073 loss: 1.4068 detection_loss_cls: 0.0404 detection_loss_reg: 0.3573 caption_loss_cls: 2.4175 grounding_loss_reg: 2.9873 semantic_segmentation_loss_cls: 0.0104 instance_segmentation_loss_cls: 0.0375 instance_segmentation_loss_reg: 0.3512 instance_segmentation_loss_poly: 0.9718 +2024/01/04 06:31:12 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240103_132037 +2024/01/04 06:31:12 - mmengine - INFO - Iter(train) [150000/640000] base_lr: 1.7435e-04 lr: 1.7669e-05 eta: 8 days, 9:07:59 time: 1.4826 data_time: 0.0264 memory: 25719 grad_norm: 2.8260 loss: 1.4132 detection_loss_cls: 0.0402 detection_loss_reg: 0.3556 caption_loss_cls: 2.4240 grounding_loss_reg: 2.9853 semantic_segmentation_loss_cls: 0.0103 instance_segmentation_loss_cls: 0.0374 instance_segmentation_loss_reg: 0.3499 instance_segmentation_loss_poly: 0.9691 +2024/01/04 06:31:12 - mmengine - INFO - Saving checkpoint at 150000 iterations +2024/01/04 06:44:07 - mmengine - INFO - Iter(train) [150500/640000] base_lr: 1.7419e-04 lr: 1.7654e-05 eta: 8 days, 9:03:01 time: 1.4965 data_time: 0.0267 memory: 25719 grad_norm: 2.8016 loss: 1.4064 detection_loss_cls: 0.0399 detection_loss_reg: 0.3541 caption_loss_cls: 2.4245 grounding_loss_reg: 2.9828 semantic_segmentation_loss_cls: 0.0103 instance_segmentation_loss_cls: 0.0372 instance_segmentation_loss_reg: 0.3493 instance_segmentation_loss_poly: 0.9677 +2024/01/04 06:56:47 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240103_132037 +2024/01/04 06:56:47 - mmengine - INFO - Iter(train) [151000/640000] base_lr: 1.7403e-04 lr: 1.7639e-05 eta: 8 days, 8:54:47 time: 1.5080 data_time: 0.0267 memory: 25719 grad_norm: 2.7633 loss: 1.3862 detection_loss_cls: 0.0399 detection_loss_reg: 0.3549 caption_loss_cls: 2.4263 grounding_loss_reg: 2.9807 semantic_segmentation_loss_cls: 0.0104 instance_segmentation_loss_cls: 0.0371 instance_segmentation_loss_reg: 0.3483 instance_segmentation_loss_poly: 0.9655 +2024/01/04 07:09:01 - mmengine - INFO - Iter(train) [151500/640000] base_lr: 1.7386e-04 lr: 1.7624e-05 eta: 8 days, 8:41:15 time: 1.5036 data_time: 0.0269 memory: 25719 grad_norm: 2.7993 loss: 1.4048 detection_loss_cls: 0.0398 detection_loss_reg: 0.3542 caption_loss_cls: 2.4257 grounding_loss_reg: 2.9760 semantic_segmentation_loss_cls: 0.0104 instance_segmentation_loss_cls: 0.0371 instance_segmentation_loss_reg: 0.3495 instance_segmentation_loss_poly: 0.9667 +2024/01/04 07:21:21 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240103_132037 +2024/01/04 07:21:21 - mmengine - INFO - Iter(train) [152000/640000] base_lr: 1.7370e-04 lr: 1.7609e-05 eta: 8 days, 8:29:01 time: 1.5075 data_time: 0.0269 memory: 25719 grad_norm: 2.8050 loss: 1.3792 detection_loss_cls: 0.0397 detection_loss_reg: 0.3536 caption_loss_cls: 2.4231 grounding_loss_reg: 2.9737 semantic_segmentation_loss_cls: 0.0104 instance_segmentation_loss_cls: 0.0370 instance_segmentation_loss_reg: 0.3490 instance_segmentation_loss_poly: 0.9656 +2024/01/04 07:21:21 - mmengine - INFO - Saving checkpoint at 152000 iterations +2024/01/04 07:34:13 - mmengine - INFO - Iter(train) [152500/640000] base_lr: 1.7353e-04 lr: 1.7594e-05 eta: 8 days, 8:22:48 time: 1.5032 data_time: 0.0269 memory: 25719 grad_norm: 2.8180 loss: 1.3818 detection_loss_cls: 0.0395 detection_loss_reg: 0.3525 caption_loss_cls: 2.4241 grounding_loss_reg: 2.9707 semantic_segmentation_loss_cls: 0.0104 instance_segmentation_loss_cls: 0.0369 instance_segmentation_loss_reg: 0.3488 instance_segmentation_loss_poly: 0.9649 +2024/01/04 07:46:24 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240103_132037 +2024/01/04 07:46:24 - mmengine - INFO - Iter(train) [153000/640000] base_lr: 1.7337e-04 lr: 1.7579e-05 eta: 8 days, 8:08:47 time: 1.5023 data_time: 0.0270 memory: 25719 grad_norm: 2.7943 loss: 1.3867 detection_loss_cls: 0.0394 detection_loss_reg: 0.3530 caption_loss_cls: 2.4245 grounding_loss_reg: 2.9657 semantic_segmentation_loss_cls: 0.0103 instance_segmentation_loss_cls: 0.0368 instance_segmentation_loss_reg: 0.3487 instance_segmentation_loss_poly: 0.9644 +2024/01/04 07:58:58 - mmengine - INFO - Iter(train) [153500/640000] base_lr: 1.7320e-04 lr: 1.7564e-05 eta: 8 days, 7:59:11 time: 1.5059 data_time: 0.0271 memory: 25719 grad_norm: 2.7528 loss: 1.3889 detection_loss_cls: 0.0394 detection_loss_reg: 0.3526 caption_loss_cls: 2.4243 grounding_loss_reg: 2.9643 semantic_segmentation_loss_cls: 0.0104 instance_segmentation_loss_cls: 0.0367 instance_segmentation_loss_reg: 0.3484 instance_segmentation_loss_poly: 0.9630 +2024/01/04 08:10:41 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240103_132037 +2024/01/04 08:10:41 - mmengine - INFO - Iter(train) [154000/640000] base_lr: 1.7304e-04 lr: 1.7549e-05 eta: 8 days, 7:40:03 time: 1.4921 data_time: 0.0270 memory: 25719 grad_norm: 2.7222 loss: 1.4047 detection_loss_cls: 0.0395 detection_loss_reg: 0.3532 caption_loss_cls: 2.4222 grounding_loss_reg: 2.9610 semantic_segmentation_loss_cls: 0.0104 instance_segmentation_loss_cls: 0.0366 instance_segmentation_loss_reg: 0.3474 instance_segmentation_loss_poly: 0.9621 +2024/01/04 08:10:41 - mmengine - INFO - Saving checkpoint at 154000 iterations +2024/01/04 08:24:20 - mmengine - INFO - Iter(train) [154500/640000] base_lr: 1.7287e-04 lr: 1.7533e-05 eta: 8 days, 7:42:06 time: 1.5029 data_time: 0.0272 memory: 25719 grad_norm: 2.6927 loss: 1.3946 detection_loss_cls: 0.0394 detection_loss_reg: 0.3533 caption_loss_cls: 2.4200 grounding_loss_reg: 2.9625 semantic_segmentation_loss_cls: 0.0103 instance_segmentation_loss_cls: 0.0365 instance_segmentation_loss_reg: 0.3474 instance_segmentation_loss_poly: 0.9607 +2024/01/04 08:37:13 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240103_132037 +2024/01/04 08:37:13 - mmengine - INFO - Iter(train) [155000/640000] base_lr: 1.7270e-04 lr: 1.7518e-05 eta: 8 days, 7:35:28 time: 1.5060 data_time: 0.0273 memory: 25719 grad_norm: 2.7150 loss: 1.4065 detection_loss_cls: 0.0395 detection_loss_reg: 0.3538 caption_loss_cls: 2.4239 grounding_loss_reg: 2.9600 semantic_segmentation_loss_cls: 0.0103 instance_segmentation_loss_cls: 0.0365 instance_segmentation_loss_reg: 0.3465 instance_segmentation_loss_poly: 0.9574 +2024/01/04 08:49:22 - mmengine - INFO - Iter(train) [155500/640000] base_lr: 1.7253e-04 lr: 1.7503e-05 eta: 8 days, 7:21:08 time: 1.5050 data_time: 0.0270 memory: 25719 grad_norm: 2.6828 loss: 1.4042 detection_loss_cls: 0.0395 detection_loss_reg: 0.3535 caption_loss_cls: 2.4261 grounding_loss_reg: 2.9621 semantic_segmentation_loss_cls: 0.0103 instance_segmentation_loss_cls: 0.0365 instance_segmentation_loss_reg: 0.3464 instance_segmentation_loss_poly: 0.9567 +2024/01/04 09:01:47 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240103_132037 +2024/01/04 09:01:47 - mmengine - INFO - Iter(train) [156000/640000] base_lr: 1.7236e-04 lr: 1.7488e-05 eta: 8 days, 7:09:29 time: 1.5062 data_time: 0.0271 memory: 25719 grad_norm: 2.6683 loss: 1.4090 detection_loss_cls: 0.0394 detection_loss_reg: 0.3527 caption_loss_cls: 2.4227 grounding_loss_reg: 2.9616 semantic_segmentation_loss_cls: 0.0103 instance_segmentation_loss_cls: 0.0364 instance_segmentation_loss_reg: 0.3458 instance_segmentation_loss_poly: 0.9543 +2024/01/04 09:01:47 - mmengine - INFO - Saving checkpoint at 156000 iterations +2024/01/04 09:13:59 - mmengine - INFO - Iter(train) [156500/640000] base_lr: 1.7220e-04 lr: 1.7472e-05 eta: 8 days, 6:55:40 time: 1.4963 data_time: 0.0268 memory: 25719 grad_norm: 2.6963 loss: 1.4182 detection_loss_cls: 0.0394 detection_loss_reg: 0.3514 caption_loss_cls: 2.4251 grounding_loss_reg: 2.9624 semantic_segmentation_loss_cls: 0.0103 instance_segmentation_loss_cls: 0.0363 instance_segmentation_loss_reg: 0.3445 instance_segmentation_loss_poly: 0.9510 +2024/01/04 09:26:40 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240103_132037 +2024/01/04 09:26:40 - mmengine - INFO - Iter(train) [157000/640000] base_lr: 1.7203e-04 lr: 1.7457e-05 eta: 8 days, 6:46:41 time: 1.5036 data_time: 0.0268 memory: 25719 grad_norm: 2.7483 loss: 1.4073 detection_loss_cls: 0.0393 detection_loss_reg: 0.3504 caption_loss_cls: 2.4255 grounding_loss_reg: 2.9619 semantic_segmentation_loss_cls: 0.0103 instance_segmentation_loss_cls: 0.0365 instance_segmentation_loss_reg: 0.3444 instance_segmentation_loss_poly: 0.9499 +2024/01/04 09:38:26 - mmengine - INFO - Iter(train) [157500/640000] base_lr: 1.7186e-04 lr: 1.7442e-05 eta: 8 days, 6:28:23 time: 1.4915 data_time: 0.0266 memory: 25719 grad_norm: 2.8326 loss: 1.4181 detection_loss_cls: 0.0393 detection_loss_reg: 0.3499 caption_loss_cls: 2.4264 grounding_loss_reg: 2.9603 semantic_segmentation_loss_cls: 0.0103 instance_segmentation_loss_cls: 0.0365 instance_segmentation_loss_reg: 0.3444 instance_segmentation_loss_poly: 0.9493 +2024/01/04 09:50:27 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240103_132037 +2024/01/04 09:50:27 - mmengine - INFO - Iter(train) [158000/640000] base_lr: 1.7169e-04 lr: 1.7426e-05 eta: 8 days, 6:12:46 time: 1.4959 data_time: 0.0267 memory: 25719 grad_norm: 2.8027 loss: 1.4129 detection_loss_cls: 0.0392 detection_loss_reg: 0.3492 caption_loss_cls: 2.4220 grounding_loss_reg: 2.9569 semantic_segmentation_loss_cls: 0.0103 instance_segmentation_loss_cls: 0.0367 instance_segmentation_loss_reg: 0.3459 instance_segmentation_loss_poly: 0.9537 +2024/01/04 09:50:27 - mmengine - INFO - Saving checkpoint at 158000 iterations +2024/01/04 10:02:59 - mmengine - INFO - Iter(train) [158500/640000] base_lr: 1.7152e-04 lr: 1.7411e-05 eta: 8 days, 6:02:30 time: 1.4795 data_time: 0.0264 memory: 25719 grad_norm: 2.8434 loss: 1.4170 detection_loss_cls: 0.0393 detection_loss_reg: 0.3497 caption_loss_cls: 2.4224 grounding_loss_reg: 2.9563 semantic_segmentation_loss_cls: 0.0103 instance_segmentation_loss_cls: 0.0367 instance_segmentation_loss_reg: 0.3457 instance_segmentation_loss_poly: 0.9532 +2024/01/04 10:15:49 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240103_132037 +2024/01/04 10:15:49 - mmengine - INFO - Iter(train) [159000/640000] base_lr: 1.7135e-04 lr: 1.7395e-05 eta: 8 days, 5:54:58 time: 1.4789 data_time: 0.0265 memory: 25719 grad_norm: 2.8624 loss: 1.4216 detection_loss_cls: 0.0393 detection_loss_reg: 0.3500 caption_loss_cls: 2.4235 grounding_loss_reg: 2.9605 semantic_segmentation_loss_cls: 0.0103 instance_segmentation_loss_cls: 0.0367 instance_segmentation_loss_reg: 0.3458 instance_segmentation_loss_poly: 0.9517 +2024/01/04 10:28:22 - mmengine - INFO - Iter(train) [159500/640000] base_lr: 1.7118e-04 lr: 1.7380e-05 eta: 8 days, 5:44:28 time: 1.4845 data_time: 0.0265 memory: 25719 grad_norm: 2.8533 loss: 1.4079 detection_loss_cls: 0.0394 detection_loss_reg: 0.3504 caption_loss_cls: 2.4198 grounding_loss_reg: 2.9599 semantic_segmentation_loss_cls: 0.0103 instance_segmentation_loss_cls: 0.0366 instance_segmentation_loss_reg: 0.3447 instance_segmentation_loss_poly: 0.9489 +2024/01/04 10:40:43 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240103_132037 +2024/01/04 10:40:43 - mmengine - INFO - Iter(train) [160000/640000] base_lr: 1.7100e-04 lr: 1.7364e-05 eta: 8 days, 5:32:07 time: 1.4835 data_time: 0.0264 memory: 25719 grad_norm: 2.9351 loss: 1.4058 detection_loss_cls: 0.0393 detection_loss_reg: 0.3494 caption_loss_cls: 2.4179 grounding_loss_reg: 2.9572 semantic_segmentation_loss_cls: 0.0103 instance_segmentation_loss_cls: 0.0363 instance_segmentation_loss_reg: 0.3424 instance_segmentation_loss_poly: 0.9435 +2024/01/04 10:40:43 - mmengine - INFO - Saving checkpoint at 160000 iterations +2024/01/04 10:53:34 - mmengine - INFO - Evaluating bbox... +2024/01/04 10:54:31 - mmengine - INFO - bbox_mAP_copypaste: 0.454 0.635 0.498 0.308 0.499 0.578 +2024/01/04 10:54:31 - mmengine - INFO - Evaluating segm... +2024/01/04 10:55:44 - mmengine - INFO - segm_mAP_copypaste: 0.296 0.544 0.286 0.158 0.340 0.455 +2024/01/04 11:02:09 - mmengine - INFO - per class results: +2024/01/04 11:02:09 - mmengine - INFO - ++---------------------+-------+-------+ +| Class | IoU | Acc | ++---------------------+-------+-------+ +| wall | 77.04 | 87.26 | +| building | 80.48 | 86.36 | +| sky | 92.96 | 98.08 | +| floor | 81.86 | 89.07 | +| tree | 72.21 | 88.77 | +| ceiling | 83.6 | 92.6 | +| road | 81.29 | 86.99 | +| bed | 88.11 | 93.87 | +| windowpane | 57.71 | 78.63 | +| grass | 66.36 | 81.97 | +| cabinet | 57.6 | 68.89 | +| sidewalk | 62.87 | 82.2 | +| person | 79.5 | 92.92 | +| earth | 37.4 | 50.15 | +| door | 47.08 | 59.39 | +| table | 61.38 | 79.1 | +| mountain | 60.51 | 75.3 | +| plant | 51.72 | 64.34 | +| curtain | 72.24 | 85.34 | +| chair | 56.39 | 67.86 | +| car | 83.18 | 91.37 | +| water | 51.06 | 61.65 | +| painting | 70.81 | 86.39 | +| sofa | 68.18 | 85.4 | +| shelf | 40.98 | 51.88 | +| house | 42.56 | 83.17 | +| sea | 57.15 | 65.78 | +| mirror | 66.63 | 76.79 | +| rug | 67.56 | 77.85 | +| field | 26.62 | 43.58 | +| armchair | 40.75 | 64.0 | +| seat | 63.63 | 81.47 | +| fence | 43.96 | 55.97 | +| desk | 46.6 | 59.07 | +| rock | 50.18 | 71.71 | +| wardrobe | 42.5 | 63.49 | +| lamp | 59.99 | 75.57 | +| bathtub | 76.5 | 83.14 | +| railing | 32.27 | 46.53 | +| cushion | 56.21 | 69.3 | +| base | 28.07 | 43.25 | +| box | 24.73 | 43.07 | +| column | 46.94 | 70.04 | +| signboard | 37.76 | 58.85 | +| chest of drawers | 42.03 | 60.11 | +| counter | 31.4 | 43.46 | +| sand | 47.11 | 64.04 | +| sink | 69.82 | 80.93 | +| skyscraper | 66.62 | 93.73 | +| fireplace | 70.49 | 89.08 | +| refrigerator | 77.21 | 83.76 | +| grandstand | 33.02 | 77.47 | +| path | 20.21 | 36.81 | +| stairs | 27.0 | 33.48 | +| runway | 65.25 | 74.02 | +| case | 50.13 | 57.11 | +| pool table | 91.39 | 94.93 | +| pillow | 56.43 | 72.85 | +| screen door | 57.78 | 58.69 | +| stairway | 31.52 | 54.87 | +| river | 15.6 | 56.99 | +| bridge | 71.76 | 84.46 | +| bookcase | 35.12 | 67.29 | +| blind | 44.67 | 68.71 | +| coffee table | 60.59 | 80.15 | +| toilet | 83.73 | 89.48 | +| flower | 30.65 | 49.48 | +| book | 42.14 | 52.62 | +| hill | 11.32 | 17.71 | +| bench | 55.84 | 70.41 | +| countertop | 51.64 | 56.04 | +| stove | 72.74 | 82.97 | +| palm | 21.46 | 21.96 | +| kitchen island | 42.39 | 66.64 | +| computer | 61.88 | 70.23 | +| swivel chair | 47.6 | 63.4 | +| boat | 75.63 | 83.72 | +| bar | 44.09 | 56.06 | +| arcade machine | 45.83 | 73.87 | +| hovel | 27.89 | 30.5 | +| bus | 87.37 | 95.02 | +| towel | 58.75 | 80.04 | +| light | 51.95 | 63.45 | +| truck | 35.07 | 58.95 | +| tower | 19.8 | 33.97 | +| chandelier | 63.29 | 85.01 | +| awning | 33.52 | 39.94 | +| streetlight | 32.52 | 49.13 | +| booth | 40.34 | 52.36 | +| television receiver | 62.8 | 82.8 | +| airplane | 54.13 | 71.02 | +| dirt track | 0.0 | 0.0 | +| apparel | 24.36 | 43.31 | +| pole | 23.91 | 39.32 | +| land | 2.54 | 3.0 | +| bannister | 16.14 | 24.35 | +| escalator | 19.93 | 21.21 | +| ottoman | 50.33 | 66.27 | +| bottle | 33.52 | 40.31 | +| buffet | 58.38 | 79.52 | +| poster | 22.73 | 27.52 | +| stage | 9.91 | 22.19 | +| van | 47.74 | 67.27 | +| ship | 35.79 | 40.48 | +| fountain | 6.8 | 7.02 | +| conveyer belt | 68.35 | 90.66 | +| canopy | 22.3 | 36.48 | +| washer | 70.9 | 73.43 | +| plaything | 30.01 | 50.71 | +| swimming pool | 67.99 | 74.2 | +| stool | 46.52 | 62.53 | +| barrel | 53.23 | 67.8 | +| basket | 33.62 | 58.85 | +| waterfall | 60.06 | 80.36 | +| tent | 85.23 | 96.62 | +| bag | 14.64 | 17.51 | +| minibike | 71.09 | 81.6 | +| cradle | 78.94 | 95.94 | +| oven | 30.07 | 72.78 | +| ball | 37.69 | 45.6 | +| food | 49.63 | 53.33 | +| step | 17.27 | 23.42 | +| tank | 37.87 | 55.47 | +| trade name | 21.88 | 25.89 | +| microwave | 58.25 | 61.03 | +| pot | 42.81 | 50.06 | +| animal | 69.29 | 74.64 | +| bicycle | 58.19 | 72.08 | +| lake | 60.32 | 63.55 | +| dishwasher | 55.91 | 72.64 | +| screen | 62.29 | 88.96 | +| blanket | 20.43 | 27.99 | +| sculpture | 39.75 | 56.62 | +| hood | 54.3 | 56.54 | +| sconce | 36.58 | 47.56 | +| vase | 37.84 | 46.63 | +| traffic light | 34.77 | 56.58 | +| tray | 8.65 | 18.43 | +| ashcan | 38.31 | 43.59 | +| fan | 56.83 | 79.07 | +| pier | 29.48 | 36.39 | +| crt screen | 7.25 | 12.28 | +| plate | 52.47 | 64.93 | +| monitor | 29.53 | 41.15 | +| bulletin board | 33.45 | 59.22 | +| shower | 0.0 | 0.0 | +| radiator | 59.01 | 66.57 | +| glass | 17.46 | 19.33 | +| clock | 22.59 | 32.27 | +| flag | 42.12 | 47.0 | ++---------------------+-------+-------+ +2024/01/04 11:02:25 - mmengine - INFO - Iter(val) [209/209] coco/bbox_mAP: 0.4540 coco/bbox_mAP_50: 0.6350 coco/bbox_mAP_75: 0.4980 coco/bbox_mAP_s: 0.3080 coco/bbox_mAP_m: 0.4990 coco/bbox_mAP_l: 0.5780 coco/segm_mAP: 0.2960 coco/segm_mAP_50: 0.5440 coco/segm_mAP_75: 0.2860 coco/segm_mAP_s: 0.1580 coco/segm_mAP_m: 0.3400 coco/segm_mAP_l: 0.4550 Bleu_1: 0.7128 Bleu_2: 0.5412 Bleu_3: 0.4000 Bleu_4: 0.2911 METEOR: 0.2500 ROUGE_L: 0.5241 CIDEr: 0.9335 SPICE: 0.1810 aAcc: 82.0700 mIoU: 47.9300 mAcc: 61.2500 visual-grounding/miou: 0.7559 visual-grounding/acc: 0.8282 data_time: 0.0051 time: 1.3570 +2024/01/04 11:14:43 - mmengine - INFO - Iter(train) [160500/640000] base_lr: 1.7083e-04 lr: 1.7348e-05 eta: 8 days, 5:19:32 time: 1.4853 data_time: 0.0221 memory: 25719 grad_norm: 2.9082 loss: 1.3880 detection_loss_cls: 0.0392 detection_loss_reg: 0.3484 caption_loss_cls: 2.4120 grounding_loss_reg: 2.9554 semantic_segmentation_loss_cls: 0.0102 instance_segmentation_loss_cls: 0.0362 instance_segmentation_loss_reg: 0.3405 instance_segmentation_loss_poly: 0.9395 +2024/01/04 11:26:58 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240103_132037 +2024/01/04 11:26:58 - mmengine - INFO - Iter(train) [161000/640000] base_lr: 1.7066e-04 lr: 1.7333e-05 eta: 8 days, 5:06:14 time: 1.4789 data_time: 0.0220 memory: 25719 grad_norm: 2.8498 loss: 1.3860 detection_loss_cls: 0.0393 detection_loss_reg: 0.3487 caption_loss_cls: 2.4012 grounding_loss_reg: 2.9548 semantic_segmentation_loss_cls: 0.0102 instance_segmentation_loss_cls: 0.0362 instance_segmentation_loss_reg: 0.3402 instance_segmentation_loss_poly: 0.9385 +2024/01/04 11:38:55 - mmengine - INFO - Iter(train) [161500/640000] base_lr: 1.7049e-04 lr: 1.7317e-05 eta: 8 days, 4:50:17 time: 1.4818 data_time: 0.0221 memory: 25719 grad_norm: 2.7913 loss: 1.3818 detection_loss_cls: 0.0392 detection_loss_reg: 0.3488 caption_loss_cls: 2.3973 grounding_loss_reg: 2.9571 semantic_segmentation_loss_cls: 0.0102 instance_segmentation_loss_cls: 0.0362 instance_segmentation_loss_reg: 0.3407 instance_segmentation_loss_poly: 0.9404 +2024/01/04 11:50:58 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240103_132037 +2024/01/04 11:50:58 - mmengine - INFO - Iter(train) [162000/640000] base_lr: 1.7031e-04 lr: 1.7301e-05 eta: 8 days, 4:35:08 time: 1.4822 data_time: 0.0221 memory: 25719 grad_norm: 2.7852 loss: 1.3745 detection_loss_cls: 0.0390 detection_loss_reg: 0.3470 caption_loss_cls: 2.3943 grounding_loss_reg: 2.9539 semantic_segmentation_loss_cls: 0.0102 instance_segmentation_loss_cls: 0.0361 instance_segmentation_loss_reg: 0.3400 instance_segmentation_loss_poly: 0.9380 +2024/01/04 11:50:58 - mmengine - INFO - Saving checkpoint at 162000 iterations +2024/01/04 12:03:47 - mmengine - INFO - Iter(train) [162500/640000] base_lr: 1.7014e-04 lr: 1.7285e-05 eta: 8 days, 4:27:15 time: 1.4864 data_time: 0.0222 memory: 25719 grad_norm: 2.7988 loss: 1.3790 detection_loss_cls: 0.0389 detection_loss_reg: 0.3463 caption_loss_cls: 2.3919 grounding_loss_reg: 2.9519 semantic_segmentation_loss_cls: 0.0102 instance_segmentation_loss_cls: 0.0360 instance_segmentation_loss_reg: 0.3392 instance_segmentation_loss_poly: 0.9364 +2024/01/04 12:16:18 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240103_132037 +2024/01/04 12:16:18 - mmengine - INFO - Iter(train) [163000/640000] base_lr: 1.6997e-04 lr: 1.7270e-05 eta: 8 days, 4:16:21 time: 1.4815 data_time: 0.0221 memory: 25719 grad_norm: 2.8012 loss: 1.3784 detection_loss_cls: 0.0388 detection_loss_reg: 0.3467 caption_loss_cls: 2.3932 grounding_loss_reg: 2.9533 semantic_segmentation_loss_cls: 0.0102 instance_segmentation_loss_cls: 0.0360 instance_segmentation_loss_reg: 0.3394 instance_segmentation_loss_poly: 0.9359 +2024/01/04 12:28:13 - mmengine - INFO - Iter(train) [163500/640000] base_lr: 1.6979e-04 lr: 1.7254e-05 eta: 8 days, 4:00:14 time: 1.4723 data_time: 0.0218 memory: 25719 grad_norm: 2.7831 loss: 1.3674 detection_loss_cls: 0.0387 detection_loss_reg: 0.3446 caption_loss_cls: 2.3947 grounding_loss_reg: 2.9488 semantic_segmentation_loss_cls: 0.0102 instance_segmentation_loss_cls: 0.0359 instance_segmentation_loss_reg: 0.3379 instance_segmentation_loss_poly: 0.9326 +2024/01/04 12:40:41 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240103_132037 +2024/01/04 12:40:41 - mmengine - INFO - Iter(train) [164000/640000] base_lr: 1.6962e-04 lr: 1.7238e-05 eta: 8 days, 3:49:01 time: 1.4741 data_time: 0.0219 memory: 25719 grad_norm: 2.7199 loss: 1.3737 detection_loss_cls: 0.0385 detection_loss_reg: 0.3437 caption_loss_cls: 2.3953 grounding_loss_reg: 2.9516 semantic_segmentation_loss_cls: 0.0102 instance_segmentation_loss_cls: 0.0358 instance_segmentation_loss_reg: 0.3373 instance_segmentation_loss_poly: 0.9324 +2024/01/04 12:40:41 - mmengine - INFO - Saving checkpoint at 164000 iterations +2024/01/04 12:53:03 - mmengine - INFO - Iter(train) [164500/640000] base_lr: 1.6944e-04 lr: 1.7222e-05 eta: 8 days, 3:36:52 time: 1.4748 data_time: 0.0262 memory: 25719 grad_norm: 2.7443 loss: 1.3949 detection_loss_cls: 0.0387 detection_loss_reg: 0.3455 caption_loss_cls: 2.3987 grounding_loss_reg: 2.9511 semantic_segmentation_loss_cls: 0.0102 instance_segmentation_loss_cls: 0.0356 instance_segmentation_loss_reg: 0.3370 instance_segmentation_loss_poly: 0.9310 +2024/01/04 13:05:52 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240103_132037 +2024/01/04 14:10:47 - mmengine - INFO - Iter(train) [165000/640000] base_lr: 1.6926e-04 lr: 1.7206e-05 eta: 8 days, 3:15:02 time: 1.4756 data_time: 0.0211 memory: 25719 grad_norm: 2.8234 loss: 1.3922 detection_loss_cls: 0.0383 detection_loss_reg: 0.3415 caption_loss_cls: 2.3992 grounding_loss_reg: 2.9445 semantic_segmentation_loss_cls: 0.0102 instance_segmentation_loss_cls: 0.0354 instance_segmentation_loss_reg: 0.3351 instance_segmentation_loss_poly: 0.9277 +2024/01/04 14:23:00 - mmengine - INFO - Iter(train) [165500/640000] base_lr: 1.6909e-04 lr: 1.7190e-05 eta: 8 days, 2:22:00 time: 1.4793 data_time: 0.0207 memory: 25719 grad_norm: 2.8302 loss: 1.3809 detection_loss_cls: 0.0382 detection_loss_reg: 0.3414 caption_loss_cls: 2.3960 grounding_loss_reg: 2.9464 semantic_segmentation_loss_cls: 0.0102 instance_segmentation_loss_cls: 0.0353 instance_segmentation_loss_reg: 0.3343 instance_segmentation_loss_poly: 0.9266 +2024/01/04 14:35:11 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240104_134302 +2024/01/04 14:35:11 - mmengine - INFO - Iter(train) [166000/640000] base_lr: 1.6891e-04 lr: 1.7174e-05 eta: 8 days, 1:47:18 time: 1.4817 data_time: 0.0204 memory: 25719 grad_norm: 2.8603 loss: 1.3783 detection_loss_cls: 0.0381 detection_loss_reg: 0.3405 caption_loss_cls: 2.3974 grounding_loss_reg: 2.9416 semantic_segmentation_loss_cls: 0.0101 instance_segmentation_loss_cls: 0.0352 instance_segmentation_loss_reg: 0.3339 instance_segmentation_loss_poly: 0.9264 +2024/01/04 14:35:11 - mmengine - INFO - Saving checkpoint at 166000 iterations +2024/01/04 14:47:53 - mmengine - INFO - Iter(train) [166500/640000] base_lr: 1.6874e-04 lr: 1.7158e-05 eta: 8 days, 2:54:46 time: 1.4796 data_time: 0.0198 memory: 25719 grad_norm: 2.8535 loss: 1.3742 detection_loss_cls: 0.0379 detection_loss_reg: 0.3391 caption_loss_cls: 2.3956 grounding_loss_reg: 2.9407 semantic_segmentation_loss_cls: 0.0102 instance_segmentation_loss_cls: 0.0350 instance_segmentation_loss_reg: 0.3324 instance_segmentation_loss_poly: 0.9223 +2024/01/04 15:00:05 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240104_134302 +2024/01/04 15:00:05 - mmengine - INFO - Iter(train) [167000/640000] base_lr: 1.6856e-04 lr: 1.7142e-05 eta: 8 days, 2:19:30 time: 1.4751 data_time: 0.0195 memory: 25719 grad_norm: 2.8319 loss: 1.3700 detection_loss_cls: 0.0380 detection_loss_reg: 0.3401 caption_loss_cls: 2.3936 grounding_loss_reg: 2.9388 semantic_segmentation_loss_cls: 0.0101 instance_segmentation_loss_cls: 0.0350 instance_segmentation_loss_reg: 0.3326 instance_segmentation_loss_poly: 0.9232 +2024/01/04 15:12:05 - mmengine - INFO - Iter(train) [167500/640000] base_lr: 1.6838e-04 lr: 1.7125e-05 eta: 8 days, 1:23:07 time: 1.4762 data_time: 0.0195 memory: 25719 grad_norm: 2.9688 loss: 1.3857 detection_loss_cls: 0.0382 detection_loss_reg: 0.3413 caption_loss_cls: 2.3899 grounding_loss_reg: 2.9385 semantic_segmentation_loss_cls: 0.0101 instance_segmentation_loss_cls: 0.0351 instance_segmentation_loss_reg: 0.3332 instance_segmentation_loss_poly: 0.9255 +2024/01/04 15:24:38 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240104_134302 +2024/01/04 15:24:38 - mmengine - INFO - Iter(train) [168000/640000] base_lr: 1.6820e-04 lr: 1.7109e-05 eta: 8 days, 1:42:28 time: 1.4774 data_time: 0.0194 memory: 25719 grad_norm: 2.9906 loss: 1.3731 detection_loss_cls: 0.0380 detection_loss_reg: 0.3406 caption_loss_cls: 2.3797 grounding_loss_reg: 2.9392 semantic_segmentation_loss_cls: 0.0101 instance_segmentation_loss_cls: 0.0351 instance_segmentation_loss_reg: 0.3330 instance_segmentation_loss_poly: 0.9242 +2024/01/04 15:24:38 - mmengine - INFO - Saving checkpoint at 168000 iterations +2024/01/04 15:36:24 - mmengine - INFO - Iter(train) [168500/640000] base_lr: 1.6802e-04 lr: 1.7093e-05 eta: 8 days, 0:32:50 time: 1.4698 data_time: 0.0239 memory: 25719 grad_norm: 3.0801 loss: 1.3856 detection_loss_cls: 0.0380 detection_loss_reg: 0.3411 caption_loss_cls: 2.3743 grounding_loss_reg: 2.9352 semantic_segmentation_loss_cls: 0.0101 instance_segmentation_loss_cls: 0.0351 instance_segmentation_loss_reg: 0.3330 instance_segmentation_loss_poly: 0.9229 +2024/01/04 15:49:12 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240104_134302 +2024/01/04 15:49:12 - mmengine - INFO - Iter(train) [169000/640000] base_lr: 1.6784e-04 lr: 1.7077e-05 eta: 8 days, 1:12:17 time: 1.4760 data_time: 0.0241 memory: 25719 grad_norm: 3.0771 loss: 1.3751 detection_loss_cls: 0.0381 detection_loss_reg: 0.3416 caption_loss_cls: 2.3756 grounding_loss_reg: 2.9321 semantic_segmentation_loss_cls: 0.0101 instance_segmentation_loss_cls: 0.0352 instance_segmentation_loss_reg: 0.3347 instance_segmentation_loss_poly: 0.9269 +2024/01/04 16:01:30 - mmengine - INFO - Iter(train) [169500/640000] base_lr: 1.6766e-04 lr: 1.7060e-05 eta: 8 days, 0:58:40 time: 1.4773 data_time: 0.0242 memory: 25719 grad_norm: 3.0821 loss: 1.3720 detection_loss_cls: 0.0379 detection_loss_reg: 0.3408 caption_loss_cls: 2.3687 grounding_loss_reg: 2.9276 semantic_segmentation_loss_cls: 0.0101 instance_segmentation_loss_cls: 0.0350 instance_segmentation_loss_reg: 0.3337 instance_segmentation_loss_poly: 0.9251 +2024/01/04 16:13:43 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240104_134302 +2024/01/04 16:13:43 - mmengine - INFO - Iter(train) [170000/640000] base_lr: 1.6748e-04 lr: 1.7044e-05 eta: 8 days, 0:40:00 time: 1.4777 data_time: 0.0243 memory: 25719 grad_norm: 3.0506 loss: 1.3777 detection_loss_cls: 0.0379 detection_loss_reg: 0.3404 caption_loss_cls: 2.3623 grounding_loss_reg: 2.9243 semantic_segmentation_loss_cls: 0.0101 instance_segmentation_loss_cls: 0.0350 instance_segmentation_loss_reg: 0.3331 instance_segmentation_loss_poly: 0.9246 +2024/01/04 16:13:43 - mmengine - INFO - Saving checkpoint at 170000 iterations +2024/01/04 16:25:41 - mmengine - INFO - Iter(train) [170500/640000] base_lr: 1.6730e-04 lr: 1.7028e-05 eta: 8 days, 0:03:16 time: 1.4668 data_time: 0.0242 memory: 25719 grad_norm: 3.0609 loss: 1.3811 detection_loss_cls: 0.0379 detection_loss_reg: 0.3410 caption_loss_cls: 2.3559 grounding_loss_reg: 2.9221 semantic_segmentation_loss_cls: 0.0101 instance_segmentation_loss_cls: 0.0349 instance_segmentation_loss_reg: 0.3332 instance_segmentation_loss_poly: 0.9246 +2024/01/04 16:37:46 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240104_134302 +2024/01/04 16:37:46 - mmengine - INFO - Iter(train) [171000/640000] base_lr: 1.6712e-04 lr: 1.7011e-05 eta: 7 days, 23:38:02 time: 1.4649 data_time: 0.0240 memory: 25719 grad_norm: 3.0608 loss: 1.3787 detection_loss_cls: 0.0379 detection_loss_reg: 0.3404 caption_loss_cls: 2.3552 grounding_loss_reg: 2.9208 semantic_segmentation_loss_cls: 0.0101 instance_segmentation_loss_cls: 0.0349 instance_segmentation_loss_reg: 0.3339 instance_segmentation_loss_poly: 0.9260 +2024/01/04 16:50:10 - mmengine - INFO - Iter(train) [171500/640000] base_lr: 1.6694e-04 lr: 1.6995e-05 eta: 7 days, 23:33:54 time: 1.4708 data_time: 0.0242 memory: 25719 grad_norm: 2.9737 loss: 1.3752 detection_loss_cls: 0.0379 detection_loss_reg: 0.3403 caption_loss_cls: 2.3508 grounding_loss_reg: 2.9210 semantic_segmentation_loss_cls: 0.0101 instance_segmentation_loss_cls: 0.0348 instance_segmentation_loss_reg: 0.3319 instance_segmentation_loss_poly: 0.9225 +2024/01/04 17:02:25 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240104_134302 +2024/01/04 17:02:25 - mmengine - INFO - Iter(train) [172000/640000] base_lr: 1.6676e-04 lr: 1.6978e-05 eta: 7 days, 23:21:22 time: 1.4665 data_time: 0.0242 memory: 25719 grad_norm: 2.9676 loss: 1.3955 detection_loss_cls: 0.0379 detection_loss_reg: 0.3399 caption_loss_cls: 2.3522 grounding_loss_reg: 2.9198 semantic_segmentation_loss_cls: 0.0101 instance_segmentation_loss_cls: 0.0348 instance_segmentation_loss_reg: 0.3332 instance_segmentation_loss_poly: 0.9249 +2024/01/04 17:02:25 - mmengine - INFO - Saving checkpoint at 172000 iterations +2024/01/04 17:14:53 - mmengine - INFO - Iter(train) [172500/640000] base_lr: 1.6658e-04 lr: 1.6962e-05 eta: 7 days, 23:19:12 time: 1.4768 data_time: 0.0243 memory: 25719 grad_norm: 2.8573 loss: 1.3890 detection_loss_cls: 0.0379 detection_loss_reg: 0.3408 caption_loss_cls: 2.3510 grounding_loss_reg: 2.9182 semantic_segmentation_loss_cls: 0.0101 instance_segmentation_loss_cls: 0.0347 instance_segmentation_loss_reg: 0.3333 instance_segmentation_loss_poly: 0.9254 +2024/01/04 17:27:06 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240104_134302 +2024/01/04 17:27:06 - mmengine - INFO - Iter(train) [173000/640000] base_lr: 1.6640e-04 lr: 1.6945e-05 eta: 7 days, 23:04:19 time: 1.4682 data_time: 0.0241 memory: 25719 grad_norm: 2.8054 loss: 1.3889 detection_loss_cls: 0.0379 detection_loss_reg: 0.3407 caption_loss_cls: 2.3490 grounding_loss_reg: 2.9159 semantic_segmentation_loss_cls: 0.0101 instance_segmentation_loss_cls: 0.0347 instance_segmentation_loss_reg: 0.3334 instance_segmentation_loss_poly: 0.9261 +2024/01/04 17:40:14 - mmengine - INFO - Iter(train) [173500/640000] base_lr: 1.6621e-04 lr: 1.6929e-05 eta: 7 days, 23:34:08 time: 1.4808 data_time: 0.0245 memory: 25719 grad_norm: 2.7627 loss: 1.3926 detection_loss_cls: 0.0381 detection_loss_reg: 0.3425 caption_loss_cls: 2.3491 grounding_loss_reg: 2.9164 semantic_segmentation_loss_cls: 0.0101 instance_segmentation_loss_cls: 0.0348 instance_segmentation_loss_reg: 0.3344 instance_segmentation_loss_poly: 0.9282 +2024/01/04 17:52:25 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240104_134302 +2024/01/04 17:52:25 - mmengine - INFO - Iter(train) [174000/640000] base_lr: 1.6603e-04 lr: 1.6912e-05 eta: 7 days, 23:14:42 time: 1.4800 data_time: 0.0245 memory: 25719 grad_norm: 2.7765 loss: 1.3895 detection_loss_cls: 0.0380 detection_loss_reg: 0.3413 caption_loss_cls: 2.3510 grounding_loss_reg: 2.9163 semantic_segmentation_loss_cls: 0.0101 instance_segmentation_loss_cls: 0.0348 instance_segmentation_loss_reg: 0.3349 instance_segmentation_loss_poly: 0.9284 +2024/01/04 17:52:25 - mmengine - INFO - Saving checkpoint at 174000 iterations +2024/01/04 18:05:27 - mmengine - INFO - Iter(train) [174500/640000] base_lr: 1.6585e-04 lr: 1.6895e-05 eta: 7 days, 23:34:45 time: 1.4962 data_time: 0.0246 memory: 25719 grad_norm: 2.7660 loss: 1.3718 detection_loss_cls: 0.0380 detection_loss_reg: 0.3414 caption_loss_cls: 2.3484 grounding_loss_reg: 2.9143 semantic_segmentation_loss_cls: 0.0100 instance_segmentation_loss_cls: 0.0347 instance_segmentation_loss_reg: 0.3338 instance_segmentation_loss_poly: 0.9263 +2024/01/04 18:18:12 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240104_134302 +2024/01/04 18:18:12 - mmengine - INFO - Iter(train) [175000/640000] base_lr: 1.6566e-04 lr: 1.6879e-05 eta: 7 days, 23:39:13 time: 1.5062 data_time: 0.0248 memory: 25719 grad_norm: 2.7640 loss: 1.3630 detection_loss_cls: 0.0379 detection_loss_reg: 0.3417 caption_loss_cls: 2.3437 grounding_loss_reg: 2.9150 semantic_segmentation_loss_cls: 0.0100 instance_segmentation_loss_cls: 0.0347 instance_segmentation_loss_reg: 0.3345 instance_segmentation_loss_poly: 0.9276 +2024/01/04 18:30:26 - mmengine - INFO - Iter(train) [175500/640000] base_lr: 1.6548e-04 lr: 1.6862e-05 eta: 7 days, 23:21:34 time: 1.5039 data_time: 0.0247 memory: 25719 grad_norm: 2.7768 loss: 1.3624 detection_loss_cls: 0.0379 detection_loss_reg: 0.3412 caption_loss_cls: 2.3408 grounding_loss_reg: 2.9082 semantic_segmentation_loss_cls: 0.0100 instance_segmentation_loss_cls: 0.0346 instance_segmentation_loss_reg: 0.3344 instance_segmentation_loss_poly: 0.9275 +2024/01/04 18:41:48 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240104_134302 +2024/01/04 18:41:48 - mmengine - INFO - Iter(train) [176000/640000] base_lr: 1.6530e-04 lr: 1.6845e-05 eta: 7 days, 22:30:17 time: 1.4902 data_time: 0.0244 memory: 25719 grad_norm: 2.8509 loss: 1.3536 detection_loss_cls: 0.0379 detection_loss_reg: 0.3411 caption_loss_cls: 2.3357 grounding_loss_reg: 2.9075 semantic_segmentation_loss_cls: 0.0100 instance_segmentation_loss_cls: 0.0346 instance_segmentation_loss_reg: 0.3345 instance_segmentation_loss_poly: 0.9283 +2024/01/04 18:41:48 - mmengine - INFO - Saving checkpoint at 176000 iterations +2024/01/04 18:54:31 - mmengine - INFO - Iter(train) [176500/640000] base_lr: 1.6511e-04 lr: 1.6828e-05 eta: 7 days, 22:32:37 time: 1.4942 data_time: 0.0243 memory: 25719 grad_norm: 2.9092 loss: 1.3604 detection_loss_cls: 0.0381 detection_loss_reg: 0.3427 caption_loss_cls: 2.3338 grounding_loss_reg: 2.9062 semantic_segmentation_loss_cls: 0.0100 instance_segmentation_loss_cls: 0.0347 instance_segmentation_loss_reg: 0.3349 instance_segmentation_loss_poly: 0.9300 +2024/01/04 19:06:04 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240104_134302 +2024/01/04 19:06:04 - mmengine - INFO - Iter(train) [177000/640000] base_lr: 1.6493e-04 lr: 1.6811e-05 eta: 7 days, 21:52:22 time: 1.4840 data_time: 0.0241 memory: 25719 grad_norm: 2.9814 loss: 1.3640 detection_loss_cls: 0.0381 detection_loss_reg: 0.3429 caption_loss_cls: 2.3305 grounding_loss_reg: 2.8992 semantic_segmentation_loss_cls: 0.0101 instance_segmentation_loss_cls: 0.0347 instance_segmentation_loss_reg: 0.3361 instance_segmentation_loss_poly: 0.9318 +2024/01/04 19:18:12 - mmengine - INFO - Iter(train) [177500/640000] base_lr: 1.6474e-04 lr: 1.6795e-05 eta: 7 days, 21:34:27 time: 1.4691 data_time: 0.0239 memory: 25719 grad_norm: 3.0353 loss: 1.3734 detection_loss_cls: 0.0381 detection_loss_reg: 0.3431 caption_loss_cls: 2.3292 grounding_loss_reg: 2.8969 semantic_segmentation_loss_cls: 0.0101 instance_segmentation_loss_cls: 0.0345 instance_segmentation_loss_reg: 0.3358 instance_segmentation_loss_poly: 0.9315 +2024/01/04 19:30:46 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240104_134302 +2024/01/04 19:30:46 - mmengine - INFO - Iter(train) [178000/640000] base_lr: 1.6455e-04 lr: 1.6778e-05 eta: 7 days, 21:31:10 time: 1.4751 data_time: 0.0239 memory: 25719 grad_norm: 3.0432 loss: 1.3731 detection_loss_cls: 0.0380 detection_loss_reg: 0.3428 caption_loss_cls: 2.3265 grounding_loss_reg: 2.8969 semantic_segmentation_loss_cls: 0.0101 instance_segmentation_loss_cls: 0.0343 instance_segmentation_loss_reg: 0.3342 instance_segmentation_loss_poly: 0.9277 +2024/01/04 19:30:46 - mmengine - INFO - Saving checkpoint at 178000 iterations +2024/01/04 19:42:56 - mmengine - INFO - Iter(train) [178500/640000] base_lr: 1.6437e-04 lr: 1.6761e-05 eta: 7 days, 21:14:16 time: 1.4619 data_time: 0.0235 memory: 25719 grad_norm: 3.1060 loss: 1.3960 detection_loss_cls: 0.0379 detection_loss_reg: 0.3423 caption_loss_cls: 2.3255 grounding_loss_reg: 2.8964 semantic_segmentation_loss_cls: 0.0100 instance_segmentation_loss_cls: 0.0342 instance_segmentation_loss_reg: 0.3332 instance_segmentation_loss_poly: 0.9261 +2024/01/04 19:54:55 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240104_134302 +2024/01/04 19:54:55 - mmengine - INFO - Iter(train) [179000/640000] base_lr: 1.6418e-04 lr: 1.6744e-05 eta: 7 days, 20:52:00 time: 1.4504 data_time: 0.0233 memory: 25719 grad_norm: 3.1344 loss: 1.4053 detection_loss_cls: 0.0379 detection_loss_reg: 0.3420 caption_loss_cls: 2.3250 grounding_loss_reg: 2.8956 semantic_segmentation_loss_cls: 0.0100 instance_segmentation_loss_cls: 0.0343 instance_segmentation_loss_reg: 0.3337 instance_segmentation_loss_poly: 0.9269 +2024/01/04 20:07:13 - mmengine - INFO - Iter(train) [179500/640000] base_lr: 1.6399e-04 lr: 1.6727e-05 eta: 7 days, 20:39:49 time: 1.4513 data_time: 0.0234 memory: 25719 grad_norm: 3.1787 loss: 1.4162 detection_loss_cls: 0.0378 detection_loss_reg: 0.3433 caption_loss_cls: 2.3263 grounding_loss_reg: 2.8925 semantic_segmentation_loss_cls: 0.0100 instance_segmentation_loss_cls: 0.0344 instance_segmentation_loss_reg: 0.3341 instance_segmentation_loss_poly: 0.9280 +2024/01/04 20:19:28 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240104_134302 +2024/01/04 20:19:28 - mmengine - INFO - Iter(train) [180000/640000] base_lr: 1.6381e-04 lr: 1.6710e-05 eta: 7 days, 20:26:14 time: 1.4647 data_time: 0.0236 memory: 25719 grad_norm: 3.1242 loss: 1.4138 detection_loss_cls: 0.0378 detection_loss_reg: 0.3430 caption_loss_cls: 2.3262 grounding_loss_reg: 2.8910 semantic_segmentation_loss_cls: 0.0100 instance_segmentation_loss_cls: 0.0345 instance_segmentation_loss_reg: 0.3343 instance_segmentation_loss_poly: 0.9278 +2024/01/04 20:19:28 - mmengine - INFO - Saving checkpoint at 180000 iterations +2024/01/04 20:31:44 - mmengine - INFO - Evaluating bbox... +2024/01/04 20:32:40 - mmengine - INFO - bbox_mAP_copypaste: 0.452 0.632 0.494 0.302 0.504 0.583 +2024/01/04 20:32:40 - mmengine - INFO - Evaluating segm... +2024/01/04 20:33:54 - mmengine - INFO - segm_mAP_copypaste: 0.296 0.544 0.288 0.161 0.338 0.447 +2024/01/04 20:40:57 - mmengine - INFO - per class results: +2024/01/04 20:40:57 - mmengine - INFO - ++---------------------+-------+-------+ +| Class | IoU | Acc | ++---------------------+-------+-------+ +| wall | 77.19 | 88.64 | +| building | 80.7 | 89.96 | +| sky | 92.46 | 98.25 | +| floor | 81.39 | 88.93 | +| tree | 71.25 | 87.56 | +| ceiling | 84.14 | 93.28 | +| road | 82.02 | 89.14 | +| bed | 87.64 | 94.54 | +| windowpane | 61.77 | 75.54 | +| grass | 54.35 | 58.59 | +| cabinet | 60.58 | 72.95 | +| sidewalk | 61.19 | 69.81 | +| person | 80.72 | 90.07 | +| earth | 37.34 | 60.85 | +| door | 52.08 | 66.09 | +| table | 60.54 | 75.3 | +| mountain | 57.63 | 74.3 | +| plant | 48.67 | 57.02 | +| curtain | 71.42 | 85.24 | +| chair | 57.95 | 74.48 | +| car | 83.36 | 92.49 | +| water | 56.26 | 75.03 | +| painting | 58.31 | 90.86 | +| sofa | 69.13 | 80.71 | +| shelf | 49.52 | 71.43 | +| house | 26.48 | 34.06 | +| sea | 55.18 | 70.09 | +| mirror | 65.72 | 80.86 | +| rug | 70.55 | 76.82 | +| field | 19.86 | 45.01 | +| armchair | 46.07 | 62.4 | +| seat | 64.61 | 86.74 | +| fence | 39.51 | 61.29 | +| desk | 44.1 | 61.38 | +| rock | 38.79 | 62.0 | +| wardrobe | 41.18 | 55.95 | +| lamp | 58.66 | 70.14 | +| bathtub | 77.04 | 85.02 | +| railing | 29.08 | 38.49 | +| cushion | 54.58 | 66.69 | +| base | 29.44 | 46.09 | +| box | 26.43 | 40.14 | +| column | 47.51 | 61.77 | +| signboard | 39.74 | 54.02 | +| chest of drawers | 35.77 | 55.47 | +| counter | 26.57 | 41.07 | +| sand | 36.02 | 44.94 | +| sink | 67.83 | 74.44 | +| skyscraper | 36.21 | 42.74 | +| fireplace | 75.21 | 88.49 | +| refrigerator | 71.43 | 83.03 | +| grandstand | 36.65 | 76.47 | +| path | 17.58 | 21.81 | +| stairs | 35.26 | 41.1 | +| runway | 76.67 | 96.36 | +| case | 50.96 | 61.26 | +| pool table | 90.19 | 93.93 | +| pillow | 55.51 | 69.88 | +| screen door | 77.53 | 81.86 | +| stairway | 29.75 | 37.39 | +| river | 4.93 | 7.08 | +| bridge | 62.95 | 72.16 | +| bookcase | 37.05 | 49.51 | +| blind | 38.89 | 45.35 | +| coffee table | 59.14 | 79.97 | +| toilet | 74.77 | 91.38 | +| flower | 31.52 | 53.92 | +| book | 46.38 | 62.41 | +| hill | 7.68 | 10.29 | +| bench | 49.47 | 67.46 | +| countertop | 59.48 | 75.05 | +| stove | 69.9 | 74.7 | +| palm | 45.84 | 64.63 | +| kitchen island | 37.3 | 89.35 | +| computer | 72.35 | 86.4 | +| swivel chair | 38.28 | 49.91 | +| boat | 72.28 | 90.35 | +| bar | 39.42 | 52.38 | +| arcade machine | 71.64 | 77.6 | +| hovel | 38.76 | 62.61 | +| bus | 89.42 | 95.78 | +| towel | 60.96 | 69.18 | +| light | 50.68 | 58.34 | +| truck | 38.29 | 54.79 | +| tower | 22.9 | 34.52 | +| chandelier | 60.26 | 83.19 | +| awning | 28.23 | 36.0 | +| streetlight | 27.06 | 32.34 | +| booth | 42.14 | 85.55 | +| television receiver | 68.45 | 81.58 | +| airplane | 47.56 | 65.49 | +| dirt track | 4.61 | 24.03 | +| apparel | 26.91 | 46.1 | +| pole | 27.75 | 40.81 | +| land | 3.33 | 5.54 | +| bannister | 14.02 | 20.91 | +| escalator | 12.54 | 12.67 | +| ottoman | 44.26 | 75.48 | +| bottle | 18.88 | 21.49 | +| buffet | 35.91 | 40.97 | +| poster | 17.38 | 20.1 | +| stage | 10.39 | 27.1 | +| van | 20.37 | 26.13 | +| ship | 14.65 | 15.03 | +| fountain | 8.01 | 8.87 | +| conveyer belt | 78.32 | 92.14 | +| canopy | 25.57 | 33.2 | +| washer | 70.52 | 74.06 | +| plaything | 23.55 | 28.38 | +| swimming pool | 36.99 | 90.13 | +| stool | 42.29 | 53.14 | +| barrel | 15.83 | 64.47 | +| basket | 32.81 | 37.0 | +| waterfall | 69.15 | 83.72 | +| tent | 84.78 | 90.56 | +| bag | 22.02 | 27.09 | +| minibike | 71.13 | 80.1 | +| cradle | 69.49 | 81.25 | +| oven | 33.51 | 55.69 | +| ball | 45.81 | 66.59 | +| food | 52.22 | 61.41 | +| step | 13.55 | 16.7 | +| tank | 34.34 | 40.34 | +| trade name | 30.22 | 37.46 | +| microwave | 70.01 | 80.08 | +| pot | 49.8 | 60.94 | +| animal | 53.99 | 57.15 | +| bicycle | 53.79 | 72.83 | +| lake | 59.23 | 62.72 | +| dishwasher | 63.38 | 80.06 | +| screen | 68.1 | 87.89 | +| blanket | 10.49 | 11.14 | +| sculpture | 47.16 | 62.6 | +| hood | 59.38 | 67.4 | +| sconce | 38.34 | 46.85 | +| vase | 38.19 | 48.95 | +| traffic light | 37.36 | 66.09 | +| tray | 9.4 | 18.39 | +| ashcan | 40.23 | 63.66 | +| fan | 58.93 | 71.82 | +| pier | 44.95 | 57.82 | +| crt screen | 6.42 | 18.6 | +| plate | 55.24 | 74.04 | +| monitor | 15.49 | 18.33 | +| bulletin board | 28.04 | 33.29 | +| shower | 2.3 | 2.62 | +| radiator | 59.8 | 64.75 | +| glass | 18.46 | 21.11 | +| clock | 21.34 | 29.05 | +| flag | 35.37 | 41.21 | ++---------------------+-------+-------+ +2024/01/04 20:41:15 - mmengine - INFO - Iter(val) [209/209] coco/bbox_mAP: 0.4520 coco/bbox_mAP_50: 0.6320 coco/bbox_mAP_75: 0.4940 coco/bbox_mAP_s: 0.3020 coco/bbox_mAP_m: 0.5040 coco/bbox_mAP_l: 0.5830 coco/segm_mAP: 0.2960 coco/segm_mAP_50: 0.5440 coco/segm_mAP_75: 0.2880 coco/segm_mAP_s: 0.1610 coco/segm_mAP_m: 0.3380 coco/segm_mAP_l: 0.4470 Bleu_1: 0.7314 Bleu_2: 0.5653 Bleu_3: 0.4208 Bleu_4: 0.3084 METEOR: 0.2496 ROUGE_L: 0.5344 CIDEr: 0.9679 SPICE: 0.1826 aAcc: 81.8700 mIoU: 46.8100 mAcc: 59.6500 visual-grounding/miou: 0.7675 visual-grounding/acc: 0.8402 data_time: 0.0104 time: 1.3588 +2024/01/04 20:53:10 - mmengine - INFO - Iter(train) [180500/640000] base_lr: 1.6362e-04 lr: 1.6692e-05 eta: 7 days, 20:04:24 time: 1.4533 data_time: 0.0200 memory: 25719 grad_norm: 3.1036 loss: 1.4069 detection_loss_cls: 0.0377 detection_loss_reg: 0.3428 caption_loss_cls: 2.3321 grounding_loss_reg: 2.8935 semantic_segmentation_loss_cls: 0.0100 instance_segmentation_loss_cls: 0.0346 instance_segmentation_loss_reg: 0.3355 instance_segmentation_loss_poly: 0.9305 +2024/01/04 21:06:14 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240104_134302 +2024/01/04 21:06:14 - mmengine - INFO - Iter(train) [181000/640000] base_lr: 1.6343e-04 lr: 1.6675e-05 eta: 7 days, 20:13:15 time: 1.4759 data_time: 0.0206 memory: 25719 grad_norm: 3.0315 loss: 1.3983 detection_loss_cls: 0.0376 detection_loss_reg: 0.3425 caption_loss_cls: 2.3351 grounding_loss_reg: 2.8919 semantic_segmentation_loss_cls: 0.0100 instance_segmentation_loss_cls: 0.0347 instance_segmentation_loss_reg: 0.3363 instance_segmentation_loss_poly: 0.9323 +2024/01/04 21:18:33 - mmengine - INFO - Iter(train) [181500/640000] base_lr: 1.6324e-04 lr: 1.6658e-05 eta: 7 days, 20:01:27 time: 1.4787 data_time: 0.0208 memory: 25719 grad_norm: 3.0349 loss: 1.4005 detection_loss_cls: 0.0375 detection_loss_reg: 0.3412 caption_loss_cls: 2.3377 grounding_loss_reg: 2.8877 semantic_segmentation_loss_cls: 0.0100 instance_segmentation_loss_cls: 0.0347 instance_segmentation_loss_reg: 0.3370 instance_segmentation_loss_poly: 0.9339 +2024/01/04 21:30:17 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240104_134302 +2024/01/04 21:30:17 - mmengine - INFO - Iter(train) [182000/640000] base_lr: 1.6305e-04 lr: 1.6641e-05 eta: 7 days, 19:34:29 time: 1.4660 data_time: 0.0210 memory: 25719 grad_norm: 3.0399 loss: 1.4067 detection_loss_cls: 0.0376 detection_loss_reg: 0.3420 caption_loss_cls: 2.3331 grounding_loss_reg: 2.8875 semantic_segmentation_loss_cls: 0.0100 instance_segmentation_loss_cls: 0.0348 instance_segmentation_loss_reg: 0.3365 instance_segmentation_loss_poly: 0.9325 +2024/01/04 21:30:17 - mmengine - INFO - Saving checkpoint at 182000 iterations +2024/01/04 21:42:19 - mmengine - INFO - Iter(train) [182500/640000] base_lr: 1.6286e-04 lr: 1.6624e-05 eta: 7 days, 19:15:36 time: 1.4639 data_time: 0.0222 memory: 25719 grad_norm: 3.0379 loss: 1.4159 detection_loss_cls: 0.0376 detection_loss_reg: 0.3418 caption_loss_cls: 2.3360 grounding_loss_reg: 2.8845 semantic_segmentation_loss_cls: 0.0100 instance_segmentation_loss_cls: 0.0349 instance_segmentation_loss_reg: 0.3365 instance_segmentation_loss_poly: 0.9333 +2024/01/04 21:55:05 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240104_134302 +2024/01/04 21:55:05 - mmengine - INFO - Iter(train) [183000/640000] base_lr: 1.6267e-04 lr: 1.6607e-05 eta: 7 days, 19:15:21 time: 1.4759 data_time: 0.0227 memory: 25719 grad_norm: 3.0428 loss: 1.4209 detection_loss_cls: 0.0379 detection_loss_reg: 0.3440 caption_loss_cls: 2.3357 grounding_loss_reg: 2.8864 semantic_segmentation_loss_cls: 0.0100 instance_segmentation_loss_cls: 0.0351 instance_segmentation_loss_reg: 0.3387 instance_segmentation_loss_poly: 0.9380 +2024/01/04 22:08:21 - mmengine - INFO - Iter(train) [183500/640000] base_lr: 1.6248e-04 lr: 1.6589e-05 eta: 7 days, 19:25:28 time: 1.4903 data_time: 0.0231 memory: 25719 grad_norm: 2.9955 loss: 1.4007 detection_loss_cls: 0.0379 detection_loss_reg: 0.3445 caption_loss_cls: 2.3337 grounding_loss_reg: 2.8871 semantic_segmentation_loss_cls: 0.0100 instance_segmentation_loss_cls: 0.0351 instance_segmentation_loss_reg: 0.3384 instance_segmentation_loss_poly: 0.9383 +2024/01/04 22:20:35 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240104_134302 +2024/01/04 22:20:35 - mmengine - INFO - Iter(train) [184000/640000] base_lr: 1.6229e-04 lr: 1.6572e-05 eta: 7 days, 19:11:20 time: 1.4901 data_time: 0.0234 memory: 25719 grad_norm: 3.0659 loss: 1.4092 detection_loss_cls: 0.0380 detection_loss_reg: 0.3445 caption_loss_cls: 2.3355 grounding_loss_reg: 2.8855 semantic_segmentation_loss_cls: 0.0100 instance_segmentation_loss_cls: 0.0351 instance_segmentation_loss_reg: 0.3391 instance_segmentation_loss_poly: 0.9394 +2024/01/04 22:20:35 - mmengine - INFO - Saving checkpoint at 184000 iterations +2024/01/04 22:33:30 - mmengine - INFO - Iter(train) [184500/640000] base_lr: 1.6210e-04 lr: 1.6555e-05 eta: 7 days, 19:12:11 time: 1.5046 data_time: 0.0278 memory: 25719 grad_norm: 3.0581 loss: 1.4050 detection_loss_cls: 0.0380 detection_loss_reg: 0.3448 caption_loss_cls: 2.3337 grounding_loss_reg: 2.8860 semantic_segmentation_loss_cls: 0.0100 instance_segmentation_loss_cls: 0.0351 instance_segmentation_loss_reg: 0.3398 instance_segmentation_loss_poly: 0.9403 +2024/01/04 22:45:25 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240104_134302 +2024/01/04 22:45:25 - mmengine - INFO - Iter(train) [185000/640000] base_lr: 1.6191e-04 lr: 1.6537e-05 eta: 7 days, 18:50:50 time: 1.4873 data_time: 0.0274 memory: 25719 grad_norm: 3.1263 loss: 1.4156 detection_loss_cls: 0.0383 detection_loss_reg: 0.3461 caption_loss_cls: 2.3342 grounding_loss_reg: 2.8858 semantic_segmentation_loss_cls: 0.0100 instance_segmentation_loss_cls: 0.0353 instance_segmentation_loss_reg: 0.3397 instance_segmentation_loss_poly: 0.9406 +2024/01/04 22:57:55 - mmengine - INFO - Iter(train) [185500/640000] base_lr: 1.6172e-04 lr: 1.6520e-05 eta: 7 days, 18:42:20 time: 1.4900 data_time: 0.0274 memory: 25719 grad_norm: 3.1396 loss: 1.4148 detection_loss_cls: 0.0383 detection_loss_reg: 0.3459 caption_loss_cls: 2.3337 grounding_loss_reg: 2.8858 semantic_segmentation_loss_cls: 0.0101 instance_segmentation_loss_cls: 0.0353 instance_segmentation_loss_reg: 0.3391 instance_segmentation_loss_poly: 0.9397 +2024/01/04 23:10:47 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240104_134302 +2024/01/04 23:10:47 - mmengine - INFO - Iter(train) [186000/640000] base_lr: 1.6152e-04 lr: 1.6502e-05 eta: 7 days, 18:41:18 time: 1.5072 data_time: 0.0275 memory: 25719 grad_norm: 3.1046 loss: 1.3936 detection_loss_cls: 0.0383 detection_loss_reg: 0.3464 caption_loss_cls: 2.3346 grounding_loss_reg: 2.8856 semantic_segmentation_loss_cls: 0.0101 instance_segmentation_loss_cls: 0.0352 instance_segmentation_loss_reg: 0.3391 instance_segmentation_loss_poly: 0.9388 +2024/01/04 23:10:47 - mmengine - INFO - Saving checkpoint at 186000 iterations +2024/01/04 23:23:22 - mmengine - INFO - Iter(train) [186500/640000] base_lr: 1.6133e-04 lr: 1.6485e-05 eta: 7 days, 18:33:54 time: 1.5156 data_time: 0.0272 memory: 25719 grad_norm: 3.1008 loss: 1.3874 detection_loss_cls: 0.0386 detection_loss_reg: 0.3485 caption_loss_cls: 2.3361 grounding_loss_reg: 2.8890 semantic_segmentation_loss_cls: 0.0100 instance_segmentation_loss_cls: 0.0354 instance_segmentation_loss_reg: 0.3409 instance_segmentation_loss_poly: 0.9414 +2024/01/04 23:35:12 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240104_134302 +2024/01/04 23:35:12 - mmengine - INFO - Iter(train) [187000/640000] base_lr: 1.6114e-04 lr: 1.6467e-05 eta: 7 days, 18:11:23 time: 1.5013 data_time: 0.0270 memory: 25719 grad_norm: 3.0814 loss: 1.3798 detection_loss_cls: 0.0388 detection_loss_reg: 0.3500 caption_loss_cls: 2.3381 grounding_loss_reg: 2.8864 semantic_segmentation_loss_cls: 0.0100 instance_segmentation_loss_cls: 0.0356 instance_segmentation_loss_reg: 0.3427 instance_segmentation_loss_poly: 0.9455 +2024/01/04 23:47:05 - mmengine - INFO - Iter(train) [187500/640000] base_lr: 1.6095e-04 lr: 1.6450e-05 eta: 7 days, 17:50:31 time: 1.4808 data_time: 0.0267 memory: 25719 grad_norm: 3.1019 loss: 1.3941 detection_loss_cls: 0.0387 detection_loss_reg: 0.3487 caption_loss_cls: 2.3440 grounding_loss_reg: 2.8867 semantic_segmentation_loss_cls: 0.0101 instance_segmentation_loss_cls: 0.0357 instance_segmentation_loss_reg: 0.3423 instance_segmentation_loss_poly: 0.9446 +2024/01/04 23:58:33 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240104_134302 +2024/01/04 23:58:33 - mmengine - INFO - Iter(train) [188000/640000] base_lr: 1.6075e-04 lr: 1.6432e-05 eta: 7 days, 17:22:00 time: 1.4692 data_time: 0.0264 memory: 25719 grad_norm: 3.1017 loss: 1.3903 detection_loss_cls: 0.0388 detection_loss_reg: 0.3496 caption_loss_cls: 2.3433 grounding_loss_reg: 2.8877 semantic_segmentation_loss_cls: 0.0100 instance_segmentation_loss_cls: 0.0357 instance_segmentation_loss_reg: 0.3427 instance_segmentation_loss_poly: 0.9450 +2024/01/04 23:58:33 - mmengine - INFO - Saving checkpoint at 188000 iterations +2024/01/05 00:10:57 - mmengine - INFO - Iter(train) [188500/640000] base_lr: 1.6056e-04 lr: 1.6414e-05 eta: 7 days, 17:11:19 time: 1.4614 data_time: 0.0264 memory: 25719 grad_norm: 3.1256 loss: 1.4081 detection_loss_cls: 0.0388 detection_loss_reg: 0.3500 caption_loss_cls: 2.3482 grounding_loss_reg: 2.8888 semantic_segmentation_loss_cls: 0.0100 instance_segmentation_loss_cls: 0.0358 instance_segmentation_loss_reg: 0.3438 instance_segmentation_loss_poly: 0.9486 +2024/01/05 00:23:36 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240104_134302 +2024/01/05 00:23:36 - mmengine - INFO - Iter(train) [189000/640000] base_lr: 1.6036e-04 lr: 1.6397e-05 eta: 7 days, 17:05:18 time: 1.4725 data_time: 0.0266 memory: 25719 grad_norm: 3.0641 loss: 1.3983 detection_loss_cls: 0.0389 detection_loss_reg: 0.3506 caption_loss_cls: 2.3509 grounding_loss_reg: 2.8893 semantic_segmentation_loss_cls: 0.0100 instance_segmentation_loss_cls: 0.0356 instance_segmentation_loss_reg: 0.3422 instance_segmentation_loss_poly: 0.9452 +2024/01/05 00:36:20 - mmengine - INFO - Iter(train) [189500/640000] base_lr: 1.6017e-04 lr: 1.6379e-05 eta: 7 days, 17:00:12 time: 1.4758 data_time: 0.0267 memory: 25719 grad_norm: 3.0257 loss: 1.3919 detection_loss_cls: 0.0389 detection_loss_reg: 0.3514 caption_loss_cls: 2.3527 grounding_loss_reg: 2.8934 semantic_segmentation_loss_cls: 0.0100 instance_segmentation_loss_cls: 0.0356 instance_segmentation_loss_reg: 0.3432 instance_segmentation_loss_poly: 0.9472 +2024/01/05 00:49:00 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240104_134302 +2024/01/05 00:49:00 - mmengine - INFO - Iter(train) [190000/640000] base_lr: 1.5997e-04 lr: 1.6361e-05 eta: 7 days, 16:53:47 time: 1.4727 data_time: 0.0269 memory: 25719 grad_norm: 3.0531 loss: 1.4121 detection_loss_cls: 0.0389 detection_loss_reg: 0.3518 caption_loss_cls: 2.3554 grounding_loss_reg: 2.8938 semantic_segmentation_loss_cls: 0.0099 instance_segmentation_loss_cls: 0.0359 instance_segmentation_loss_reg: 0.3450 instance_segmentation_loss_poly: 0.9519 +2024/01/05 00:49:00 - mmengine - INFO - Saving checkpoint at 190000 iterations +2024/01/05 01:01:54 - mmengine - INFO - Iter(train) [190500/640000] base_lr: 1.5978e-04 lr: 1.6344e-05 eta: 7 days, 16:51:21 time: 1.4776 data_time: 0.0270 memory: 25719 grad_norm: 2.9863 loss: 1.4005 detection_loss_cls: 0.0389 detection_loss_reg: 0.3525 caption_loss_cls: 2.3577 grounding_loss_reg: 2.8931 semantic_segmentation_loss_cls: 0.0099 instance_segmentation_loss_cls: 0.0359 instance_segmentation_loss_reg: 0.3455 instance_segmentation_loss_poly: 0.9523 +2024/01/05 01:14:40 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240104_134302 +2024/01/05 01:14:40 - mmengine - INFO - Iter(train) [191000/640000] base_lr: 1.5958e-04 lr: 1.6326e-05 eta: 7 days, 16:46:06 time: 1.4917 data_time: 0.0271 memory: 25719 grad_norm: 2.9390 loss: 1.3925 detection_loss_cls: 0.0388 detection_loss_reg: 0.3517 caption_loss_cls: 2.3621 grounding_loss_reg: 2.8906 semantic_segmentation_loss_cls: 0.0099 instance_segmentation_loss_cls: 0.0359 instance_segmentation_loss_reg: 0.3448 instance_segmentation_loss_poly: 0.9514 +2024/01/05 01:28:04 - mmengine - INFO - Iter(train) [191500/640000] base_lr: 1.5939e-04 lr: 1.6308e-05 eta: 7 days, 16:50:50 time: 1.5143 data_time: 0.0276 memory: 25719 grad_norm: 2.8626 loss: 1.3732 detection_loss_cls: 0.0388 detection_loss_reg: 0.3516 caption_loss_cls: 2.3611 grounding_loss_reg: 2.8916 semantic_segmentation_loss_cls: 0.0099 instance_segmentation_loss_cls: 0.0359 instance_segmentation_loss_reg: 0.3451 instance_segmentation_loss_poly: 0.9519 +2024/01/05 01:40:01 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240104_134302 +2024/01/05 01:40:01 - mmengine - INFO - Iter(train) [192000/640000] base_lr: 1.5919e-04 lr: 1.6290e-05 eta: 7 days, 16:31:38 time: 1.5214 data_time: 0.0277 memory: 25719 grad_norm: 2.7838 loss: 1.3775 detection_loss_cls: 0.0387 detection_loss_reg: 0.3510 caption_loss_cls: 2.3655 grounding_loss_reg: 2.8879 semantic_segmentation_loss_cls: 0.0099 instance_segmentation_loss_cls: 0.0359 instance_segmentation_loss_reg: 0.3437 instance_segmentation_loss_poly: 0.9498 +2024/01/05 01:40:01 - mmengine - INFO - Saving checkpoint at 192000 iterations +2024/01/05 01:52:26 - mmengine - INFO - Iter(train) [192500/640000] base_lr: 1.5899e-04 lr: 1.6272e-05 eta: 7 days, 16:20:10 time: 1.5218 data_time: 0.0278 memory: 25719 grad_norm: 2.8298 loss: 1.3696 detection_loss_cls: 0.0387 detection_loss_reg: 0.3510 caption_loss_cls: 2.3639 grounding_loss_reg: 2.8900 semantic_segmentation_loss_cls: 0.0099 instance_segmentation_loss_cls: 0.0358 instance_segmentation_loss_reg: 0.3439 instance_segmentation_loss_poly: 0.9501 +2024/01/05 02:04:53 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240104_134302 +2024/01/05 02:04:53 - mmengine - INFO - Iter(train) [193000/640000] base_lr: 1.5880e-04 lr: 1.6254e-05 eta: 7 days, 16:09:11 time: 1.5187 data_time: 0.0278 memory: 25719 grad_norm: 2.8566 loss: 1.3817 detection_loss_cls: 0.0387 detection_loss_reg: 0.3518 caption_loss_cls: 2.3690 grounding_loss_reg: 2.8895 semantic_segmentation_loss_cls: 0.0099 instance_segmentation_loss_cls: 0.0359 instance_segmentation_loss_reg: 0.3451 instance_segmentation_loss_poly: 0.9525 +2024/01/05 02:16:52 - mmengine - INFO - Iter(train) [193500/640000] base_lr: 1.5860e-04 lr: 1.6236e-05 eta: 7 days, 15:51:12 time: 1.5077 data_time: 0.0277 memory: 25719 grad_norm: 2.9804 loss: 1.3901 detection_loss_cls: 0.0386 detection_loss_reg: 0.3516 caption_loss_cls: 2.3665 grounding_loss_reg: 2.8905 semantic_segmentation_loss_cls: 0.0099 instance_segmentation_loss_cls: 0.0359 instance_segmentation_loss_reg: 0.3448 instance_segmentation_loss_poly: 0.9526 +2024/01/05 02:28:45 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240104_134302 +2024/01/05 02:28:45 - mmengine - INFO - Iter(train) [194000/640000] base_lr: 1.5840e-04 lr: 1.6218e-05 eta: 7 days, 15:31:54 time: 1.4960 data_time: 0.0274 memory: 25719 grad_norm: 3.0448 loss: 1.3893 detection_loss_cls: 0.0388 detection_loss_reg: 0.3535 caption_loss_cls: 2.3651 grounding_loss_reg: 2.8878 semantic_segmentation_loss_cls: 0.0099 instance_segmentation_loss_cls: 0.0361 instance_segmentation_loss_reg: 0.3462 instance_segmentation_loss_poly: 0.9551 +2024/01/05 02:28:45 - mmengine - INFO - Saving checkpoint at 194000 iterations +2024/01/05 02:41:43 - mmengine - INFO - Iter(train) [194500/640000] base_lr: 1.5820e-04 lr: 1.6200e-05 eta: 7 days, 15:28:31 time: 1.4968 data_time: 0.0276 memory: 25719 grad_norm: 3.1330 loss: 1.3937 detection_loss_cls: 0.0389 detection_loss_reg: 0.3546 caption_loss_cls: 2.3682 grounding_loss_reg: 2.8840 semantic_segmentation_loss_cls: 0.0099 instance_segmentation_loss_cls: 0.0362 instance_segmentation_loss_reg: 0.3478 instance_segmentation_loss_poly: 0.9588 +2024/01/05 02:53:17 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240104_134302 +2024/01/05 02:53:17 - mmengine - INFO - Iter(train) [195000/640000] base_lr: 1.5801e-04 lr: 1.6182e-05 eta: 7 days, 15:04:45 time: 1.4787 data_time: 0.0273 memory: 25719 grad_norm: 3.2405 loss: 1.4054 detection_loss_cls: 0.0388 detection_loss_reg: 0.3548 caption_loss_cls: 2.3678 grounding_loss_reg: 2.8795 semantic_segmentation_loss_cls: 0.0099 instance_segmentation_loss_cls: 0.0362 instance_segmentation_loss_reg: 0.3472 instance_segmentation_loss_poly: 0.9575 +2024/01/05 03:05:19 - mmengine - INFO - Iter(train) [195500/640000] base_lr: 1.5781e-04 lr: 1.6164e-05 eta: 7 days, 14:48:00 time: 1.4583 data_time: 0.0269 memory: 25719 grad_norm: 3.3457 loss: 1.4195 detection_loss_cls: 0.0388 detection_loss_reg: 0.3550 caption_loss_cls: 2.3754 grounding_loss_reg: 2.8791 semantic_segmentation_loss_cls: 0.0099 instance_segmentation_loss_cls: 0.0361 instance_segmentation_loss_reg: 0.3461 instance_segmentation_loss_poly: 0.9556 +2024/01/05 03:17:00 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240104_134302 +2024/01/05 03:17:00 - mmengine - INFO - Iter(train) [196000/640000] base_lr: 1.5761e-04 lr: 1.6146e-05 eta: 7 days, 14:26:37 time: 1.4545 data_time: 0.0269 memory: 25719 grad_norm: 3.3873 loss: 1.4166 detection_loss_cls: 0.0388 detection_loss_reg: 0.3557 caption_loss_cls: 2.3740 grounding_loss_reg: 2.8795 semantic_segmentation_loss_cls: 0.0099 instance_segmentation_loss_cls: 0.0362 instance_segmentation_loss_reg: 0.3471 instance_segmentation_loss_poly: 0.9571 +2024/01/05 03:17:00 - mmengine - INFO - Saving checkpoint at 196000 iterations +2024/01/05 03:28:53 - mmengine - INFO - Iter(train) [196500/640000] base_lr: 1.5741e-04 lr: 1.6128e-05 eta: 7 days, 14:08:03 time: 1.4464 data_time: 0.0265 memory: 25719 grad_norm: 3.3427 loss: 1.4087 detection_loss_cls: 0.0386 detection_loss_reg: 0.3543 caption_loss_cls: 2.3706 grounding_loss_reg: 2.8765 semantic_segmentation_loss_cls: 0.0098 instance_segmentation_loss_cls: 0.0361 instance_segmentation_loss_reg: 0.3462 instance_segmentation_loss_poly: 0.9556 +2024/01/05 03:40:48 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240104_134302 +2024/01/05 03:40:48 - mmengine - INFO - Iter(train) [197000/640000] base_lr: 1.5721e-04 lr: 1.6110e-05 eta: 7 days, 13:50:24 time: 1.4385 data_time: 0.0264 memory: 25719 grad_norm: 3.3438 loss: 1.4063 detection_loss_cls: 0.0384 detection_loss_reg: 0.3531 caption_loss_cls: 2.3710 grounding_loss_reg: 2.8790 semantic_segmentation_loss_cls: 0.0098 instance_segmentation_loss_cls: 0.0361 instance_segmentation_loss_reg: 0.3457 instance_segmentation_loss_poly: 0.9551 +2024/01/05 03:52:48 - mmengine - INFO - Iter(train) [197500/640000] base_lr: 1.5701e-04 lr: 1.6092e-05 eta: 7 days, 13:33:47 time: 1.4385 data_time: 0.0263 memory: 25719 grad_norm: 3.2718 loss: 1.4042 detection_loss_cls: 0.0385 detection_loss_reg: 0.3537 caption_loss_cls: 2.3729 grounding_loss_reg: 2.8794 semantic_segmentation_loss_cls: 0.0098 instance_segmentation_loss_cls: 0.0361 instance_segmentation_loss_reg: 0.3455 instance_segmentation_loss_poly: 0.9546 +2024/01/05 04:05:05 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240104_134302 +2024/01/05 04:05:05 - mmengine - INFO - Iter(train) [198000/640000] base_lr: 1.5681e-04 lr: 1.6073e-05 eta: 7 days, 13:21:13 time: 1.4446 data_time: 0.0262 memory: 25719 grad_norm: 3.1899 loss: 1.3922 detection_loss_cls: 0.0386 detection_loss_reg: 0.3547 caption_loss_cls: 2.3777 grounding_loss_reg: 2.8756 semantic_segmentation_loss_cls: 0.0098 instance_segmentation_loss_cls: 0.0362 instance_segmentation_loss_reg: 0.3458 instance_segmentation_loss_poly: 0.9556 +2024/01/05 04:05:05 - mmengine - INFO - Saving checkpoint at 198000 iterations +2024/01/05 04:17:35 - mmengine - INFO - Iter(train) [198500/640000] base_lr: 1.5661e-04 lr: 1.6055e-05 eta: 7 days, 13:11:18 time: 1.4376 data_time: 0.0261 memory: 25719 grad_norm: 3.1359 loss: 1.3890 detection_loss_cls: 0.0386 detection_loss_reg: 0.3548 caption_loss_cls: 2.3776 grounding_loss_reg: 2.8757 semantic_segmentation_loss_cls: 0.0098 instance_segmentation_loss_cls: 0.0362 instance_segmentation_loss_reg: 0.3462 instance_segmentation_loss_poly: 0.9565 +2024/01/05 04:30:02 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240104_134302 +2024/01/05 04:30:02 - mmengine - INFO - Iter(train) [199000/640000] base_lr: 1.5641e-04 lr: 1.6037e-05 eta: 7 days, 13:00:35 time: 1.4508 data_time: 0.0263 memory: 25719 grad_norm: 3.0873 loss: 1.3860 detection_loss_cls: 0.0385 detection_loss_reg: 0.3546 caption_loss_cls: 2.3741 grounding_loss_reg: 2.8717 semantic_segmentation_loss_cls: 0.0098 instance_segmentation_loss_cls: 0.0362 instance_segmentation_loss_reg: 0.3469 instance_segmentation_loss_poly: 0.9571 +2024/01/05 04:43:23 - mmengine - INFO - Iter(train) [199500/640000] base_lr: 1.5620e-04 lr: 1.6019e-05 eta: 7 days, 13:01:11 time: 1.4707 data_time: 0.0269 memory: 25719 grad_norm: 2.9888 loss: 1.3835 detection_loss_cls: 0.0387 detection_loss_reg: 0.3559 caption_loss_cls: 2.3771 grounding_loss_reg: 2.8721 semantic_segmentation_loss_cls: 0.0098 instance_segmentation_loss_cls: 0.0361 instance_segmentation_loss_reg: 0.3466 instance_segmentation_loss_poly: 0.9553 +2024/01/05 04:56:12 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240104_134302 +2024/01/05 04:56:12 - mmengine - INFO - Iter(train) [200000/640000] base_lr: 1.5600e-04 lr: 1.6000e-05 eta: 7 days, 12:54:44 time: 1.4875 data_time: 0.0272 memory: 25719 grad_norm: 2.9300 loss: 1.3775 detection_loss_cls: 0.0386 detection_loss_reg: 0.3556 caption_loss_cls: 2.3747 grounding_loss_reg: 2.8731 semantic_segmentation_loss_cls: 0.0098 instance_segmentation_loss_cls: 0.0361 instance_segmentation_loss_reg: 0.3483 instance_segmentation_loss_poly: 0.9587 +2024/01/05 04:56:12 - mmengine - INFO - Saving checkpoint at 200000 iterations +2024/01/05 05:08:45 - mmengine - INFO - Evaluating bbox... +2024/01/05 05:09:42 - mmengine - INFO - bbox_mAP_copypaste: 0.467 0.647 0.511 0.311 0.519 0.593 +2024/01/05 05:09:42 - mmengine - INFO - Evaluating segm... +2024/01/05 05:10:56 - mmengine - INFO - segm_mAP_copypaste: 0.309 0.558 0.305 0.169 0.350 0.467 +2024/01/05 05:19:05 - mmengine - INFO - per class results: +2024/01/05 05:19:05 - mmengine - INFO - ++---------------------+-------+-------+ +| Class | IoU | Acc | ++---------------------+-------+-------+ +| wall | 76.58 | 87.17 | +| building | 80.44 | 92.24 | +| sky | 93.17 | 97.61 | +| floor | 82.23 | 89.64 | +| tree | 72.06 | 85.93 | +| ceiling | 84.97 | 94.03 | +| road | 82.21 | 90.79 | +| bed | 88.75 | 94.63 | +| windowpane | 62.67 | 80.82 | +| grass | 67.49 | 88.38 | +| cabinet | 60.0 | 71.75 | +| sidewalk | 64.61 | 77.53 | +| person | 80.06 | 91.38 | +| earth | 36.48 | 46.09 | +| door | 48.9 | 65.13 | +| table | 62.64 | 76.93 | +| mountain | 57.04 | 73.47 | +| plant | 49.43 | 57.78 | +| curtain | 73.22 | 88.29 | +| chair | 59.06 | 74.02 | +| car | 83.51 | 90.65 | +| water | 55.2 | 73.84 | +| painting | 66.52 | 87.79 | +| sofa | 70.21 | 83.12 | +| shelf | 47.06 | 65.62 | +| house | 39.96 | 55.65 | +| sea | 58.01 | 77.83 | +| mirror | 66.59 | 78.43 | +| rug | 71.32 | 81.04 | +| field | 28.82 | 38.48 | +| armchair | 47.1 | 66.34 | +| seat | 58.29 | 75.26 | +| fence | 44.88 | 69.95 | +| desk | 44.4 | 67.98 | +| rock | 41.07 | 56.57 | +| wardrobe | 47.31 | 55.45 | +| lamp | 59.85 | 78.02 | +| bathtub | 76.75 | 80.92 | +| railing | 32.96 | 44.71 | +| cushion | 53.74 | 64.8 | +| base | 21.57 | 29.46 | +| box | 24.05 | 31.43 | +| column | 47.76 | 65.97 | +| signboard | 33.61 | 46.41 | +| chest of drawers | 30.78 | 57.96 | +| counter | 40.73 | 58.69 | +| sand | 52.67 | 60.46 | +| sink | 69.94 | 79.94 | +| skyscraper | 44.88 | 55.9 | +| fireplace | 69.93 | 88.26 | +| refrigerator | 76.95 | 85.94 | +| grandstand | 35.79 | 77.33 | +| path | 23.5 | 34.17 | +| stairs | 27.73 | 33.12 | +| runway | 74.76 | 82.88 | +| case | 60.62 | 73.1 | +| pool table | 90.1 | 96.15 | +| pillow | 56.79 | 73.37 | +| screen door | 69.81 | 76.42 | +| stairway | 32.82 | 50.88 | +| river | 19.52 | 30.13 | +| bridge | 66.64 | 82.97 | +| bookcase | 36.83 | 58.79 | +| blind | 39.7 | 43.32 | +| coffee table | 64.16 | 80.66 | +| toilet | 78.92 | 91.29 | +| flower | 28.74 | 38.11 | +| book | 46.66 | 64.35 | +| hill | 10.11 | 19.29 | +| bench | 50.73 | 58.34 | +| countertop | 52.03 | 65.27 | +| stove | 73.62 | 85.67 | +| palm | 43.7 | 66.7 | +| kitchen island | 40.36 | 86.16 | +| computer | 68.49 | 81.32 | +| swivel chair | 43.6 | 57.28 | +| boat | 61.9 | 66.87 | +| bar | 19.49 | 21.6 | +| arcade machine | 60.5 | 62.57 | +| hovel | 19.03 | 20.28 | +| bus | 91.46 | 95.88 | +| towel | 51.78 | 75.15 | +| light | 53.11 | 64.03 | +| truck | 42.52 | 58.84 | +| tower | 44.74 | 81.81 | +| chandelier | 62.16 | 76.1 | +| awning | 26.14 | 28.74 | +| streetlight | 23.79 | 35.46 | +| booth | 33.99 | 74.47 | +| television receiver | 66.82 | 78.35 | +| airplane | 59.44 | 67.33 | +| dirt track | 0.0 | 0.0 | +| apparel | 31.43 | 44.13 | +| pole | 16.48 | 20.23 | +| land | 3.53 | 4.28 | +| bannister | 18.85 | 29.9 | +| escalator | 34.64 | 40.2 | +| ottoman | 52.48 | 68.65 | +| bottle | 21.42 | 26.71 | +| buffet | 46.48 | 61.45 | +| poster | 30.28 | 36.51 | +| stage | 9.85 | 17.74 | +| van | 41.69 | 50.6 | +| ship | 17.45 | 22.27 | +| fountain | 2.34 | 2.4 | +| conveyer belt | 79.36 | 90.39 | +| canopy | 18.82 | 19.68 | +| washer | 66.01 | 70.1 | +| plaything | 28.01 | 34.64 | +| swimming pool | 66.55 | 74.67 | +| stool | 46.32 | 61.99 | +| barrel | 9.01 | 64.18 | +| basket | 29.76 | 37.79 | +| waterfall | 51.69 | 67.48 | +| tent | 90.19 | 97.35 | +| bag | 22.22 | 28.32 | +| minibike | 73.34 | 79.24 | +| cradle | 76.12 | 95.95 | +| oven | 26.68 | 42.56 | +| ball | 47.57 | 71.1 | +| food | 48.58 | 53.84 | +| step | 18.78 | 27.95 | +| tank | 36.42 | 38.73 | +| trade name | 10.3 | 10.64 | +| microwave | 68.2 | 76.12 | +| pot | 49.63 | 58.24 | +| animal | 55.41 | 57.61 | +| bicycle | 57.97 | 76.11 | +| lake | 53.8 | 63.28 | +| dishwasher | 59.39 | 69.85 | +| screen | 67.36 | 73.92 | +| blanket | 11.03 | 13.1 | +| sculpture | 44.47 | 51.56 | +| hood | 60.32 | 73.96 | +| sconce | 39.24 | 47.05 | +| vase | 40.16 | 49.09 | +| traffic light | 33.86 | 49.96 | +| tray | 9.72 | 16.26 | +| ashcan | 38.93 | 48.39 | +| fan | 59.63 | 76.81 | +| pier | 24.3 | 40.14 | +| crt screen | 15.23 | 35.06 | +| plate | 54.02 | 71.86 | +| monitor | 11.13 | 12.86 | +| bulletin board | 11.3 | 12.39 | +| shower | 1.22 | 4.92 | +| radiator | 45.67 | 47.87 | +| glass | 17.18 | 18.76 | +| clock | 21.17 | 25.79 | +| flag | 44.1 | 52.24 | ++---------------------+-------+-------+ +2024/01/05 05:19:22 - mmengine - INFO - Iter(val) [209/209] coco/bbox_mAP: 0.4670 coco/bbox_mAP_50: 0.6470 coco/bbox_mAP_75: 0.5110 coco/bbox_mAP_s: 0.3110 coco/bbox_mAP_m: 0.5190 coco/bbox_mAP_l: 0.5930 coco/segm_mAP: 0.3090 coco/segm_mAP_50: 0.5580 coco/segm_mAP_75: 0.3050 coco/segm_mAP_s: 0.1690 coco/segm_mAP_m: 0.3500 coco/segm_mAP_l: 0.4670 Bleu_1: 0.7307 Bleu_2: 0.5626 Bleu_3: 0.4206 Bleu_4: 0.3109 METEOR: 0.2565 ROUGE_L: 0.5389 CIDEr: 1.0020 SPICE: 0.1901 aAcc: 82.6300 mIoU: 47.3900 mAcc: 59.3700 visual-grounding/miou: 0.7736 visual-grounding/acc: 0.8463 data_time: 0.0044 time: 1.3546 +2024/01/05 05:31:01 - mmengine - INFO - Iter(train) [200500/640000] base_lr: 1.5580e-04 lr: 1.5982e-05 eta: 7 days, 12:34:39 time: 1.4849 data_time: 0.0232 memory: 25719 grad_norm: 2.9270 loss: 1.3814 detection_loss_cls: 0.0388 detection_loss_reg: 0.3574 caption_loss_cls: 2.3732 grounding_loss_reg: 2.8675 semantic_segmentation_loss_cls: 0.0097 instance_segmentation_loss_cls: 0.0361 instance_segmentation_loss_reg: 0.3487 instance_segmentation_loss_poly: 0.9588 +2024/01/05 05:42:56 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240104_134302 +2024/01/05 05:42:56 - mmengine - INFO - Iter(train) [201000/640000] base_lr: 1.5560e-04 lr: 1.5963e-05 eta: 7 days, 12:17:25 time: 1.4847 data_time: 0.0233 memory: 25719 grad_norm: 2.9320 loss: 1.3870 detection_loss_cls: 0.0389 detection_loss_reg: 0.3569 caption_loss_cls: 2.3718 grounding_loss_reg: 2.8674 semantic_segmentation_loss_cls: 0.0098 instance_segmentation_loss_cls: 0.0362 instance_segmentation_loss_reg: 0.3503 instance_segmentation_loss_poly: 0.9615 +2024/01/05 05:55:30 - mmengine - INFO - Iter(train) [201500/640000] base_lr: 1.5539e-04 lr: 1.5945e-05 eta: 7 days, 12:07:54 time: 1.4933 data_time: 0.0235 memory: 25719 grad_norm: 2.8807 loss: 1.3853 detection_loss_cls: 0.0388 detection_loss_reg: 0.3568 caption_loss_cls: 2.3767 grounding_loss_reg: 2.8667 semantic_segmentation_loss_cls: 0.0098 instance_segmentation_loss_cls: 0.0362 instance_segmentation_loss_reg: 0.3498 instance_segmentation_loss_poly: 0.9613 +2024/01/05 06:07:34 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240104_134302 +2024/01/05 06:07:34 - mmengine - INFO - Iter(train) [202000/640000] base_lr: 1.5519e-04 lr: 1.5926e-05 eta: 7 days, 11:52:31 time: 1.4898 data_time: 0.0235 memory: 25719 grad_norm: 2.8770 loss: 1.3947 detection_loss_cls: 0.0388 detection_loss_reg: 0.3576 caption_loss_cls: 2.3700 grounding_loss_reg: 2.8674 semantic_segmentation_loss_cls: 0.0098 instance_segmentation_loss_cls: 0.0360 instance_segmentation_loss_reg: 0.3488 instance_segmentation_loss_poly: 0.9591 +2024/01/05 06:07:34 - mmengine - INFO - Saving checkpoint at 202000 iterations +2024/01/05 06:20:43 - mmengine - INFO - Iter(train) [202500/640000] base_lr: 1.5499e-04 lr: 1.5908e-05 eta: 7 days, 11:49:35 time: 1.4996 data_time: 0.0238 memory: 25719 grad_norm: 2.8132 loss: 1.3909 detection_loss_cls: 0.0388 detection_loss_reg: 0.3575 caption_loss_cls: 2.3667 grounding_loss_reg: 2.8654 semantic_segmentation_loss_cls: 0.0097 instance_segmentation_loss_cls: 0.0361 instance_segmentation_loss_reg: 0.3503 instance_segmentation_loss_poly: 0.9616 +2024/01/05 06:32:58 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240104_134302 +2024/01/05 06:32:58 - mmengine - INFO - Iter(train) [203000/640000] base_lr: 1.5478e-04 lr: 1.5889e-05 eta: 7 days, 11:36:14 time: 1.4966 data_time: 0.0238 memory: 25719 grad_norm: 2.7920 loss: 1.3977 detection_loss_cls: 0.0388 detection_loss_reg: 0.3575 caption_loss_cls: 2.3657 grounding_loss_reg: 2.8613 semantic_segmentation_loss_cls: 0.0097 instance_segmentation_loss_cls: 0.0359 instance_segmentation_loss_reg: 0.3487 instance_segmentation_loss_poly: 0.9588 +2024/01/05 06:45:20 - mmengine - INFO - Iter(train) [203500/640000] base_lr: 1.5458e-04 lr: 1.5871e-05 eta: 7 days, 11:24:22 time: 1.4818 data_time: 0.0235 memory: 25719 grad_norm: 2.8125 loss: 1.3983 detection_loss_cls: 0.0389 detection_loss_reg: 0.3579 caption_loss_cls: 2.3679 grounding_loss_reg: 2.8621 semantic_segmentation_loss_cls: 0.0097 instance_segmentation_loss_cls: 0.0360 instance_segmentation_loss_reg: 0.3498 instance_segmentation_loss_poly: 0.9603 +2024/01/05 06:57:57 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240104_134302 +2024/01/05 06:57:57 - mmengine - INFO - Iter(train) [204000/640000] base_lr: 1.5438e-04 lr: 1.5852e-05 eta: 7 days, 11:15:03 time: 1.4788 data_time: 0.0233 memory: 25719 grad_norm: 2.7699 loss: 1.3941 detection_loss_cls: 0.0387 detection_loss_reg: 0.3576 caption_loss_cls: 2.3723 grounding_loss_reg: 2.8615 semantic_segmentation_loss_cls: 0.0097 instance_segmentation_loss_cls: 0.0360 instance_segmentation_loss_reg: 0.3502 instance_segmentation_loss_poly: 0.9611 +2024/01/05 06:57:57 - mmengine - INFO - Saving checkpoint at 204000 iterations +2024/01/05 07:10:53 - mmengine - INFO - Iter(train) [204500/640000] base_lr: 1.5417e-04 lr: 1.5834e-05 eta: 7 days, 11:09:16 time: 1.4976 data_time: 0.0277 memory: 25719 grad_norm: 2.7485 loss: 1.3897 detection_loss_cls: 0.0387 detection_loss_reg: 0.3580 caption_loss_cls: 2.3708 grounding_loss_reg: 2.8616 semantic_segmentation_loss_cls: 0.0097 instance_segmentation_loss_cls: 0.0359 instance_segmentation_loss_reg: 0.3492 instance_segmentation_loss_poly: 0.9595 +2024/01/05 07:23:36 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240104_134302 +2024/01/05 07:23:36 - mmengine - INFO - Iter(train) [205000/640000] base_lr: 1.5397e-04 lr: 1.5815e-05 eta: 7 days, 11:00:44 time: 1.5094 data_time: 0.0278 memory: 25719 grad_norm: 2.7029 loss: 1.3706 detection_loss_cls: 0.0387 detection_loss_reg: 0.3578 caption_loss_cls: 2.3669 grounding_loss_reg: 2.8618 semantic_segmentation_loss_cls: 0.0097 instance_segmentation_loss_cls: 0.0360 instance_segmentation_loss_reg: 0.3505 instance_segmentation_loss_poly: 0.9606 +2024/01/05 07:35:50 - mmengine - INFO - Iter(train) [205500/640000] base_lr: 1.5376e-04 lr: 1.5796e-05 eta: 7 days, 10:47:10 time: 1.5044 data_time: 0.0277 memory: 25719 grad_norm: 2.7291 loss: 1.3768 detection_loss_cls: 0.0385 detection_loss_reg: 0.3576 caption_loss_cls: 2.3682 grounding_loss_reg: 2.8634 semantic_segmentation_loss_cls: 0.0097 instance_segmentation_loss_cls: 0.0358 instance_segmentation_loss_reg: 0.3492 instance_segmentation_loss_poly: 0.9579 +2024/01/05 07:48:10 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240104_134302 +2024/01/05 07:48:10 - mmengine - INFO - Iter(train) [206000/640000] base_lr: 1.5355e-04 lr: 1.5778e-05 eta: 7 days, 10:34:44 time: 1.5086 data_time: 0.0278 memory: 25719 grad_norm: 2.7162 loss: 1.3648 detection_loss_cls: 0.0385 detection_loss_reg: 0.3575 caption_loss_cls: 2.3672 grounding_loss_reg: 2.8608 semantic_segmentation_loss_cls: 0.0098 instance_segmentation_loss_cls: 0.0359 instance_segmentation_loss_reg: 0.3503 instance_segmentation_loss_poly: 0.9598 +2024/01/05 07:48:10 - mmengine - INFO - Saving checkpoint at 206000 iterations +2024/01/05 08:01:06 - mmengine - INFO - Iter(train) [206500/640000] base_lr: 1.5335e-04 lr: 1.5759e-05 eta: 7 days, 10:28:26 time: 1.5054 data_time: 0.0275 memory: 25719 grad_norm: 2.7744 loss: 1.3647 detection_loss_cls: 0.0384 detection_loss_reg: 0.3567 caption_loss_cls: 2.3676 grounding_loss_reg: 2.8624 semantic_segmentation_loss_cls: 0.0098 instance_segmentation_loss_cls: 0.0356 instance_segmentation_loss_reg: 0.3476 instance_segmentation_loss_poly: 0.9547 +2024/01/05 08:13:17 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240104_134302 +2024/01/05 08:13:17 - mmengine - INFO - Iter(train) [207000/640000] base_lr: 1.5314e-04 lr: 1.5740e-05 eta: 7 days, 10:14:13 time: 1.5043 data_time: 0.0275 memory: 25719 grad_norm: 2.7899 loss: 1.3621 detection_loss_cls: 0.0383 detection_loss_reg: 0.3563 caption_loss_cls: 2.3666 grounding_loss_reg: 2.8594 semantic_segmentation_loss_cls: 0.0098 instance_segmentation_loss_cls: 0.0356 instance_segmentation_loss_reg: 0.3474 instance_segmentation_loss_poly: 0.9542 +2024/01/05 08:25:49 - mmengine - INFO - Iter(train) [207500/640000] base_lr: 1.5293e-04 lr: 1.5721e-05 eta: 7 days, 10:03:44 time: 1.5068 data_time: 0.0275 memory: 25719 grad_norm: 2.7668 loss: 1.3609 detection_loss_cls: 0.0383 detection_loss_reg: 0.3564 caption_loss_cls: 2.3665 grounding_loss_reg: 2.8588 semantic_segmentation_loss_cls: 0.0098 instance_segmentation_loss_cls: 0.0355 instance_segmentation_loss_reg: 0.3473 instance_segmentation_loss_poly: 0.9539 +2024/01/05 08:37:35 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240104_134302 +2024/01/05 08:37:35 - mmengine - INFO - Iter(train) [208000/640000] base_lr: 1.5273e-04 lr: 1.5703e-05 eta: 7 days, 9:45:40 time: 1.4942 data_time: 0.0273 memory: 25719 grad_norm: 2.8699 loss: 1.3786 detection_loss_cls: 0.0383 detection_loss_reg: 0.3562 caption_loss_cls: 2.3638 grounding_loss_reg: 2.8581 semantic_segmentation_loss_cls: 0.0098 instance_segmentation_loss_cls: 0.0355 instance_segmentation_loss_reg: 0.3474 instance_segmentation_loss_poly: 0.9532 +2024/01/05 08:37:35 - mmengine - INFO - Saving checkpoint at 208000 iterations +2024/01/05 08:51:14 - mmengine - INFO - Iter(train) [208500/640000] base_lr: 1.5252e-04 lr: 1.5684e-05 eta: 7 days, 9:45:52 time: 1.5047 data_time: 0.0275 memory: 25719 grad_norm: 2.8496 loss: 1.3660 detection_loss_cls: 0.0384 detection_loss_reg: 0.3568 caption_loss_cls: 2.3593 grounding_loss_reg: 2.8561 semantic_segmentation_loss_cls: 0.0098 instance_segmentation_loss_cls: 0.0356 instance_segmentation_loss_reg: 0.3475 instance_segmentation_loss_poly: 0.9519 +2024/01/05 09:04:09 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240104_134302 +2024/01/05 09:04:09 - mmengine - INFO - Iter(train) [209000/640000] base_lr: 1.5231e-04 lr: 1.5665e-05 eta: 7 days, 9:38:47 time: 1.5078 data_time: 0.0276 memory: 25719 grad_norm: 2.8567 loss: 1.3745 detection_loss_cls: 0.0384 detection_loss_reg: 0.3575 caption_loss_cls: 2.3606 grounding_loss_reg: 2.8517 semantic_segmentation_loss_cls: 0.0098 instance_segmentation_loss_cls: 0.0356 instance_segmentation_loss_reg: 0.3473 instance_segmentation_loss_poly: 0.9504 +2024/01/05 09:16:17 - mmengine - INFO - Iter(train) [209500/640000] base_lr: 1.5210e-04 lr: 1.5646e-05 eta: 7 days, 9:24:12 time: 1.5063 data_time: 0.0275 memory: 25719 grad_norm: 2.8979 loss: 1.3644 detection_loss_cls: 0.0383 detection_loss_reg: 0.3560 caption_loss_cls: 2.3564 grounding_loss_reg: 2.8523 semantic_segmentation_loss_cls: 0.0098 instance_segmentation_loss_cls: 0.0354 instance_segmentation_loss_reg: 0.3463 instance_segmentation_loss_poly: 0.9475 +2024/01/05 09:28:44 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240104_134302 +2024/01/05 09:28:44 - mmengine - INFO - Iter(train) [210000/640000] base_lr: 1.5190e-04 lr: 1.5627e-05 eta: 7 days, 9:12:45 time: 1.5082 data_time: 0.0276 memory: 25719 grad_norm: 2.9685 loss: 1.3706 detection_loss_cls: 0.0383 detection_loss_reg: 0.3550 caption_loss_cls: 2.3577 grounding_loss_reg: 2.8470 semantic_segmentation_loss_cls: 0.0098 instance_segmentation_loss_cls: 0.0355 instance_segmentation_loss_reg: 0.3464 instance_segmentation_loss_poly: 0.9474 +2024/01/05 09:28:44 - mmengine - INFO - Saving checkpoint at 210000 iterations +2024/01/05 09:41:01 - mmengine - INFO - Iter(train) [210500/640000] base_lr: 1.5169e-04 lr: 1.5608e-05 eta: 7 days, 8:59:32 time: 1.4982 data_time: 0.0275 memory: 25719 grad_norm: 3.0756 loss: 1.3757 detection_loss_cls: 0.0383 detection_loss_reg: 0.3547 caption_loss_cls: 2.3519 grounding_loss_reg: 2.8424 semantic_segmentation_loss_cls: 0.0098 instance_segmentation_loss_cls: 0.0355 instance_segmentation_loss_reg: 0.3464 instance_segmentation_loss_poly: 0.9474 +2024/01/05 09:53:46 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240104_134302 +2024/01/05 09:53:46 - mmengine - INFO - Iter(train) [211000/640000] base_lr: 1.5148e-04 lr: 1.5589e-05 eta: 7 days, 8:50:37 time: 1.5068 data_time: 0.0276 memory: 25719 grad_norm: 3.1013 loss: 1.3707 detection_loss_cls: 0.0382 detection_loss_reg: 0.3553 caption_loss_cls: 2.3532 grounding_loss_reg: 2.8439 semantic_segmentation_loss_cls: 0.0098 instance_segmentation_loss_cls: 0.0358 instance_segmentation_loss_reg: 0.3481 instance_segmentation_loss_poly: 0.9507 +2024/01/05 10:05:34 - mmengine - INFO - Iter(train) [211500/640000] base_lr: 1.5127e-04 lr: 1.5570e-05 eta: 7 days, 8:33:08 time: 1.4958 data_time: 0.0274 memory: 25719 grad_norm: 3.2096 loss: 1.3817 detection_loss_cls: 0.0383 detection_loss_reg: 0.3559 caption_loss_cls: 2.3576 grounding_loss_reg: 2.8468 semantic_segmentation_loss_cls: 0.0097 instance_segmentation_loss_cls: 0.0359 instance_segmentation_loss_reg: 0.3490 instance_segmentation_loss_poly: 0.9519 +2024/01/05 10:17:39 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240104_134302 +2024/01/05 10:17:39 - mmengine - INFO - Iter(train) [212000/640000] base_lr: 1.5106e-04 lr: 1.5551e-05 eta: 7 days, 8:18:15 time: 1.5004 data_time: 0.0274 memory: 25719 grad_norm: 3.2195 loss: 1.3707 detection_loss_cls: 0.0383 detection_loss_reg: 0.3564 caption_loss_cls: 2.3524 grounding_loss_reg: 2.8499 semantic_segmentation_loss_cls: 0.0097 instance_segmentation_loss_cls: 0.0357 instance_segmentation_loss_reg: 0.3484 instance_segmentation_loss_poly: 0.9513 +2024/01/05 10:17:39 - mmengine - INFO - Saving checkpoint at 212000 iterations +2024/01/05 10:30:12 - mmengine - INFO - Iter(train) [212500/640000] base_lr: 1.5085e-04 lr: 1.5532e-05 eta: 7 days, 8:07:36 time: 1.4841 data_time: 0.0271 memory: 25719 grad_norm: 3.2631 loss: 1.3791 detection_loss_cls: 0.0383 detection_loss_reg: 0.3565 caption_loss_cls: 2.3478 grounding_loss_reg: 2.8456 semantic_segmentation_loss_cls: 0.0097 instance_segmentation_loss_cls: 0.0357 instance_segmentation_loss_reg: 0.3479 instance_segmentation_loss_poly: 0.9503 +2024/01/05 10:42:58 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240104_134302 +2024/01/05 10:42:58 - mmengine - INFO - Iter(train) [213000/640000] base_lr: 1.5064e-04 lr: 1.5513e-05 eta: 7 days, 7:58:46 time: 1.4819 data_time: 0.0271 memory: 25719 grad_norm: 3.3120 loss: 1.3799 detection_loss_cls: 0.0382 detection_loss_reg: 0.3556 caption_loss_cls: 2.3472 grounding_loss_reg: 2.8448 semantic_segmentation_loss_cls: 0.0097 instance_segmentation_loss_cls: 0.0357 instance_segmentation_loss_reg: 0.3470 instance_segmentation_loss_poly: 0.9478 +2024/01/05 10:55:26 - mmengine - INFO - Iter(train) [213500/640000] base_lr: 1.5043e-04 lr: 1.5494e-05 eta: 7 days, 7:47:11 time: 1.4868 data_time: 0.0272 memory: 25719 grad_norm: 3.2620 loss: 1.3729 detection_loss_cls: 0.0382 detection_loss_reg: 0.3552 caption_loss_cls: 2.3488 grounding_loss_reg: 2.8421 semantic_segmentation_loss_cls: 0.0097 instance_segmentation_loss_cls: 0.0354 instance_segmentation_loss_reg: 0.3456 instance_segmentation_loss_poly: 0.9437 +2024/01/05 11:07:42 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240104_134302 +2024/01/05 11:07:42 - mmengine - INFO - Iter(train) [214000/640000] base_lr: 1.5022e-04 lr: 1.5475e-05 eta: 7 days, 7:34:06 time: 1.4841 data_time: 0.0271 memory: 25719 grad_norm: 3.3082 loss: 1.3727 detection_loss_cls: 0.0382 detection_loss_reg: 0.3549 caption_loss_cls: 2.3475 grounding_loss_reg: 2.8397 semantic_segmentation_loss_cls: 0.0097 instance_segmentation_loss_cls: 0.0353 instance_segmentation_loss_reg: 0.3449 instance_segmentation_loss_poly: 0.9424 +2024/01/05 11:07:42 - mmengine - INFO - Saving checkpoint at 214000 iterations +2024/01/05 11:20:19 - mmengine - INFO - Iter(train) [214500/640000] base_lr: 1.5001e-04 lr: 1.5455e-05 eta: 7 days, 7:23:44 time: 1.4891 data_time: 0.0273 memory: 25719 grad_norm: 3.2055 loss: 1.3690 detection_loss_cls: 0.0381 detection_loss_reg: 0.3546 caption_loss_cls: 2.3485 grounding_loss_reg: 2.8410 semantic_segmentation_loss_cls: 0.0097 instance_segmentation_loss_cls: 0.0353 instance_segmentation_loss_reg: 0.3455 instance_segmentation_loss_poly: 0.9437 +2024/01/05 11:32:31 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240104_134302 +2024/01/05 11:32:31 - mmengine - INFO - Iter(train) [215000/640000] base_lr: 1.4980e-04 lr: 1.5436e-05 eta: 7 days, 7:09:58 time: 1.4809 data_time: 0.0271 memory: 25719 grad_norm: 3.1676 loss: 1.3649 detection_loss_cls: 0.0379 detection_loss_reg: 0.3533 caption_loss_cls: 2.3447 grounding_loss_reg: 2.8427 semantic_segmentation_loss_cls: 0.0097 instance_segmentation_loss_cls: 0.0354 instance_segmentation_loss_reg: 0.3463 instance_segmentation_loss_poly: 0.9446 +2024/01/05 11:44:27 - mmengine - INFO - Iter(train) [215500/640000] base_lr: 1.4959e-04 lr: 1.5417e-05 eta: 7 days, 6:54:03 time: 1.4829 data_time: 0.0271 memory: 25719 grad_norm: 3.3371 loss: 1.3545 detection_loss_cls: 0.0379 detection_loss_reg: 0.3530 caption_loss_cls: 2.3431 grounding_loss_reg: 2.8454 semantic_segmentation_loss_cls: 0.0097 instance_segmentation_loss_cls: 0.0354 instance_segmentation_loss_reg: 0.3459 instance_segmentation_loss_poly: 0.9429 +2024/01/05 11:56:40 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240104_134302 +2024/01/05 11:56:40 - mmengine - INFO - Iter(train) [216000/640000] base_lr: 1.4937e-04 lr: 1.5398e-05 eta: 7 days, 6:40:27 time: 1.4849 data_time: 0.0272 memory: 25719 grad_norm: 3.5695 loss: 1.3502 detection_loss_cls: 0.0379 detection_loss_reg: 0.3529 caption_loss_cls: 2.3446 grounding_loss_reg: 2.8433 semantic_segmentation_loss_cls: 0.0097 instance_segmentation_loss_cls: 0.0354 instance_segmentation_loss_reg: 0.3459 instance_segmentation_loss_poly: 0.9429 +2024/01/05 11:56:40 - mmengine - INFO - Saving checkpoint at 216000 iterations +2024/01/05 12:09:32 - mmengine - INFO - Iter(train) [216500/640000] base_lr: 1.4916e-04 lr: 1.5378e-05 eta: 7 days, 6:32:08 time: 1.4895 data_time: 0.0272 memory: 25719 grad_norm: 3.6671 loss: 1.3470 detection_loss_cls: 0.0379 detection_loss_reg: 0.3533 caption_loss_cls: 2.3412 grounding_loss_reg: 2.8393 semantic_segmentation_loss_cls: 0.0097 instance_segmentation_loss_cls: 0.0353 instance_segmentation_loss_reg: 0.3459 instance_segmentation_loss_poly: 0.9428 +2024/01/05 12:22:00 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240104_134302 +2024/01/05 12:22:00 - mmengine - INFO - Iter(train) [217000/640000] base_lr: 1.4895e-04 lr: 1.5359e-05 eta: 7 days, 6:20:39 time: 1.4852 data_time: 0.0270 memory: 25719 grad_norm: 3.6534 loss: 1.3422 detection_loss_cls: 0.0379 detection_loss_reg: 0.3537 caption_loss_cls: 2.3376 grounding_loss_reg: 2.8396 semantic_segmentation_loss_cls: 0.0097 instance_segmentation_loss_cls: 0.0354 instance_segmentation_loss_reg: 0.3463 instance_segmentation_loss_poly: 0.9440 +2024/01/05 12:33:57 - mmengine - INFO - Iter(train) [217500/640000] base_lr: 1.4874e-04 lr: 1.5340e-05 eta: 7 days, 6:04:52 time: 1.4773 data_time: 0.0267 memory: 25719 grad_norm: 3.6683 loss: 1.3340 detection_loss_cls: 0.0378 detection_loss_reg: 0.3524 caption_loss_cls: 2.3354 grounding_loss_reg: 2.8359 semantic_segmentation_loss_cls: 0.0097 instance_segmentation_loss_cls: 0.0353 instance_segmentation_loss_reg: 0.3457 instance_segmentation_loss_poly: 0.9416 +2024/01/05 12:46:24 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240104_134302 +2024/01/05 12:46:24 - mmengine - INFO - Iter(train) [218000/640000] base_lr: 1.4852e-04 lr: 1.5320e-05 eta: 7 days, 5:53:11 time: 1.4798 data_time: 0.0267 memory: 25719 grad_norm: 3.6144 loss: 1.3314 detection_loss_cls: 0.0378 detection_loss_reg: 0.3534 caption_loss_cls: 2.3323 grounding_loss_reg: 2.8324 semantic_segmentation_loss_cls: 0.0097 instance_segmentation_loss_cls: 0.0351 instance_segmentation_loss_reg: 0.3446 instance_segmentation_loss_poly: 0.9398 +2024/01/05 12:46:24 - mmengine - INFO - Saving checkpoint at 218000 iterations +2024/01/05 12:58:38 - mmengine - INFO - Iter(train) [218500/640000] base_lr: 1.4831e-04 lr: 1.5301e-05 eta: 7 days, 5:39:52 time: 1.4744 data_time: 0.0266 memory: 25719 grad_norm: 3.6346 loss: 1.3398 detection_loss_cls: 0.0377 detection_loss_reg: 0.3528 caption_loss_cls: 2.3336 grounding_loss_reg: 2.8340 semantic_segmentation_loss_cls: 0.0097 instance_segmentation_loss_cls: 0.0352 instance_segmentation_loss_reg: 0.3455 instance_segmentation_loss_poly: 0.9412 +2024/01/05 13:11:23 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240104_134302 +2024/01/05 13:11:23 - mmengine - INFO - Iter(train) [219000/640000] base_lr: 1.4810e-04 lr: 1.5282e-05 eta: 7 days, 5:30:27 time: 1.4826 data_time: 0.0268 memory: 25719 grad_norm: 3.6810 loss: 1.3380 detection_loss_cls: 0.0377 detection_loss_reg: 0.3519 caption_loss_cls: 2.3286 grounding_loss_reg: 2.8360 semantic_segmentation_loss_cls: 0.0097 instance_segmentation_loss_cls: 0.0350 instance_segmentation_loss_reg: 0.3452 instance_segmentation_loss_poly: 0.9418 +2024/01/05 13:24:04 - mmengine - INFO - Iter(train) [219500/640000] base_lr: 1.4788e-04 lr: 1.5262e-05 eta: 7 days, 5:20:30 time: 1.4938 data_time: 0.0271 memory: 25719 grad_norm: 3.4941 loss: 1.3303 detection_loss_cls: 0.0376 detection_loss_reg: 0.3519 caption_loss_cls: 2.3249 grounding_loss_reg: 2.8329 semantic_segmentation_loss_cls: 0.0097 instance_segmentation_loss_cls: 0.0349 instance_segmentation_loss_reg: 0.3429 instance_segmentation_loss_poly: 0.9374 +2024/01/05 13:36:32 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240104_134302 +2024/01/05 13:36:32 - mmengine - INFO - Iter(train) [220000/640000] base_lr: 1.4767e-04 lr: 1.5243e-05 eta: 7 days, 5:08:52 time: 1.4977 data_time: 0.0270 memory: 25719 grad_norm: 3.2121 loss: 1.3212 detection_loss_cls: 0.0377 detection_loss_reg: 0.3524 caption_loss_cls: 2.3236 grounding_loss_reg: 2.8279 semantic_segmentation_loss_cls: 0.0097 instance_segmentation_loss_cls: 0.0347 instance_segmentation_loss_reg: 0.3420 instance_segmentation_loss_poly: 0.9358 +2024/01/05 13:36:32 - mmengine - INFO - Saving checkpoint at 220000 iterations +2024/01/05 14:08:44 - mmengine - INFO - Iter(train) [220500/640000] base_lr: 1.4745e-04 lr: 1.5223e-05 eta: 7 days, 2:33:56 time: 1.4877 data_time: 0.0218 memory: 25720 grad_norm: 3.1761 loss: 1.3196 detection_loss_cls: 0.0374 detection_loss_reg: 0.3500 caption_loss_cls: 2.3254 grounding_loss_reg: 2.8228 semantic_segmentation_loss_cls: 0.0097 instance_segmentation_loss_cls: 0.0345 instance_segmentation_loss_reg: 0.3401 instance_segmentation_loss_poly: 0.9314 +2024/01/05 14:21:11 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240105_135304 +2024/01/05 14:21:11 - mmengine - INFO - Iter(train) [221000/640000] base_lr: 1.4724e-04 lr: 1.5204e-05 eta: 7 days, 4:06:03 time: 1.4873 data_time: 0.0217 memory: 25717 grad_norm: 3.2891 loss: 1.3356 detection_loss_cls: 0.0373 detection_loss_reg: 0.3500 caption_loss_cls: 2.3268 grounding_loss_reg: 2.8247 semantic_segmentation_loss_cls: 0.0097 instance_segmentation_loss_cls: 0.0347 instance_segmentation_loss_reg: 0.3414 instance_segmentation_loss_poly: 0.9336 +2024/01/05 14:33:23 - mmengine - INFO - Iter(train) [221500/640000] base_lr: 1.4702e-04 lr: 1.5184e-05 eta: 7 days, 3:15:48 time: 1.4911 data_time: 0.0215 memory: 25717 grad_norm: 3.4301 loss: 1.3417 detection_loss_cls: 0.0374 detection_loss_reg: 0.3516 caption_loss_cls: 2.3198 grounding_loss_reg: 2.8222 semantic_segmentation_loss_cls: 0.0097 instance_segmentation_loss_cls: 0.0348 instance_segmentation_loss_reg: 0.3423 instance_segmentation_loss_poly: 0.9343 +2024/01/05 14:45:31 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240105_135304 +2024/01/05 14:45:31 - mmengine - INFO - Iter(train) [222000/640000] base_lr: 1.4681e-04 lr: 1.5164e-05 eta: 7 days, 2:33:00 time: 1.4864 data_time: 0.0212 memory: 25717 grad_norm: 3.5696 loss: 1.3454 detection_loss_cls: 0.0373 detection_loss_reg: 0.3510 caption_loss_cls: 2.3203 grounding_loss_reg: 2.8224 semantic_segmentation_loss_cls: 0.0097 instance_segmentation_loss_cls: 0.0347 instance_segmentation_loss_reg: 0.3419 instance_segmentation_loss_poly: 0.9329 +2024/01/05 14:45:31 - mmengine - INFO - Saving checkpoint at 222000 iterations +2024/01/05 14:58:10 - mmengine - INFO - Iter(train) [222500/640000] base_lr: 1.4659e-04 lr: 1.5145e-05 eta: 7 days, 3:29:42 time: 1.4926 data_time: 0.0208 memory: 25717 grad_norm: 3.6650 loss: 1.3442 detection_loss_cls: 0.0371 detection_loss_reg: 0.3504 caption_loss_cls: 2.3249 grounding_loss_reg: 2.8189 semantic_segmentation_loss_cls: 0.0097 instance_segmentation_loss_cls: 0.0347 instance_segmentation_loss_reg: 0.3417 instance_segmentation_loss_poly: 0.9326 +2024/01/05 15:10:21 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240105_135304 +2024/01/05 15:10:21 - mmengine - INFO - Iter(train) [223000/640000] base_lr: 1.4638e-04 lr: 1.5125e-05 eta: 7 days, 2:57:18 time: 1.4841 data_time: 0.0203 memory: 25717 grad_norm: 3.6664 loss: 1.3489 detection_loss_cls: 0.0370 detection_loss_reg: 0.3499 caption_loss_cls: 2.3206 grounding_loss_reg: 2.8169 semantic_segmentation_loss_cls: 0.0097 instance_segmentation_loss_cls: 0.0345 instance_segmentation_loss_reg: 0.3412 instance_segmentation_loss_poly: 0.9313 +2024/01/05 15:22:21 - mmengine - INFO - Iter(train) [223500/640000] base_lr: 1.4616e-04 lr: 1.5106e-05 eta: 7 days, 2:09:33 time: 1.4739 data_time: 0.0199 memory: 25717 grad_norm: 3.6495 loss: 1.3573 detection_loss_cls: 0.0368 detection_loss_reg: 0.3491 caption_loss_cls: 2.3168 grounding_loss_reg: 2.8167 semantic_segmentation_loss_cls: 0.0097 instance_segmentation_loss_cls: 0.0346 instance_segmentation_loss_reg: 0.3413 instance_segmentation_loss_poly: 0.9317 +2024/01/05 15:34:55 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240105_135304 +2024/01/05 15:34:55 - mmengine - INFO - Iter(train) [224000/640000] base_lr: 1.4595e-04 lr: 1.5086e-05 eta: 7 days, 2:28:53 time: 1.4753 data_time: 0.0196 memory: 25717 grad_norm: 3.6482 loss: 1.3630 detection_loss_cls: 0.0368 detection_loss_reg: 0.3491 caption_loss_cls: 2.3122 grounding_loss_reg: 2.8150 semantic_segmentation_loss_cls: 0.0096 instance_segmentation_loss_cls: 0.0345 instance_segmentation_loss_reg: 0.3408 instance_segmentation_loss_poly: 0.9301 +2024/01/05 15:34:55 - mmengine - INFO - Saving checkpoint at 224000 iterations +2024/01/05 15:46:39 - mmengine - INFO - Iter(train) [224500/640000] base_lr: 1.4573e-04 lr: 1.5066e-05 eta: 7 days, 1:24:07 time: 1.4682 data_time: 0.0237 memory: 25717 grad_norm: 3.7444 loss: 1.3815 detection_loss_cls: 0.0369 detection_loss_reg: 0.3498 caption_loss_cls: 2.3078 grounding_loss_reg: 2.8161 semantic_segmentation_loss_cls: 0.0096 instance_segmentation_loss_cls: 0.0346 instance_segmentation_loss_reg: 0.3413 instance_segmentation_loss_poly: 0.9311 +2024/01/05 15:59:19 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240105_135304 +2024/01/05 15:59:19 - mmengine - INFO - Iter(train) [225000/640000] base_lr: 1.4551e-04 lr: 1.5047e-05 eta: 7 days, 1:47:43 time: 1.4715 data_time: 0.0237 memory: 25717 grad_norm: 3.6491 loss: 1.3591 detection_loss_cls: 0.0368 detection_loss_reg: 0.3481 caption_loss_cls: 2.3080 grounding_loss_reg: 2.8106 semantic_segmentation_loss_cls: 0.0096 instance_segmentation_loss_cls: 0.0346 instance_segmentation_loss_reg: 0.3408 instance_segmentation_loss_poly: 0.9303 +2024/01/05 16:11:29 - mmengine - INFO - Iter(train) [225500/640000] base_lr: 1.4529e-04 lr: 1.5027e-05 eta: 7 days, 1:27:55 time: 1.4713 data_time: 0.0239 memory: 25717 grad_norm: 3.5265 loss: 1.3681 detection_loss_cls: 0.0368 detection_loss_reg: 0.3493 caption_loss_cls: 2.3040 grounding_loss_reg: 2.8090 semantic_segmentation_loss_cls: 0.0095 instance_segmentation_loss_cls: 0.0345 instance_segmentation_loss_reg: 0.3415 instance_segmentation_loss_poly: 0.9318 +2024/01/05 16:23:41 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240105_135304 +2024/01/05 16:23:41 - mmengine - INFO - Iter(train) [226000/640000] base_lr: 1.4508e-04 lr: 1.5007e-05 eta: 7 days, 1:10:03 time: 1.4721 data_time: 0.0241 memory: 25717 grad_norm: 3.3726 loss: 1.3734 detection_loss_cls: 0.0368 detection_loss_reg: 0.3500 caption_loss_cls: 2.3026 grounding_loss_reg: 2.8067 semantic_segmentation_loss_cls: 0.0095 instance_segmentation_loss_cls: 0.0346 instance_segmentation_loss_reg: 0.3421 instance_segmentation_loss_poly: 0.9332 +2024/01/05 16:23:41 - mmengine - INFO - Saving checkpoint at 226000 iterations +2024/01/05 16:35:34 - mmengine - INFO - Iter(train) [226500/640000] base_lr: 1.4486e-04 lr: 1.4987e-05 eta: 7 days, 0:34:30 time: 1.4607 data_time: 0.0236 memory: 25717 grad_norm: 3.2766 loss: 1.3697 detection_loss_cls: 0.0369 detection_loss_reg: 0.3505 caption_loss_cls: 2.3004 grounding_loss_reg: 2.8016 semantic_segmentation_loss_cls: 0.0095 instance_segmentation_loss_cls: 0.0348 instance_segmentation_loss_reg: 0.3436 instance_segmentation_loss_poly: 0.9367 +2024/01/05 16:47:35 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240105_135304 +2024/01/05 16:47:35 - mmengine - INFO - Iter(train) [227000/640000] base_lr: 1.4464e-04 lr: 1.4967e-05 eta: 7 days, 0:09:20 time: 1.4582 data_time: 0.0235 memory: 25717 grad_norm: 3.2633 loss: 1.3672 detection_loss_cls: 0.0369 detection_loss_reg: 0.3506 caption_loss_cls: 2.2990 grounding_loss_reg: 2.7980 semantic_segmentation_loss_cls: 0.0095 instance_segmentation_loss_cls: 0.0347 instance_segmentation_loss_reg: 0.3433 instance_segmentation_loss_poly: 0.9368 +2024/01/05 16:59:55 - mmengine - INFO - Iter(train) [227500/640000] base_lr: 1.4442e-04 lr: 1.4948e-05 eta: 7 days, 0:03:35 time: 1.4632 data_time: 0.0237 memory: 25717 grad_norm: 3.2232 loss: 1.3679 detection_loss_cls: 0.0368 detection_loss_reg: 0.3502 caption_loss_cls: 2.2985 grounding_loss_reg: 2.7975 semantic_segmentation_loss_cls: 0.0095 instance_segmentation_loss_cls: 0.0347 instance_segmentation_loss_reg: 0.3437 instance_segmentation_loss_poly: 0.9372 +2024/01/05 17:12:07 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240105_135304 +2024/01/05 17:12:07 - mmengine - INFO - Iter(train) [228000/640000] base_lr: 1.4420e-04 lr: 1.4928e-05 eta: 6 days, 23:49:36 time: 1.4576 data_time: 0.0237 memory: 25717 grad_norm: 3.2304 loss: 1.3717 detection_loss_cls: 0.0365 detection_loss_reg: 0.3492 caption_loss_cls: 2.2964 grounding_loss_reg: 2.7912 semantic_segmentation_loss_cls: 0.0095 instance_segmentation_loss_cls: 0.0345 instance_segmentation_loss_reg: 0.3430 instance_segmentation_loss_poly: 0.9356 +2024/01/05 17:12:07 - mmengine - INFO - Saving checkpoint at 228000 iterations +2024/01/05 17:24:29 - mmengine - INFO - Iter(train) [228500/640000] base_lr: 1.4399e-04 lr: 1.4908e-05 eta: 6 days, 23:44:05 time: 1.4671 data_time: 0.0238 memory: 25717 grad_norm: 3.0122 loss: 1.3495 detection_loss_cls: 0.0363 detection_loss_reg: 0.3478 caption_loss_cls: 2.2942 grounding_loss_reg: 2.7899 semantic_segmentation_loss_cls: 0.0095 instance_segmentation_loss_cls: 0.0343 instance_segmentation_loss_reg: 0.3418 instance_segmentation_loss_poly: 0.9330 +2024/01/05 17:36:33 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240105_135304 +2024/01/05 17:36:33 - mmengine - INFO - Iter(train) [229000/640000] base_lr: 1.4377e-04 lr: 1.4888e-05 eta: 6 days, 23:24:20 time: 1.4581 data_time: 0.0237 memory: 25717 grad_norm: 2.9574 loss: 1.3648 detection_loss_cls: 0.0364 detection_loss_reg: 0.3490 caption_loss_cls: 2.2948 grounding_loss_reg: 2.7905 semantic_segmentation_loss_cls: 0.0095 instance_segmentation_loss_cls: 0.0341 instance_segmentation_loss_reg: 0.3413 instance_segmentation_loss_poly: 0.9342 +2024/01/05 17:49:42 - mmengine - INFO - Iter(train) [229500/640000] base_lr: 1.4355e-04 lr: 1.4868e-05 eta: 6 days, 23:52:19 time: 1.4727 data_time: 0.0238 memory: 25717 grad_norm: 2.8598 loss: 1.3437 detection_loss_cls: 0.0363 detection_loss_reg: 0.3492 caption_loss_cls: 2.2921 grounding_loss_reg: 2.7879 semantic_segmentation_loss_cls: 0.0095 instance_segmentation_loss_cls: 0.0341 instance_segmentation_loss_reg: 0.3415 instance_segmentation_loss_poly: 0.9345 +2024/01/05 18:01:54 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240105_135304 +2024/01/05 18:01:54 - mmengine - INFO - Iter(train) [230000/640000] base_lr: 1.4333e-04 lr: 1.4848e-05 eta: 6 days, 23:37:03 time: 1.4729 data_time: 0.0237 memory: 25717 grad_norm: 2.8565 loss: 1.3330 detection_loss_cls: 0.0362 detection_loss_reg: 0.3486 caption_loss_cls: 2.2886 grounding_loss_reg: 2.7900 semantic_segmentation_loss_cls: 0.0094 instance_segmentation_loss_cls: 0.0339 instance_segmentation_loss_reg: 0.3408 instance_segmentation_loss_poly: 0.9328 +2024/01/05 18:01:54 - mmengine - INFO - Saving checkpoint at 230000 iterations +2024/01/05 18:14:58 - mmengine - INFO - Iter(train) [230500/640000] base_lr: 1.4311e-04 lr: 1.4828e-05 eta: 6 days, 23:56:17 time: 1.4906 data_time: 0.0238 memory: 25717 grad_norm: 2.7880 loss: 1.3114 detection_loss_cls: 0.0363 detection_loss_reg: 0.3494 caption_loss_cls: 2.2887 grounding_loss_reg: 2.7884 semantic_segmentation_loss_cls: 0.0094 instance_segmentation_loss_cls: 0.0337 instance_segmentation_loss_reg: 0.3403 instance_segmentation_loss_poly: 0.9310 +2024/01/05 18:27:43 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240105_135304 +2024/01/05 18:27:43 - mmengine - INFO - Iter(train) [231000/640000] base_lr: 1.4289e-04 lr: 1.4808e-05 eta: 7 days, 0:00:22 time: 1.5016 data_time: 0.0241 memory: 25717 grad_norm: 2.7139 loss: 1.3082 detection_loss_cls: 0.0363 detection_loss_reg: 0.3498 caption_loss_cls: 2.2830 grounding_loss_reg: 2.7891 semantic_segmentation_loss_cls: 0.0094 instance_segmentation_loss_cls: 0.0337 instance_segmentation_loss_reg: 0.3405 instance_segmentation_loss_poly: 0.9318 +2024/01/05 18:39:59 - mmengine - INFO - Iter(train) [231500/640000] base_lr: 1.4267e-04 lr: 1.4788e-05 eta: 6 days, 23:45:52 time: 1.5005 data_time: 0.0241 memory: 25717 grad_norm: 2.7085 loss: 1.3073 detection_loss_cls: 0.0363 detection_loss_reg: 0.3504 caption_loss_cls: 2.2758 grounding_loss_reg: 2.7841 semantic_segmentation_loss_cls: 0.0094 instance_segmentation_loss_cls: 0.0337 instance_segmentation_loss_reg: 0.3415 instance_segmentation_loss_poly: 0.9341 +2024/01/05 18:51:19 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240105_135304 +2024/01/05 18:51:19 - mmengine - INFO - Iter(train) [232000/640000] base_lr: 1.4245e-04 lr: 1.4768e-05 eta: 6 days, 22:59:51 time: 1.4876 data_time: 0.0239 memory: 25717 grad_norm: 2.7008 loss: 1.3086 detection_loss_cls: 0.0363 detection_loss_reg: 0.3511 caption_loss_cls: 2.2722 grounding_loss_reg: 2.7822 semantic_segmentation_loss_cls: 0.0093 instance_segmentation_loss_cls: 0.0336 instance_segmentation_loss_reg: 0.3405 instance_segmentation_loss_poly: 0.9323 +2024/01/05 18:51:19 - mmengine - INFO - Saving checkpoint at 232000 iterations +2024/01/05 19:04:00 - mmengine - INFO - Iter(train) [232500/640000] base_lr: 1.4223e-04 lr: 1.4748e-05 eta: 6 days, 23:00:40 time: 1.4925 data_time: 0.0242 memory: 25717 grad_norm: 2.7323 loss: 1.3238 detection_loss_cls: 0.0363 detection_loss_reg: 0.3511 caption_loss_cls: 2.2713 grounding_loss_reg: 2.7788 semantic_segmentation_loss_cls: 0.0093 instance_segmentation_loss_cls: 0.0337 instance_segmentation_loss_reg: 0.3419 instance_segmentation_loss_poly: 0.9341 +2024/01/05 19:15:34 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240105_135304 +2024/01/05 19:15:34 - mmengine - INFO - Iter(train) [233000/640000] base_lr: 1.4201e-04 lr: 1.4728e-05 eta: 6 days, 22:25:24 time: 1.4849 data_time: 0.0241 memory: 25717 grad_norm: 2.7940 loss: 1.3177 detection_loss_cls: 0.0363 detection_loss_reg: 0.3515 caption_loss_cls: 2.2682 grounding_loss_reg: 2.7797 semantic_segmentation_loss_cls: 0.0093 instance_segmentation_loss_cls: 0.0336 instance_segmentation_loss_reg: 0.3425 instance_segmentation_loss_poly: 0.9346 +2024/01/05 19:27:45 - mmengine - INFO - Iter(train) [233500/640000] base_lr: 1.4178e-04 lr: 1.4708e-05 eta: 6 days, 22:10:37 time: 1.4704 data_time: 0.0241 memory: 25717 grad_norm: 2.8734 loss: 1.3332 detection_loss_cls: 0.0363 detection_loss_reg: 0.3521 caption_loss_cls: 2.2612 grounding_loss_reg: 2.7763 semantic_segmentation_loss_cls: 0.0093 instance_segmentation_loss_cls: 0.0336 instance_segmentation_loss_reg: 0.3429 instance_segmentation_loss_poly: 0.9348 +2024/01/05 19:40:17 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240105_135304 +2024/01/05 19:40:17 - mmengine - INFO - Iter(train) [234000/640000] base_lr: 1.4156e-04 lr: 1.4688e-05 eta: 6 days, 22:06:13 time: 1.4755 data_time: 0.0243 memory: 25717 grad_norm: 2.8380 loss: 1.3398 detection_loss_cls: 0.0362 detection_loss_reg: 0.3508 caption_loss_cls: 2.2570 grounding_loss_reg: 2.7743 semantic_segmentation_loss_cls: 0.0093 instance_segmentation_loss_cls: 0.0338 instance_segmentation_loss_reg: 0.3443 instance_segmentation_loss_poly: 0.9380 +2024/01/05 19:40:17 - mmengine - INFO - Saving checkpoint at 234000 iterations +2024/01/05 19:52:28 - mmengine - INFO - Iter(train) [234500/640000] base_lr: 1.4134e-04 lr: 1.4667e-05 eta: 6 days, 21:50:54 time: 1.4619 data_time: 0.0242 memory: 25717 grad_norm: 2.8775 loss: 1.3651 detection_loss_cls: 0.0362 detection_loss_reg: 0.3510 caption_loss_cls: 2.2578 grounding_loss_reg: 2.7725 semantic_segmentation_loss_cls: 0.0093 instance_segmentation_loss_cls: 0.0337 instance_segmentation_loss_reg: 0.3432 instance_segmentation_loss_poly: 0.9352 +2024/01/05 20:04:24 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240105_135304 +2024/01/05 20:04:24 - mmengine - INFO - Iter(train) [235000/640000] base_lr: 1.4112e-04 lr: 1.4647e-05 eta: 6 days, 21:29:47 time: 1.4499 data_time: 0.0240 memory: 25717 grad_norm: 2.9368 loss: 1.3656 detection_loss_cls: 0.0360 detection_loss_reg: 0.3499 caption_loss_cls: 2.2592 grounding_loss_reg: 2.7690 semantic_segmentation_loss_cls: 0.0093 instance_segmentation_loss_cls: 0.0336 instance_segmentation_loss_reg: 0.3420 instance_segmentation_loss_poly: 0.9319 +2024/01/05 20:16:38 - mmengine - INFO - Iter(train) [235500/640000] base_lr: 1.4090e-04 lr: 1.4627e-05 eta: 6 days, 21:16:44 time: 1.4494 data_time: 0.0239 memory: 25717 grad_norm: 2.9463 loss: 1.3652 detection_loss_cls: 0.0360 detection_loss_reg: 0.3495 caption_loss_cls: 2.2591 grounding_loss_reg: 2.7670 semantic_segmentation_loss_cls: 0.0093 instance_segmentation_loss_cls: 0.0336 instance_segmentation_loss_reg: 0.3415 instance_segmentation_loss_poly: 0.9315 +2024/01/05 20:28:57 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240105_135304 +2024/01/05 20:28:57 - mmengine - INFO - Iter(train) [236000/640000] base_lr: 1.4067e-04 lr: 1.4607e-05 eta: 6 days, 21:05:36 time: 1.4640 data_time: 0.0240 memory: 25717 grad_norm: 2.9471 loss: 1.3590 detection_loss_cls: 0.0359 detection_loss_reg: 0.3488 caption_loss_cls: 2.2600 grounding_loss_reg: 2.7648 semantic_segmentation_loss_cls: 0.0093 instance_segmentation_loss_cls: 0.0336 instance_segmentation_loss_reg: 0.3416 instance_segmentation_loss_poly: 0.9324 +2024/01/05 20:28:57 - mmengine - INFO - Saving checkpoint at 236000 iterations +2024/01/05 20:41:13 - mmengine - INFO - Iter(train) [236500/640000] base_lr: 1.4045e-04 lr: 1.4587e-05 eta: 6 days, 20:53:25 time: 1.4577 data_time: 0.0237 memory: 25717 grad_norm: 2.9149 loss: 1.3416 detection_loss_cls: 0.0360 detection_loss_reg: 0.3491 caption_loss_cls: 2.2572 grounding_loss_reg: 2.7649 semantic_segmentation_loss_cls: 0.0093 instance_segmentation_loss_cls: 0.0335 instance_segmentation_loss_reg: 0.3410 instance_segmentation_loss_poly: 0.9312 +2024/01/05 20:54:19 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240105_135304 +2024/01/05 20:54:19 - mmengine - INFO - Iter(train) [237000/640000] base_lr: 1.4023e-04 lr: 1.4566e-05 eta: 6 days, 21:01:05 time: 1.4808 data_time: 0.0241 memory: 25717 grad_norm: 2.8383 loss: 1.3356 detection_loss_cls: 0.0360 detection_loss_reg: 0.3485 caption_loss_cls: 2.2590 grounding_loss_reg: 2.7634 semantic_segmentation_loss_cls: 0.0093 instance_segmentation_loss_cls: 0.0336 instance_segmentation_loss_reg: 0.3420 instance_segmentation_loss_poly: 0.9319 +2024/01/05 21:06:45 - mmengine - INFO - Iter(train) [237500/640000] base_lr: 1.4001e-04 lr: 1.4546e-05 eta: 6 days, 20:52:15 time: 1.4846 data_time: 0.0240 memory: 25717 grad_norm: 2.8000 loss: 1.3390 detection_loss_cls: 0.0362 detection_loss_reg: 0.3501 caption_loss_cls: 2.2574 grounding_loss_reg: 2.7628 semantic_segmentation_loss_cls: 0.0093 instance_segmentation_loss_cls: 0.0335 instance_segmentation_loss_reg: 0.3421 instance_segmentation_loss_poly: 0.9327 +2024/01/05 21:18:37 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240105_135304 +2024/01/05 21:18:37 - mmengine - INFO - Iter(train) [238000/640000] base_lr: 1.3978e-04 lr: 1.4526e-05 eta: 6 days, 20:30:37 time: 1.4746 data_time: 0.0239 memory: 25717 grad_norm: 2.7909 loss: 1.3374 detection_loss_cls: 0.0361 detection_loss_reg: 0.3500 caption_loss_cls: 2.2514 grounding_loss_reg: 2.7634 semantic_segmentation_loss_cls: 0.0093 instance_segmentation_loss_cls: 0.0337 instance_segmentation_loss_reg: 0.3433 instance_segmentation_loss_poly: 0.9348 +2024/01/05 21:18:37 - mmengine - INFO - Saving checkpoint at 238000 iterations +2024/01/05 21:30:40 - mmengine - INFO - Iter(train) [238500/640000] base_lr: 1.3956e-04 lr: 1.4505e-05 eta: 6 days, 20:13:16 time: 1.4728 data_time: 0.0238 memory: 25717 grad_norm: 2.7938 loss: 1.3356 detection_loss_cls: 0.0361 detection_loss_reg: 0.3492 caption_loss_cls: 2.2507 grounding_loss_reg: 2.7627 semantic_segmentation_loss_cls: 0.0093 instance_segmentation_loss_cls: 0.0336 instance_segmentation_loss_reg: 0.3431 instance_segmentation_loss_poly: 0.9339 +2024/01/05 21:43:32 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240105_135304 +2024/01/05 21:43:32 - mmengine - INFO - Iter(train) [239000/640000] base_lr: 1.3933e-04 lr: 1.4485e-05 eta: 6 days, 20:13:32 time: 1.4866 data_time: 0.0240 memory: 25717 grad_norm: 2.7522 loss: 1.3311 detection_loss_cls: 0.0360 detection_loss_reg: 0.3489 caption_loss_cls: 2.2508 grounding_loss_reg: 2.7617 semantic_segmentation_loss_cls: 0.0093 instance_segmentation_loss_cls: 0.0335 instance_segmentation_loss_reg: 0.3415 instance_segmentation_loss_poly: 0.9302 +2024/01/05 21:56:47 - mmengine - INFO - Iter(train) [239500/640000] base_lr: 1.3911e-04 lr: 1.4465e-05 eta: 6 days, 20:20:54 time: 1.5018 data_time: 0.0242 memory: 25717 grad_norm: 2.6889 loss: 1.3200 detection_loss_cls: 0.0359 detection_loss_reg: 0.3479 caption_loss_cls: 2.2519 grounding_loss_reg: 2.7632 semantic_segmentation_loss_cls: 0.0093 instance_segmentation_loss_cls: 0.0336 instance_segmentation_loss_reg: 0.3409 instance_segmentation_loss_poly: 0.9293 +2024/01/05 22:09:01 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240105_135304 +2024/01/05 22:09:01 - mmengine - INFO - Iter(train) [240000/640000] base_lr: 1.3889e-04 lr: 1.4444e-05 eta: 6 days, 20:07:06 time: 1.5008 data_time: 0.0243 memory: 25717 grad_norm: 2.6879 loss: 1.3312 detection_loss_cls: 0.0360 detection_loss_reg: 0.3485 caption_loss_cls: 2.2500 grounding_loss_reg: 2.7639 semantic_segmentation_loss_cls: 0.0092 instance_segmentation_loss_cls: 0.0336 instance_segmentation_loss_reg: 0.3416 instance_segmentation_loss_poly: 0.9305 +2024/01/05 22:09:02 - mmengine - INFO - Saving checkpoint at 240000 iterations +2024/01/05 22:21:17 - mmengine - INFO - Evaluating bbox... +2024/01/05 22:22:16 - mmengine - INFO - bbox_mAP_copypaste: 0.470 0.652 0.517 0.314 0.520 0.597 +2024/01/05 22:22:16 - mmengine - INFO - Evaluating segm... +2024/01/05 22:23:32 - mmengine - INFO - segm_mAP_copypaste: 0.312 0.566 0.308 0.171 0.365 0.473 +2024/01/05 22:29:42 - mmengine - INFO - per class results: +2024/01/05 22:29:42 - mmengine - INFO - ++---------------------+-------+-------+ +| Class | IoU | Acc | ++---------------------+-------+-------+ +| wall | 77.56 | 88.58 | +| building | 80.64 | 87.32 | +| sky | 93.19 | 97.96 | +| floor | 81.2 | 91.77 | +| tree | 72.73 | 87.55 | +| ceiling | 83.63 | 93.21 | +| road | 81.7 | 90.55 | +| bed | 88.15 | 93.65 | +| windowpane | 60.93 | 81.88 | +| grass | 65.13 | 85.13 | +| cabinet | 60.3 | 75.63 | +| sidewalk | 65.44 | 78.86 | +| person | 80.37 | 89.97 | +| earth | 39.25 | 48.67 | +| door | 51.45 | 69.09 | +| table | 61.81 | 74.94 | +| mountain | 58.58 | 68.67 | +| plant | 52.01 | 69.85 | +| curtain | 73.82 | 83.56 | +| chair | 58.15 | 71.13 | +| car | 83.85 | 90.28 | +| water | 52.58 | 66.74 | +| painting | 69.8 | 83.71 | +| sofa | 64.43 | 73.51 | +| shelf | 44.74 | 63.94 | +| house | 39.65 | 89.14 | +| sea | 57.33 | 72.52 | +| mirror | 62.61 | 79.26 | +| rug | 64.05 | 68.47 | +| field | 25.63 | 41.52 | +| armchair | 43.54 | 70.77 | +| seat | 54.8 | 83.73 | +| fence | 47.96 | 58.53 | +| desk | 48.45 | 67.38 | +| rock | 46.21 | 77.54 | +| wardrobe | 46.68 | 58.67 | +| lamp | 59.76 | 70.14 | +| bathtub | 77.97 | 84.78 | +| railing | 35.59 | 50.43 | +| cushion | 52.11 | 79.11 | +| base | 26.34 | 33.65 | +| box | 28.78 | 36.1 | +| column | 51.2 | 65.59 | +| signboard | 37.39 | 51.94 | +| chest of drawers | 37.18 | 67.06 | +| counter | 15.5 | 23.2 | +| sand | 40.75 | 51.78 | +| sink | 69.56 | 76.6 | +| skyscraper | 41.44 | 45.34 | +| fireplace | 73.69 | 80.8 | +| refrigerator | 75.26 | 77.9 | +| grandstand | 50.67 | 70.37 | +| path | 22.02 | 38.59 | +| stairs | 36.82 | 48.95 | +| runway | 63.74 | 72.49 | +| case | 50.5 | 61.55 | +| pool table | 88.81 | 95.12 | +| pillow | 44.99 | 51.76 | +| screen door | 74.88 | 82.15 | +| stairway | 33.05 | 40.12 | +| river | 14.07 | 32.59 | +| bridge | 67.18 | 82.37 | +| bookcase | 36.98 | 56.39 | +| blind | 34.15 | 36.25 | +| coffee table | 61.2 | 72.73 | +| toilet | 84.14 | 87.16 | +| flower | 32.98 | 41.73 | +| book | 44.73 | 59.59 | +| hill | 10.18 | 15.73 | +| bench | 53.32 | 58.23 | +| countertop | 58.19 | 67.89 | +| stove | 72.08 | 81.52 | +| palm | 36.15 | 44.05 | +| kitchen island | 41.33 | 69.45 | +| computer | 65.87 | 76.13 | +| swivel chair | 43.94 | 62.59 | +| boat | 75.29 | 82.46 | +| bar | 35.61 | 49.61 | +| arcade machine | 43.88 | 48.7 | +| hovel | 10.54 | 11.84 | +| bus | 91.92 | 94.95 | +| towel | 59.48 | 70.79 | +| light | 52.7 | 62.87 | +| truck | 41.5 | 54.09 | +| tower | 8.85 | 11.84 | +| chandelier | 60.75 | 72.04 | +| awning | 31.72 | 38.39 | +| streetlight | 27.13 | 32.65 | +| booth | 32.67 | 37.36 | +| television receiver | 72.26 | 81.28 | +| airplane | 58.37 | 66.43 | +| dirt track | 2.51 | 4.8 | +| apparel | 27.02 | 41.25 | +| pole | 26.94 | 37.48 | +| land | 2.41 | 2.73 | +| bannister | 15.75 | 18.92 | +| escalator | 10.24 | 10.53 | +| ottoman | 46.86 | 64.82 | +| bottle | 23.11 | 29.08 | +| buffet | 50.77 | 65.83 | +| poster | 30.48 | 38.94 | +| stage | 12.0 | 15.56 | +| van | 36.52 | 44.9 | +| ship | 76.06 | 85.04 | +| fountain | 5.33 | 5.41 | +| conveyer belt | 69.82 | 92.51 | +| canopy | 13.39 | 14.03 | +| washer | 66.42 | 74.5 | +| plaything | 25.22 | 31.29 | +| swimming pool | 43.42 | 58.36 | +| stool | 43.96 | 57.63 | +| barrel | 27.35 | 64.55 | +| basket | 33.63 | 50.62 | +| waterfall | 45.4 | 61.52 | +| tent | 80.28 | 87.29 | +| bag | 23.07 | 28.49 | +| minibike | 70.49 | 82.18 | +| cradle | 75.28 | 96.88 | +| oven | 36.14 | 54.54 | +| ball | 43.98 | 58.82 | +| food | 48.29 | 52.14 | +| step | 15.19 | 17.35 | +| tank | 31.57 | 41.4 | +| trade name | 32.58 | 45.6 | +| microwave | 67.71 | 74.18 | +| pot | 48.28 | 60.69 | +| animal | 62.58 | 65.26 | +| bicycle | 54.42 | 63.01 | +| lake | 40.39 | 63.86 | +| dishwasher | 57.37 | 65.67 | +| screen | 66.17 | 85.34 | +| blanket | 8.69 | 10.8 | +| sculpture | 50.16 | 67.22 | +| hood | 52.91 | 54.88 | +| sconce | 36.05 | 44.59 | +| vase | 39.68 | 53.03 | +| traffic light | 38.1 | 54.22 | +| tray | 6.87 | 9.54 | +| ashcan | 40.33 | 53.67 | +| fan | 53.16 | 61.69 | +| pier | 49.05 | 62.61 | +| crt screen | 9.29 | 11.98 | +| plate | 55.07 | 69.59 | +| monitor | 17.61 | 22.41 | +| bulletin board | 17.29 | 18.64 | +| shower | 2.15 | 2.3 | +| radiator | 58.28 | 61.54 | +| glass | 16.94 | 18.88 | +| clock | 23.1 | 26.96 | +| flag | 34.18 | 38.15 | ++---------------------+-------+-------+ +2024/01/05 22:30:00 - mmengine - INFO - Iter(val) [209/209] coco/bbox_mAP: 0.4700 coco/bbox_mAP_50: 0.6520 coco/bbox_mAP_75: 0.5170 coco/bbox_mAP_s: 0.3140 coco/bbox_mAP_m: 0.5200 coco/bbox_mAP_l: 0.5970 coco/segm_mAP: 0.3120 coco/segm_mAP_50: 0.5660 coco/segm_mAP_75: 0.3080 coco/segm_mAP_s: 0.1710 coco/segm_mAP_m: 0.3650 coco/segm_mAP_l: 0.4730 Bleu_1: 0.7319 Bleu_2: 0.5598 Bleu_3: 0.4140 Bleu_4: 0.3015 METEOR: 0.2534 ROUGE_L: 0.5346 CIDEr: 0.9751 SPICE: 0.1898 aAcc: 82.4600 mIoU: 47.2200 mAcc: 58.3000 visual-grounding/miou: 0.7786 visual-grounding/acc: 0.8516 data_time: 0.0101 time: 1.3536 +2024/01/05 22:42:36 - mmengine - INFO - Iter(train) [240500/640000] base_lr: 1.3866e-04 lr: 1.4424e-05 eta: 6 days, 20:01:20 time: 1.5065 data_time: 0.0213 memory: 25717 grad_norm: 2.6667 loss: 1.3409 detection_loss_cls: 0.0361 detection_loss_reg: 0.3503 caption_loss_cls: 2.2497 grounding_loss_reg: 2.7629 semantic_segmentation_loss_cls: 0.0093 instance_segmentation_loss_cls: 0.0337 instance_segmentation_loss_reg: 0.3426 instance_segmentation_loss_poly: 0.9329 +2024/01/05 22:54:33 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240105_135304 +2024/01/05 22:54:33 - mmengine - INFO - Iter(train) [241000/640000] base_lr: 1.3844e-04 lr: 1.4403e-05 eta: 6 days, 19:41:57 time: 1.4892 data_time: 0.0212 memory: 25717 grad_norm: 2.6961 loss: 1.3505 detection_loss_cls: 0.0362 detection_loss_reg: 0.3510 caption_loss_cls: 2.2529 grounding_loss_reg: 2.7610 semantic_segmentation_loss_cls: 0.0092 instance_segmentation_loss_cls: 0.0337 instance_segmentation_loss_reg: 0.3429 instance_segmentation_loss_poly: 0.9338 +2024/01/05 23:07:01 - mmengine - INFO - Iter(train) [241500/640000] base_lr: 1.3821e-04 lr: 1.4383e-05 eta: 6 days, 19:32:32 time: 1.4897 data_time: 0.0214 memory: 25717 grad_norm: 2.6936 loss: 1.3497 detection_loss_cls: 0.0360 detection_loss_reg: 0.3489 caption_loss_cls: 2.2556 grounding_loss_reg: 2.7563 semantic_segmentation_loss_cls: 0.0092 instance_segmentation_loss_cls: 0.0335 instance_segmentation_loss_reg: 0.3417 instance_segmentation_loss_poly: 0.9316 +2024/01/05 23:19:51 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240105_135304 +2024/01/05 23:19:51 - mmengine - INFO - Iter(train) [242000/640000] base_lr: 1.3799e-04 lr: 1.4362e-05 eta: 6 days, 19:29:27 time: 1.5039 data_time: 0.0217 memory: 25717 grad_norm: 2.6673 loss: 1.3298 detection_loss_cls: 0.0360 detection_loss_reg: 0.3487 caption_loss_cls: 2.2500 grounding_loss_reg: 2.7558 semantic_segmentation_loss_cls: 0.0092 instance_segmentation_loss_cls: 0.0333 instance_segmentation_loss_reg: 0.3397 instance_segmentation_loss_poly: 0.9283 +2024/01/05 23:19:51 - mmengine - INFO - Saving checkpoint at 242000 iterations +2024/01/05 23:32:25 - mmengine - INFO - Iter(train) [242500/640000] base_lr: 1.3776e-04 lr: 1.4342e-05 eta: 6 days, 19:21:22 time: 1.5117 data_time: 0.0229 memory: 25717 grad_norm: 2.6727 loss: 1.3208 detection_loss_cls: 0.0360 detection_loss_reg: 0.3480 caption_loss_cls: 2.2488 grounding_loss_reg: 2.7518 semantic_segmentation_loss_cls: 0.0092 instance_segmentation_loss_cls: 0.0333 instance_segmentation_loss_reg: 0.3399 instance_segmentation_loss_poly: 0.9279 +2024/01/05 23:44:11 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240105_135304 +2024/01/05 23:44:11 - mmengine - INFO - Iter(train) [243000/640000] base_lr: 1.3754e-04 lr: 1.4321e-05 eta: 6 days, 18:59:20 time: 1.4953 data_time: 0.0229 memory: 25717 grad_norm: 2.7087 loss: 1.3242 detection_loss_cls: 0.0361 detection_loss_reg: 0.3477 caption_loss_cls: 2.2510 grounding_loss_reg: 2.7515 semantic_segmentation_loss_cls: 0.0092 instance_segmentation_loss_cls: 0.0333 instance_segmentation_loss_reg: 0.3397 instance_segmentation_loss_poly: 0.9273 +2024/01/05 23:56:00 - mmengine - INFO - Iter(train) [243500/640000] base_lr: 1.3731e-04 lr: 1.4301e-05 eta: 6 days, 18:38:36 time: 1.4739 data_time: 0.0228 memory: 25717 grad_norm: 2.8250 loss: 1.3289 detection_loss_cls: 0.0360 detection_loss_reg: 0.3464 caption_loss_cls: 2.2515 grounding_loss_reg: 2.7487 semantic_segmentation_loss_cls: 0.0092 instance_segmentation_loss_cls: 0.0333 instance_segmentation_loss_reg: 0.3392 instance_segmentation_loss_poly: 0.9252 +2024/01/06 00:07:28 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240105_135304 +2024/01/06 00:07:28 - mmengine - INFO - Iter(train) [244000/640000] base_lr: 1.3708e-04 lr: 1.4280e-05 eta: 6 days, 18:12:13 time: 1.4622 data_time: 0.0227 memory: 25717 grad_norm: 2.8801 loss: 1.3252 detection_loss_cls: 0.0362 detection_loss_reg: 0.3476 caption_loss_cls: 2.2500 grounding_loss_reg: 2.7455 semantic_segmentation_loss_cls: 0.0092 instance_segmentation_loss_cls: 0.0333 instance_segmentation_loss_reg: 0.3394 instance_segmentation_loss_poly: 0.9253 +2024/01/06 00:07:28 - mmengine - INFO - Saving checkpoint at 244000 iterations +2024/01/06 00:19:49 - mmengine - INFO - Iter(train) [244500/640000] base_lr: 1.3686e-04 lr: 1.4260e-05 eta: 6 days, 18:00:58 time: 1.4578 data_time: 0.0268 memory: 25717 grad_norm: 2.9768 loss: 1.3326 detection_loss_cls: 0.0362 detection_loss_reg: 0.3470 caption_loss_cls: 2.2489 grounding_loss_reg: 2.7416 semantic_segmentation_loss_cls: 0.0092 instance_segmentation_loss_cls: 0.0334 instance_segmentation_loss_reg: 0.3402 instance_segmentation_loss_poly: 0.9269 +2024/01/06 00:32:30 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240105_135304 +2024/01/06 00:32:30 - mmengine - INFO - Iter(train) [245000/640000] base_lr: 1.3663e-04 lr: 1.4239e-05 eta: 6 days, 17:54:45 time: 1.4687 data_time: 0.0269 memory: 25717 grad_norm: 3.0207 loss: 1.3248 detection_loss_cls: 0.0361 detection_loss_reg: 0.3467 caption_loss_cls: 2.2551 grounding_loss_reg: 2.7434 semantic_segmentation_loss_cls: 0.0092 instance_segmentation_loss_cls: 0.0332 instance_segmentation_loss_reg: 0.3392 instance_segmentation_loss_poly: 0.9247 +2024/01/06 00:45:09 - mmengine - INFO - Iter(train) [245500/640000] base_lr: 1.3640e-04 lr: 1.4218e-05 eta: 6 days, 17:47:57 time: 1.4715 data_time: 0.0270 memory: 25717 grad_norm: 3.1440 loss: 1.3148 detection_loss_cls: 0.0361 detection_loss_reg: 0.3464 caption_loss_cls: 2.2511 grounding_loss_reg: 2.7408 semantic_segmentation_loss_cls: 0.0091 instance_segmentation_loss_cls: 0.0332 instance_segmentation_loss_reg: 0.3394 instance_segmentation_loss_poly: 0.9260 +2024/01/06 00:57:45 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240105_135304 +2024/01/06 00:57:45 - mmengine - INFO - Iter(train) [246000/640000] base_lr: 1.3618e-04 lr: 1.4198e-05 eta: 6 days, 17:39:56 time: 1.4680 data_time: 0.0270 memory: 25717 grad_norm: 3.2075 loss: 1.3317 detection_loss_cls: 0.0358 detection_loss_reg: 0.3447 caption_loss_cls: 2.2547 grounding_loss_reg: 2.7402 semantic_segmentation_loss_cls: 0.0091 instance_segmentation_loss_cls: 0.0330 instance_segmentation_loss_reg: 0.3380 instance_segmentation_loss_poly: 0.9223 +2024/01/06 00:57:45 - mmengine - INFO - Saving checkpoint at 246000 iterations +2024/01/06 01:10:41 - mmengine - INFO - Iter(train) [246500/640000] base_lr: 1.3595e-04 lr: 1.4177e-05 eta: 6 days, 17:36:58 time: 1.4736 data_time: 0.0268 memory: 25717 grad_norm: 3.2077 loss: 1.3288 detection_loss_cls: 0.0357 detection_loss_reg: 0.3438 caption_loss_cls: 2.2586 grounding_loss_reg: 2.7398 semantic_segmentation_loss_cls: 0.0091 instance_segmentation_loss_cls: 0.0329 instance_segmentation_loss_reg: 0.3368 instance_segmentation_loss_poly: 0.9188 +2024/01/06 01:23:28 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240105_135304 +2024/01/06 01:23:28 - mmengine - INFO - Iter(train) [247000/640000] base_lr: 1.3572e-04 lr: 1.4157e-05 eta: 6 days, 17:31:12 time: 1.4887 data_time: 0.0270 memory: 25717 grad_norm: 3.1976 loss: 1.3255 detection_loss_cls: 0.0357 detection_loss_reg: 0.3446 caption_loss_cls: 2.2587 grounding_loss_reg: 2.7406 semantic_segmentation_loss_cls: 0.0091 instance_segmentation_loss_cls: 0.0328 instance_segmentation_loss_reg: 0.3372 instance_segmentation_loss_poly: 0.9183 +2024/01/06 01:36:52 - mmengine - INFO - Iter(train) [247500/640000] base_lr: 1.3549e-04 lr: 1.4136e-05 eta: 6 days, 17:34:08 time: 1.5124 data_time: 0.0275 memory: 25717 grad_norm: 3.1936 loss: 1.3195 detection_loss_cls: 0.0357 detection_loss_reg: 0.3449 caption_loss_cls: 2.2597 grounding_loss_reg: 2.7379 semantic_segmentation_loss_cls: 0.0091 instance_segmentation_loss_cls: 0.0328 instance_segmentation_loss_reg: 0.3374 instance_segmentation_loss_poly: 0.9180 +2024/01/06 01:48:47 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240105_135304 +2024/01/06 01:48:47 - mmengine - INFO - Iter(train) [248000/640000] base_lr: 1.3527e-04 lr: 1.4115e-05 eta: 6 days, 17:15:37 time: 1.5193 data_time: 0.0276 memory: 25717 grad_norm: 3.2168 loss: 1.3175 detection_loss_cls: 0.0358 detection_loss_reg: 0.3454 caption_loss_cls: 2.2634 grounding_loss_reg: 2.7376 semantic_segmentation_loss_cls: 0.0091 instance_segmentation_loss_cls: 0.0328 instance_segmentation_loss_reg: 0.3368 instance_segmentation_loss_poly: 0.9168 +2024/01/06 01:48:47 - mmengine - INFO - Saving checkpoint at 248000 iterations +2024/01/06 02:01:12 - mmengine - INFO - Iter(train) [248500/640000] base_lr: 1.3504e-04 lr: 1.4094e-05 eta: 6 days, 17:04:15 time: 1.5202 data_time: 0.0276 memory: 25717 grad_norm: 3.2799 loss: 1.3181 detection_loss_cls: 0.0359 detection_loss_reg: 0.3465 caption_loss_cls: 2.2654 grounding_loss_reg: 2.7375 semantic_segmentation_loss_cls: 0.0091 instance_segmentation_loss_cls: 0.0331 instance_segmentation_loss_reg: 0.3389 instance_segmentation_loss_poly: 0.9215 +2024/01/06 02:13:41 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240105_135304 +2024/01/06 02:13:41 - mmengine - INFO - Iter(train) [249000/640000] base_lr: 1.3481e-04 lr: 1.4074e-05 eta: 6 days, 16:53:53 time: 1.5174 data_time: 0.0275 memory: 25717 grad_norm: 3.7097 loss: 1.3177 detection_loss_cls: 0.0359 detection_loss_reg: 0.3459 caption_loss_cls: 2.2652 grounding_loss_reg: 2.7376 semantic_segmentation_loss_cls: 0.0091 instance_segmentation_loss_cls: 0.0332 instance_segmentation_loss_reg: 0.3384 instance_segmentation_loss_poly: 0.9186 +2024/01/06 02:25:47 - mmengine - INFO - Iter(train) [249500/640000] base_lr: 1.3458e-04 lr: 1.4053e-05 eta: 6 days, 16:38:05 time: 1.5089 data_time: 0.0274 memory: 25717 grad_norm: 3.6694 loss: 1.3331 detection_loss_cls: 0.0360 detection_loss_reg: 0.3459 caption_loss_cls: 2.2711 grounding_loss_reg: 2.7351 semantic_segmentation_loss_cls: 0.0092 instance_segmentation_loss_cls: 0.0331 instance_segmentation_loss_reg: 0.3382 instance_segmentation_loss_poly: 0.9194 +2024/01/06 02:37:43 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240105_135304 +2024/01/06 02:37:43 - mmengine - INFO - Iter(train) [250000/640000] base_lr: 1.3435e-04 lr: 1.4032e-05 eta: 6 days, 16:20:28 time: 1.4991 data_time: 0.0272 memory: 25717 grad_norm: 3.7041 loss: 1.3366 detection_loss_cls: 0.0361 detection_loss_reg: 0.3468 caption_loss_cls: 2.2718 grounding_loss_reg: 2.7355 semantic_segmentation_loss_cls: 0.0091 instance_segmentation_loss_cls: 0.0333 instance_segmentation_loss_reg: 0.3386 instance_segmentation_loss_poly: 0.9206 +2024/01/06 02:37:43 - mmengine - INFO - Saving checkpoint at 250000 iterations +2024/01/06 02:50:38 - mmengine - INFO - Iter(train) [250500/640000] base_lr: 1.3412e-04 lr: 1.4011e-05 eta: 6 days, 16:15:27 time: 1.4986 data_time: 0.0273 memory: 25717 grad_norm: 3.7081 loss: 1.3470 detection_loss_cls: 0.0361 detection_loss_reg: 0.3476 caption_loss_cls: 2.2731 grounding_loss_reg: 2.7372 semantic_segmentation_loss_cls: 0.0091 instance_segmentation_loss_cls: 0.0335 instance_segmentation_loss_reg: 0.3398 instance_segmentation_loss_poly: 0.9222 +2024/01/06 03:02:11 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240105_135304 +2024/01/06 03:02:11 - mmengine - INFO - Iter(train) [251000/640000] base_lr: 1.3389e-04 lr: 1.3990e-05 eta: 6 days, 15:53:09 time: 1.4803 data_time: 0.0270 memory: 25717 grad_norm: 3.7229 loss: 1.3637 detection_loss_cls: 0.0360 detection_loss_reg: 0.3462 caption_loss_cls: 2.2784 grounding_loss_reg: 2.7406 semantic_segmentation_loss_cls: 0.0091 instance_segmentation_loss_cls: 0.0333 instance_segmentation_loss_reg: 0.3383 instance_segmentation_loss_poly: 0.9191 +2024/01/06 03:14:13 - mmengine - INFO - Iter(train) [251500/640000] base_lr: 1.3367e-04 lr: 1.3970e-05 eta: 6 days, 15:37:10 time: 1.4598 data_time: 0.0266 memory: 25717 grad_norm: 3.6819 loss: 1.3736 detection_loss_cls: 0.0359 detection_loss_reg: 0.3455 caption_loss_cls: 2.2806 grounding_loss_reg: 2.7426 semantic_segmentation_loss_cls: 0.0092 instance_segmentation_loss_cls: 0.0332 instance_segmentation_loss_reg: 0.3378 instance_segmentation_loss_poly: 0.9172 +2024/01/06 03:25:48 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240105_135304 +2024/01/06 03:25:48 - mmengine - INFO - Iter(train) [252000/640000] base_lr: 1.3344e-04 lr: 1.3949e-05 eta: 6 days, 15:15:49 time: 1.4549 data_time: 0.0266 memory: 25717 grad_norm: 3.6678 loss: 1.3759 detection_loss_cls: 0.0360 detection_loss_reg: 0.3458 caption_loss_cls: 2.2791 grounding_loss_reg: 2.7389 semantic_segmentation_loss_cls: 0.0091 instance_segmentation_loss_cls: 0.0333 instance_segmentation_loss_reg: 0.3382 instance_segmentation_loss_poly: 0.9178 +2024/01/06 03:25:48 - mmengine - INFO - Saving checkpoint at 252000 iterations +2024/01/06 03:37:41 - mmengine - INFO - Iter(train) [252500/640000] base_lr: 1.3321e-04 lr: 1.3928e-05 eta: 6 days, 14:58:13 time: 1.4468 data_time: 0.0264 memory: 25717 grad_norm: 3.6707 loss: 1.3702 detection_loss_cls: 0.0360 detection_loss_reg: 0.3448 caption_loss_cls: 2.2807 grounding_loss_reg: 2.7385 semantic_segmentation_loss_cls: 0.0091 instance_segmentation_loss_cls: 0.0333 instance_segmentation_loss_reg: 0.3374 instance_segmentation_loss_poly: 0.9162 +2024/01/06 03:49:34 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240105_135304 +2024/01/06 03:49:34 - mmengine - INFO - Iter(train) [253000/640000] base_lr: 1.3298e-04 lr: 1.3907e-05 eta: 6 days, 14:41:00 time: 1.4378 data_time: 0.0263 memory: 25717 grad_norm: 3.3203 loss: 1.3770 detection_loss_cls: 0.0359 detection_loss_reg: 0.3439 caption_loss_cls: 2.2847 grounding_loss_reg: 2.7368 semantic_segmentation_loss_cls: 0.0091 instance_segmentation_loss_cls: 0.0333 instance_segmentation_loss_reg: 0.3368 instance_segmentation_loss_poly: 0.9147 +2024/01/06 04:01:35 - mmengine - INFO - Iter(train) [253500/640000] base_lr: 1.3275e-04 lr: 1.3886e-05 eta: 6 days, 14:25:17 time: 1.4366 data_time: 0.0263 memory: 25717 grad_norm: 3.3580 loss: 1.3721 detection_loss_cls: 0.0359 detection_loss_reg: 0.3442 caption_loss_cls: 2.2835 grounding_loss_reg: 2.7402 semantic_segmentation_loss_cls: 0.0091 instance_segmentation_loss_cls: 0.0333 instance_segmentation_loss_reg: 0.3369 instance_segmentation_loss_poly: 0.9152 +2024/01/06 04:13:53 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240105_135304 +2024/01/06 04:13:53 - mmengine - INFO - Iter(train) [254000/640000] base_lr: 1.3252e-04 lr: 1.3865e-05 eta: 6 days, 14:13:01 time: 1.4421 data_time: 0.0264 memory: 25717 grad_norm: 3.3766 loss: 1.3644 detection_loss_cls: 0.0359 detection_loss_reg: 0.3438 caption_loss_cls: 2.2820 grounding_loss_reg: 2.7427 semantic_segmentation_loss_cls: 0.0091 instance_segmentation_loss_cls: 0.0334 instance_segmentation_loss_reg: 0.3378 instance_segmentation_loss_poly: 0.9169 +2024/01/06 04:13:53 - mmengine - INFO - Saving checkpoint at 254000 iterations +2024/01/06 04:26:24 - mmengine - INFO - Iter(train) [254500/640000] base_lr: 1.3229e-04 lr: 1.3844e-05 eta: 6 days, 14:03:04 time: 1.4360 data_time: 0.0262 memory: 25717 grad_norm: 3.4335 loss: 1.3534 detection_loss_cls: 0.0360 detection_loss_reg: 0.3445 caption_loss_cls: 2.2731 grounding_loss_reg: 2.7403 semantic_segmentation_loss_cls: 0.0092 instance_segmentation_loss_cls: 0.0334 instance_segmentation_loss_reg: 0.3370 instance_segmentation_loss_poly: 0.9166 +2024/01/06 04:38:49 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240105_135304 +2024/01/06 04:38:49 - mmengine - INFO - Iter(train) [255000/640000] base_lr: 1.3205e-04 lr: 1.3823e-05 eta: 6 days, 13:52:00 time: 1.4490 data_time: 0.0264 memory: 25717 grad_norm: 3.4629 loss: 1.3411 detection_loss_cls: 0.0362 detection_loss_reg: 0.3449 caption_loss_cls: 2.2743 grounding_loss_reg: 2.7360 semantic_segmentation_loss_cls: 0.0091 instance_segmentation_loss_cls: 0.0334 instance_segmentation_loss_reg: 0.3376 instance_segmentation_loss_poly: 0.9186 +2024/01/06 04:52:13 - mmengine - INFO - Iter(train) [255500/640000] base_lr: 1.3182e-04 lr: 1.3802e-05 eta: 6 days, 13:51:33 time: 1.4694 data_time: 0.0269 memory: 25717 grad_norm: 3.4826 loss: 1.3341 detection_loss_cls: 0.0361 detection_loss_reg: 0.3454 caption_loss_cls: 2.2744 grounding_loss_reg: 2.7362 semantic_segmentation_loss_cls: 0.0091 instance_segmentation_loss_cls: 0.0335 instance_segmentation_loss_reg: 0.3393 instance_segmentation_loss_poly: 0.9219 +2024/01/06 05:05:00 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240105_135304 +2024/01/06 05:05:00 - mmengine - INFO - Iter(train) [256000/640000] base_lr: 1.3159e-04 lr: 1.3781e-05 eta: 6 days, 13:44:08 time: 1.4873 data_time: 0.0269 memory: 25717 grad_norm: 3.4243 loss: 1.3200 detection_loss_cls: 0.0361 detection_loss_reg: 0.3456 caption_loss_cls: 2.2750 grounding_loss_reg: 2.7362 semantic_segmentation_loss_cls: 0.0091 instance_segmentation_loss_cls: 0.0335 instance_segmentation_loss_reg: 0.3395 instance_segmentation_loss_poly: 0.9213 +2024/01/06 05:05:00 - mmengine - INFO - Saving checkpoint at 256000 iterations +2024/01/06 05:16:55 - mmengine - INFO - Iter(train) [256500/640000] base_lr: 1.3136e-04 lr: 1.3760e-05 eta: 6 days, 13:27:36 time: 1.4881 data_time: 0.0269 memory: 25717 grad_norm: 3.3550 loss: 1.3202 detection_loss_cls: 0.0361 detection_loss_reg: 0.3459 caption_loss_cls: 2.2756 grounding_loss_reg: 2.7360 semantic_segmentation_loss_cls: 0.0091 instance_segmentation_loss_cls: 0.0335 instance_segmentation_loss_reg: 0.3388 instance_segmentation_loss_poly: 0.9190 +2024/01/06 05:28:50 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240105_135304 +2024/01/06 05:28:50 - mmengine - INFO - Iter(train) [257000/640000] base_lr: 1.3113e-04 lr: 1.3739e-05 eta: 6 days, 13:11:06 time: 1.4884 data_time: 0.0269 memory: 25717 grad_norm: 3.3160 loss: 1.3238 detection_loss_cls: 0.0361 detection_loss_reg: 0.3466 caption_loss_cls: 2.2786 grounding_loss_reg: 2.7348 semantic_segmentation_loss_cls: 0.0091 instance_segmentation_loss_cls: 0.0335 instance_segmentation_loss_reg: 0.3387 instance_segmentation_loss_poly: 0.9195 +2024/01/06 05:41:22 - mmengine - INFO - Iter(train) [257500/640000] base_lr: 1.3090e-04 lr: 1.3718e-05 eta: 6 days, 13:01:02 time: 1.4964 data_time: 0.0271 memory: 25717 grad_norm: 3.2629 loss: 1.3211 detection_loss_cls: 0.0361 detection_loss_reg: 0.3464 caption_loss_cls: 2.2817 grounding_loss_reg: 2.7352 semantic_segmentation_loss_cls: 0.0091 instance_segmentation_loss_cls: 0.0334 instance_segmentation_loss_reg: 0.3379 instance_segmentation_loss_poly: 0.9162 +2024/01/06 05:53:26 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240105_135304 +2024/01/06 05:53:26 - mmengine - INFO - Iter(train) [258000/640000] base_lr: 1.3067e-04 lr: 1.3697e-05 eta: 6 days, 12:46:10 time: 1.4928 data_time: 0.0271 memory: 25717 grad_norm: 3.3159 loss: 1.3337 detection_loss_cls: 0.0362 detection_loss_reg: 0.3475 caption_loss_cls: 2.2823 grounding_loss_reg: 2.7358 semantic_segmentation_loss_cls: 0.0091 instance_segmentation_loss_cls: 0.0334 instance_segmentation_loss_reg: 0.3387 instance_segmentation_loss_poly: 0.9178 +2024/01/06 05:53:26 - mmengine - INFO - Saving checkpoint at 258000 iterations +2024/01/06 06:06:35 - mmengine - INFO - Iter(train) [258500/640000] base_lr: 1.3044e-04 lr: 1.3676e-05 eta: 6 days, 12:42:00 time: 1.5022 data_time: 0.0273 memory: 25717 grad_norm: 3.3021 loss: 1.3321 detection_loss_cls: 0.0362 detection_loss_reg: 0.3475 caption_loss_cls: 2.2842 grounding_loss_reg: 2.7358 semantic_segmentation_loss_cls: 0.0090 instance_segmentation_loss_cls: 0.0335 instance_segmentation_loss_reg: 0.3393 instance_segmentation_loss_poly: 0.9195 +2024/01/06 06:18:47 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240105_135304 +2024/01/06 06:18:47 - mmengine - INFO - Iter(train) [259000/640000] base_lr: 1.3020e-04 lr: 1.3655e-05 eta: 6 days, 12:28:33 time: 1.4991 data_time: 0.0273 memory: 25717 grad_norm: 3.4526 loss: 1.3365 detection_loss_cls: 0.0361 detection_loss_reg: 0.3467 caption_loss_cls: 2.2842 grounding_loss_reg: 2.7339 semantic_segmentation_loss_cls: 0.0090 instance_segmentation_loss_cls: 0.0336 instance_segmentation_loss_reg: 0.3399 instance_segmentation_loss_poly: 0.9199 +2024/01/06 06:31:06 - mmengine - INFO - Iter(train) [259500/640000] base_lr: 1.2997e-04 lr: 1.3634e-05 eta: 6 days, 12:16:03 time: 1.4827 data_time: 0.0269 memory: 25717 grad_norm: 3.6094 loss: 1.3275 detection_loss_cls: 0.0361 detection_loss_reg: 0.3467 caption_loss_cls: 2.2808 grounding_loss_reg: 2.7317 semantic_segmentation_loss_cls: 0.0090 instance_segmentation_loss_cls: 0.0335 instance_segmentation_loss_reg: 0.3396 instance_segmentation_loss_poly: 0.9190 +2024/01/06 06:43:45 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240105_135304 +2024/01/06 06:43:45 - mmengine - INFO - Iter(train) [260000/640000] base_lr: 1.2974e-04 lr: 1.3613e-05 eta: 6 days, 12:06:56 time: 1.4810 data_time: 0.0269 memory: 25717 grad_norm: 3.6445 loss: 1.3292 detection_loss_cls: 0.0359 detection_loss_reg: 0.3454 caption_loss_cls: 2.2822 grounding_loss_reg: 2.7321 semantic_segmentation_loss_cls: 0.0090 instance_segmentation_loss_cls: 0.0334 instance_segmentation_loss_reg: 0.3391 instance_segmentation_loss_poly: 0.9178 +2024/01/06 06:43:45 - mmengine - INFO - Saving checkpoint at 260000 iterations +2024/01/06 06:56:24 - mmengine - INFO - Evaluating bbox... +2024/01/06 06:57:21 - mmengine - INFO - bbox_mAP_copypaste: 0.475 0.655 0.521 0.317 0.524 0.617 +2024/01/06 06:57:21 - mmengine - INFO - Evaluating segm... +2024/01/06 06:58:33 - mmengine - INFO - segm_mAP_copypaste: 0.310 0.566 0.301 0.173 0.355 0.475 +2024/01/06 07:06:05 - mmengine - INFO - per class results: +2024/01/06 07:06:05 - mmengine - INFO - ++---------------------+-------+-------+ +| Class | IoU | Acc | ++---------------------+-------+-------+ +| wall | 76.99 | 88.86 | +| building | 82.49 | 91.84 | +| sky | 92.89 | 97.92 | +| floor | 82.34 | 90.48 | +| tree | 72.91 | 86.55 | +| ceiling | 84.52 | 93.63 | +| road | 83.41 | 90.65 | +| bed | 90.27 | 95.08 | +| windowpane | 60.73 | 72.5 | +| grass | 66.09 | 81.02 | +| cabinet | 61.14 | 73.81 | +| sidewalk | 66.78 | 80.68 | +| person | 79.82 | 90.02 | +| earth | 39.91 | 56.53 | +| door | 51.55 | 65.03 | +| table | 62.28 | 76.77 | +| mountain | 55.57 | 63.96 | +| plant | 52.85 | 65.18 | +| curtain | 74.66 | 84.84 | +| chair | 58.25 | 68.47 | +| car | 83.86 | 92.14 | +| water | 54.48 | 81.19 | +| painting | 70.66 | 85.02 | +| sofa | 70.65 | 85.22 | +| shelf | 46.17 | 70.94 | +| house | 52.66 | 68.68 | +| sea | 35.37 | 37.22 | +| mirror | 67.28 | 78.98 | +| rug | 69.34 | 76.06 | +| field | 30.19 | 49.63 | +| armchair | 46.42 | 63.53 | +| seat | 61.55 | 85.24 | +| fence | 32.76 | 45.79 | +| desk | 52.45 | 73.18 | +| rock | 54.55 | 71.05 | +| wardrobe | 40.21 | 52.14 | +| lamp | 61.98 | 73.58 | +| bathtub | 79.78 | 82.88 | +| railing | 33.49 | 46.22 | +| cushion | 55.99 | 68.62 | +| base | 24.4 | 30.26 | +| box | 24.02 | 29.44 | +| column | 49.52 | 64.73 | +| signboard | 35.87 | 56.79 | +| chest of drawers | 36.86 | 51.48 | +| counter | 30.9 | 38.73 | +| sand | 41.67 | 55.46 | +| sink | 71.74 | 81.88 | +| skyscraper | 70.42 | 92.16 | +| fireplace | 68.31 | 86.28 | +| refrigerator | 76.87 | 84.1 | +| grandstand | 35.62 | 79.64 | +| path | 14.33 | 20.95 | +| stairs | 30.11 | 34.6 | +| runway | 69.38 | 89.22 | +| case | 53.87 | 73.78 | +| pool table | 91.47 | 95.69 | +| pillow | 55.3 | 67.91 | +| screen door | 76.03 | 80.61 | +| stairway | 34.74 | 58.98 | +| river | 14.36 | 26.98 | +| bridge | 64.11 | 85.09 | +| bookcase | 36.66 | 49.42 | +| blind | 45.52 | 58.24 | +| coffee table | 63.55 | 81.5 | +| toilet | 85.21 | 90.05 | +| flower | 38.06 | 48.58 | +| book | 47.39 | 70.49 | +| hill | 10.66 | 13.82 | +| bench | 57.17 | 77.4 | +| countertop | 50.33 | 68.57 | +| stove | 74.39 | 80.1 | +| palm | 43.19 | 61.28 | +| kitchen island | 46.51 | 93.88 | +| computer | 70.77 | 79.8 | +| swivel chair | 50.83 | 71.91 | +| boat | 62.26 | 65.28 | +| bar | 44.33 | 58.75 | +| arcade machine | 22.42 | 24.24 | +| hovel | 34.15 | 44.52 | +| bus | 90.99 | 95.37 | +| towel | 64.63 | 82.03 | +| light | 51.33 | 64.17 | +| truck | 39.04 | 55.05 | +| tower | 19.01 | 38.34 | +| chandelier | 62.5 | 86.94 | +| awning | 34.49 | 40.98 | +| streetlight | 29.93 | 38.71 | +| booth | 38.76 | 43.37 | +| television receiver | 71.18 | 83.73 | +| airplane | 52.75 | 66.68 | +| dirt track | 4.55 | 13.87 | +| apparel | 32.53 | 50.27 | +| pole | 25.88 | 38.48 | +| land | 1.09 | 1.41 | +| bannister | 15.53 | 20.82 | +| escalator | 9.43 | 9.58 | +| ottoman | 52.17 | 69.37 | +| bottle | 22.16 | 30.14 | +| buffet | 41.89 | 54.7 | +| poster | 26.05 | 34.7 | +| stage | 13.79 | 19.98 | +| van | 44.44 | 56.54 | +| ship | 22.07 | 29.31 | +| fountain | 15.61 | 15.94 | +| conveyer belt | 65.97 | 91.9 | +| canopy | 37.17 | 44.58 | +| washer | 70.38 | 72.92 | +| plaything | 33.8 | 39.62 | +| swimming pool | 49.88 | 53.74 | +| stool | 46.61 | 60.16 | +| barrel | 26.53 | 41.45 | +| basket | 35.76 | 48.09 | +| waterfall | 44.6 | 66.6 | +| tent | 84.26 | 89.43 | +| bag | 17.52 | 18.91 | +| minibike | 70.82 | 76.98 | +| cradle | 73.61 | 96.98 | +| oven | 41.5 | 70.37 | +| ball | 48.53 | 71.62 | +| food | 48.68 | 56.04 | +| step | 12.81 | 16.15 | +| tank | 37.69 | 51.95 | +| trade name | 12.86 | 13.46 | +| microwave | 73.36 | 76.26 | +| pot | 51.61 | 61.97 | +| animal | 59.66 | 63.27 | +| bicycle | 56.05 | 69.03 | +| lake | 58.8 | 62.76 | +| dishwasher | 59.94 | 75.28 | +| screen | 60.01 | 75.84 | +| blanket | 23.69 | 30.04 | +| sculpture | 61.23 | 78.92 | +| hood | 58.68 | 67.05 | +| sconce | 39.24 | 51.01 | +| vase | 40.81 | 58.62 | +| traffic light | 38.91 | 57.09 | +| tray | 7.27 | 10.6 | +| ashcan | 37.8 | 58.82 | +| fan | 58.58 | 69.22 | +| pier | 48.32 | 64.53 | +| crt screen | 9.44 | 25.67 | +| plate | 55.09 | 68.11 | +| monitor | 2.12 | 2.69 | +| bulletin board | 34.66 | 54.07 | +| shower | 2.44 | 2.64 | +| radiator | 57.09 | 61.76 | +| glass | 15.22 | 16.93 | +| clock | 25.03 | 31.02 | +| flag | 26.84 | 30.48 | ++---------------------+-------+-------+ +2024/01/06 07:06:22 - mmengine - INFO - Iter(val) [209/209] coco/bbox_mAP: 0.4750 coco/bbox_mAP_50: 0.6550 coco/bbox_mAP_75: 0.5210 coco/bbox_mAP_s: 0.3170 coco/bbox_mAP_m: 0.5240 coco/bbox_mAP_l: 0.6170 coco/segm_mAP: 0.3100 coco/segm_mAP_50: 0.5660 coco/segm_mAP_75: 0.3010 coco/segm_mAP_s: 0.1730 coco/segm_mAP_m: 0.3550 coco/segm_mAP_l: 0.4750 Bleu_1: 0.7418 Bleu_2: 0.5737 Bleu_3: 0.4280 Bleu_4: 0.3152 METEOR: 0.2593 ROUGE_L: 0.5430 CIDEr: 1.0162 SPICE: 0.1899 aAcc: 83.0500 mIoU: 48.3400 mAcc: 60.4600 visual-grounding/miou: 0.7849 visual-grounding/acc: 0.8552 data_time: 0.0042 time: 1.3488 +2024/01/06 07:19:00 - mmengine - INFO - Iter(train) [260500/640000] base_lr: 1.2951e-04 lr: 1.3591e-05 eta: 6 days, 11:57:43 time: 1.4920 data_time: 0.0228 memory: 25717 grad_norm: 3.6146 loss: 1.3240 detection_loss_cls: 0.0358 detection_loss_reg: 0.3435 caption_loss_cls: 2.2810 grounding_loss_reg: 2.7311 semantic_segmentation_loss_cls: 0.0090 instance_segmentation_loss_cls: 0.0332 instance_segmentation_loss_reg: 0.3373 instance_segmentation_loss_poly: 0.9146 +2024/01/06 07:31:35 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240105_135304 +2024/01/06 07:31:35 - mmengine - INFO - Iter(train) [261000/640000] base_lr: 1.2927e-04 lr: 1.3570e-05 eta: 6 days, 11:47:47 time: 1.5021 data_time: 0.0229 memory: 25717 grad_norm: 3.5547 loss: 1.3047 detection_loss_cls: 0.0359 detection_loss_reg: 0.3435 caption_loss_cls: 2.2809 grounding_loss_reg: 2.7302 semantic_segmentation_loss_cls: 0.0090 instance_segmentation_loss_cls: 0.0332 instance_segmentation_loss_reg: 0.3371 instance_segmentation_loss_poly: 0.9140 +2024/01/06 07:43:45 - mmengine - INFO - Iter(train) [261500/640000] base_lr: 1.2904e-04 lr: 1.3549e-05 eta: 6 days, 11:33:57 time: 1.4966 data_time: 0.0229 memory: 25717 grad_norm: 3.6315 loss: 1.3112 detection_loss_cls: 0.0359 detection_loss_reg: 0.3439 caption_loss_cls: 2.2783 grounding_loss_reg: 2.7335 semantic_segmentation_loss_cls: 0.0089 instance_segmentation_loss_cls: 0.0331 instance_segmentation_loss_reg: 0.3361 instance_segmentation_loss_poly: 0.9117 +2024/01/06 07:56:05 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240105_135304 +2024/01/06 07:56:05 - mmengine - INFO - Iter(train) [262000/640000] base_lr: 1.2881e-04 lr: 1.3528e-05 eta: 6 days, 11:21:35 time: 1.5006 data_time: 0.0229 memory: 25717 grad_norm: 3.6028 loss: 1.2985 detection_loss_cls: 0.0358 detection_loss_reg: 0.3430 caption_loss_cls: 2.2787 grounding_loss_reg: 2.7364 semantic_segmentation_loss_cls: 0.0089 instance_segmentation_loss_cls: 0.0332 instance_segmentation_loss_reg: 0.3371 instance_segmentation_loss_poly: 0.9147 +2024/01/06 07:56:05 - mmengine - INFO - Saving checkpoint at 262000 iterations +2024/01/06 08:08:59 - mmengine - INFO - Iter(train) [262500/640000] base_lr: 1.2857e-04 lr: 1.3507e-05 eta: 6 days, 11:14:15 time: 1.4970 data_time: 0.0228 memory: 25717 grad_norm: 3.5775 loss: 1.3022 detection_loss_cls: 0.0359 detection_loss_reg: 0.3441 caption_loss_cls: 2.2769 grounding_loss_reg: 2.7397 semantic_segmentation_loss_cls: 0.0089 instance_segmentation_loss_cls: 0.0333 instance_segmentation_loss_reg: 0.3373 instance_segmentation_loss_poly: 0.9160 +2024/01/06 08:21:12 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240105_135304 +2024/01/06 08:21:12 - mmengine - INFO - Iter(train) [263000/640000] base_lr: 1.2834e-04 lr: 1.3485e-05 eta: 6 days, 11:00:50 time: 1.4971 data_time: 0.0229 memory: 25717 grad_norm: 3.4754 loss: 1.3049 detection_loss_cls: 0.0359 detection_loss_reg: 0.3448 caption_loss_cls: 2.2764 grounding_loss_reg: 2.7406 semantic_segmentation_loss_cls: 0.0089 instance_segmentation_loss_cls: 0.0333 instance_segmentation_loss_reg: 0.3380 instance_segmentation_loss_poly: 0.9175 +2024/01/06 08:33:46 - mmengine - INFO - Iter(train) [263500/640000] base_lr: 1.2811e-04 lr: 1.3464e-05 eta: 6 days, 10:50:28 time: 1.5010 data_time: 0.0232 memory: 25717 grad_norm: 3.3113 loss: 1.3156 detection_loss_cls: 0.0359 detection_loss_reg: 0.3453 caption_loss_cls: 2.2776 grounding_loss_reg: 2.7383 semantic_segmentation_loss_cls: 0.0089 instance_segmentation_loss_cls: 0.0333 instance_segmentation_loss_reg: 0.3376 instance_segmentation_loss_poly: 0.9177 +2024/01/06 08:45:26 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240105_135304 +2024/01/06 08:45:26 - mmengine - INFO - Iter(train) [264000/640000] base_lr: 1.2787e-04 lr: 1.3443e-05 eta: 6 days, 10:32:22 time: 1.4861 data_time: 0.0231 memory: 25717 grad_norm: 3.3228 loss: 1.3385 detection_loss_cls: 0.0358 detection_loss_reg: 0.3438 caption_loss_cls: 2.2794 grounding_loss_reg: 2.7435 semantic_segmentation_loss_cls: 0.0089 instance_segmentation_loss_cls: 0.0333 instance_segmentation_loss_reg: 0.3373 instance_segmentation_loss_poly: 0.9165 +2024/01/06 08:45:26 - mmengine - INFO - Saving checkpoint at 264000 iterations +2024/01/06 08:59:05 - mmengine - INFO - Iter(train) [264500/640000] base_lr: 1.2764e-04 lr: 1.3422e-05 eta: 6 days, 10:31:10 time: 1.5010 data_time: 0.0276 memory: 25717 grad_norm: 3.2964 loss: 1.3185 detection_loss_cls: 0.0357 detection_loss_reg: 0.3442 caption_loss_cls: 2.2732 grounding_loss_reg: 2.7422 semantic_segmentation_loss_cls: 0.0089 instance_segmentation_loss_cls: 0.0332 instance_segmentation_loss_reg: 0.3357 instance_segmentation_loss_poly: 0.9132 +2024/01/06 09:11:59 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240105_135304 +2024/01/06 09:11:59 - mmengine - INFO - Iter(train) [265000/640000] base_lr: 1.2741e-04 lr: 1.3400e-05 eta: 6 days, 10:23:22 time: 1.5055 data_time: 0.0279 memory: 25717 grad_norm: 3.2931 loss: 1.3339 detection_loss_cls: 0.0358 detection_loss_reg: 0.3444 caption_loss_cls: 2.2729 grounding_loss_reg: 2.7410 semantic_segmentation_loss_cls: 0.0089 instance_segmentation_loss_cls: 0.0334 instance_segmentation_loss_reg: 0.3371 instance_segmentation_loss_poly: 0.9155 +2024/01/06 09:24:07 - mmengine - INFO - Iter(train) [265500/640000] base_lr: 1.2717e-04 lr: 1.3379e-05 eta: 6 days, 10:09:10 time: 1.5049 data_time: 0.0278 memory: 25717 grad_norm: 3.2882 loss: 1.3320 detection_loss_cls: 0.0357 detection_loss_reg: 0.3434 caption_loss_cls: 2.2727 grounding_loss_reg: 2.7423 semantic_segmentation_loss_cls: 0.0089 instance_segmentation_loss_cls: 0.0334 instance_segmentation_loss_reg: 0.3378 instance_segmentation_loss_poly: 0.9162 +2024/01/06 09:36:35 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240105_135304 +2024/01/06 09:36:35 - mmengine - INFO - Iter(train) [266000/640000] base_lr: 1.2694e-04 lr: 1.3358e-05 eta: 6 days, 9:57:44 time: 1.5069 data_time: 0.0278 memory: 25717 grad_norm: 3.3069 loss: 1.3370 detection_loss_cls: 0.0357 detection_loss_reg: 0.3444 caption_loss_cls: 2.2740 grounding_loss_reg: 2.7397 semantic_segmentation_loss_cls: 0.0089 instance_segmentation_loss_cls: 0.0336 instance_segmentation_loss_reg: 0.3390 instance_segmentation_loss_poly: 0.9188 +2024/01/06 09:36:35 - mmengine - INFO - Saving checkpoint at 266000 iterations +2024/01/06 09:48:49 - mmengine - INFO - Iter(train) [266500/640000] base_lr: 1.2670e-04 lr: 1.3337e-05 eta: 6 days, 9:44:24 time: 1.4969 data_time: 0.0276 memory: 25717 grad_norm: 3.3812 loss: 1.3435 detection_loss_cls: 0.0359 detection_loss_reg: 0.3455 caption_loss_cls: 2.2696 grounding_loss_reg: 2.7405 semantic_segmentation_loss_cls: 0.0089 instance_segmentation_loss_cls: 0.0336 instance_segmentation_loss_reg: 0.3391 instance_segmentation_loss_poly: 0.9199 +2024/01/06 10:01:28 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240105_135304 +2024/01/06 10:01:28 - mmengine - INFO - Iter(train) [267000/640000] base_lr: 1.2647e-04 lr: 1.3315e-05 eta: 6 days, 9:34:29 time: 1.5035 data_time: 0.0277 memory: 25717 grad_norm: 3.3445 loss: 1.3267 detection_loss_cls: 0.0359 detection_loss_reg: 0.3454 caption_loss_cls: 2.2661 grounding_loss_reg: 2.7416 semantic_segmentation_loss_cls: 0.0089 instance_segmentation_loss_cls: 0.0335 instance_segmentation_loss_reg: 0.3386 instance_segmentation_loss_poly: 0.9180 +2024/01/06 10:13:16 - mmengine - INFO - Iter(train) [267500/640000] base_lr: 1.2623e-04 lr: 1.3294e-05 eta: 6 days, 9:17:41 time: 1.4919 data_time: 0.0272 memory: 25717 grad_norm: 3.4560 loss: 1.3303 detection_loss_cls: 0.0359 detection_loss_reg: 0.3459 caption_loss_cls: 2.2656 grounding_loss_reg: 2.7404 semantic_segmentation_loss_cls: 0.0089 instance_segmentation_loss_cls: 0.0334 instance_segmentation_loss_reg: 0.3378 instance_segmentation_loss_poly: 0.9159 +2024/01/06 10:25:20 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240105_135304 +2024/01/06 10:25:20 - mmengine - INFO - Iter(train) [268000/640000] base_lr: 1.2600e-04 lr: 1.3272e-05 eta: 6 days, 9:03:10 time: 1.4979 data_time: 0.0273 memory: 25717 grad_norm: 3.4869 loss: 1.3158 detection_loss_cls: 0.0359 detection_loss_reg: 0.3453 caption_loss_cls: 2.2619 grounding_loss_reg: 2.7380 semantic_segmentation_loss_cls: 0.0089 instance_segmentation_loss_cls: 0.0335 instance_segmentation_loss_reg: 0.3389 instance_segmentation_loss_poly: 0.9183 +2024/01/06 10:25:20 - mmengine - INFO - Saving checkpoint at 268000 iterations +2024/01/06 10:37:51 - mmengine - INFO - Iter(train) [268500/640000] base_lr: 1.2576e-04 lr: 1.3251e-05 eta: 6 days, 8:52:05 time: 1.4808 data_time: 0.0270 memory: 25717 grad_norm: 3.5805 loss: 1.3388 detection_loss_cls: 0.0358 detection_loss_reg: 0.3449 caption_loss_cls: 2.2632 grounding_loss_reg: 2.7408 semantic_segmentation_loss_cls: 0.0089 instance_segmentation_loss_cls: 0.0334 instance_segmentation_loss_reg: 0.3379 instance_segmentation_loss_poly: 0.9164 +2024/01/06 10:50:37 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240105_135304 +2024/01/06 10:50:37 - mmengine - INFO - Iter(train) [269000/640000] base_lr: 1.2553e-04 lr: 1.3230e-05 eta: 6 days, 8:43:00 time: 1.4791 data_time: 0.0270 memory: 25717 grad_norm: 3.6355 loss: 1.3387 detection_loss_cls: 0.0359 detection_loss_reg: 0.3454 caption_loss_cls: 2.2624 grounding_loss_reg: 2.7390 semantic_segmentation_loss_cls: 0.0088 instance_segmentation_loss_cls: 0.0335 instance_segmentation_loss_reg: 0.3394 instance_segmentation_loss_poly: 0.9202 +2024/01/06 11:03:06 - mmengine - INFO - Iter(train) [269500/640000] base_lr: 1.2529e-04 lr: 1.3208e-05 eta: 6 days, 8:31:32 time: 1.4842 data_time: 0.0272 memory: 25717 grad_norm: 3.5684 loss: 1.3354 detection_loss_cls: 0.0360 detection_loss_reg: 0.3459 caption_loss_cls: 2.2588 grounding_loss_reg: 2.7392 semantic_segmentation_loss_cls: 0.0089 instance_segmentation_loss_cls: 0.0335 instance_segmentation_loss_reg: 0.3401 instance_segmentation_loss_poly: 0.9205 +2024/01/06 11:15:23 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240105_135304 +2024/01/06 11:15:23 - mmengine - INFO - Iter(train) [270000/640000] base_lr: 1.2506e-04 lr: 1.3187e-05 eta: 6 days, 8:18:43 time: 1.4816 data_time: 0.0272 memory: 25717 grad_norm: 3.4862 loss: 1.3324 detection_loss_cls: 0.0359 detection_loss_reg: 0.3460 caption_loss_cls: 2.2603 grounding_loss_reg: 2.7391 semantic_segmentation_loss_cls: 0.0089 instance_segmentation_loss_cls: 0.0334 instance_segmentation_loss_reg: 0.3403 instance_segmentation_loss_poly: 0.9218 +2024/01/06 11:15:23 - mmengine - INFO - Saving checkpoint at 270000 iterations +2024/01/06 11:27:52 - mmengine - INFO - Iter(train) [270500/640000] base_lr: 1.2482e-04 lr: 1.3165e-05 eta: 6 days, 8:07:21 time: 1.4854 data_time: 0.0271 memory: 25717 grad_norm: 3.3991 loss: 1.3193 detection_loss_cls: 0.0357 detection_loss_reg: 0.3449 caption_loss_cls: 2.2595 grounding_loss_reg: 2.7385 semantic_segmentation_loss_cls: 0.0088 instance_segmentation_loss_cls: 0.0332 instance_segmentation_loss_reg: 0.3388 instance_segmentation_loss_poly: 0.9184 +2024/01/06 11:40:08 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240105_135304 +2024/01/06 11:40:08 - mmengine - INFO - Iter(train) [271000/640000] base_lr: 1.2458e-04 lr: 1.3144e-05 eta: 6 days, 7:54:15 time: 1.4793 data_time: 0.0270 memory: 25717 grad_norm: 3.3820 loss: 1.3336 detection_loss_cls: 0.0356 detection_loss_reg: 0.3444 caption_loss_cls: 2.2611 grounding_loss_reg: 2.7343 semantic_segmentation_loss_cls: 0.0088 instance_segmentation_loss_cls: 0.0333 instance_segmentation_loss_reg: 0.3394 instance_segmentation_loss_poly: 0.9205 +2024/01/06 11:52:07 - mmengine - INFO - Iter(train) [271500/640000] base_lr: 1.2435e-04 lr: 1.3123e-05 eta: 6 days, 7:39:15 time: 1.4822 data_time: 0.0271 memory: 25717 grad_norm: 3.3014 loss: 1.3321 detection_loss_cls: 0.0356 detection_loss_reg: 0.3449 caption_loss_cls: 2.2610 grounding_loss_reg: 2.7324 semantic_segmentation_loss_cls: 0.0088 instance_segmentation_loss_cls: 0.0333 instance_segmentation_loss_reg: 0.3392 instance_segmentation_loss_poly: 0.9196 +2024/01/06 12:04:15 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240105_135304 +2024/01/06 12:04:15 - mmengine - INFO - Iter(train) [272000/640000] base_lr: 1.2411e-04 lr: 1.3101e-05 eta: 6 days, 7:25:26 time: 1.4833 data_time: 0.0270 memory: 25717 grad_norm: 3.2875 loss: 1.3273 detection_loss_cls: 0.0355 detection_loss_reg: 0.3449 caption_loss_cls: 2.2605 grounding_loss_reg: 2.7298 semantic_segmentation_loss_cls: 0.0088 instance_segmentation_loss_cls: 0.0332 instance_segmentation_loss_reg: 0.3386 instance_segmentation_loss_poly: 0.9188 +2024/01/06 12:04:15 - mmengine - INFO - Saving checkpoint at 272000 iterations +2024/01/06 12:17:07 - mmengine - INFO - Iter(train) [272500/640000] base_lr: 1.2388e-04 lr: 1.3080e-05 eta: 6 days, 7:16:41 time: 1.4886 data_time: 0.0271 memory: 25717 grad_norm: 3.2159 loss: 1.3265 detection_loss_cls: 0.0354 detection_loss_reg: 0.3443 caption_loss_cls: 2.2620 grounding_loss_reg: 2.7299 semantic_segmentation_loss_cls: 0.0088 instance_segmentation_loss_cls: 0.0331 instance_segmentation_loss_reg: 0.3379 instance_segmentation_loss_poly: 0.9184 +2024/01/06 12:29:34 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240105_135304 +2024/01/06 12:29:34 - mmengine - INFO - Iter(train) [273000/640000] base_lr: 1.2364e-04 lr: 1.3058e-05 eta: 6 days, 7:05:02 time: 1.4837 data_time: 0.0268 memory: 25717 grad_norm: 3.2233 loss: 1.3187 detection_loss_cls: 0.0352 detection_loss_reg: 0.3430 caption_loss_cls: 2.2577 grounding_loss_reg: 2.7323 semantic_segmentation_loss_cls: 0.0088 instance_segmentation_loss_cls: 0.0330 instance_segmentation_loss_reg: 0.3373 instance_segmentation_loss_poly: 0.9169 +2024/01/06 12:41:32 - mmengine - INFO - Iter(train) [273500/640000] base_lr: 1.2340e-04 lr: 1.3037e-05 eta: 6 days, 6:50:02 time: 1.4761 data_time: 0.0264 memory: 25717 grad_norm: 3.1866 loss: 1.3074 detection_loss_cls: 0.0352 detection_loss_reg: 0.3430 caption_loss_cls: 2.2612 grounding_loss_reg: 2.7315 semantic_segmentation_loss_cls: 0.0087 instance_segmentation_loss_cls: 0.0329 instance_segmentation_loss_reg: 0.3356 instance_segmentation_loss_poly: 0.9135 +2024/01/06 12:53:58 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240105_135304 +2024/01/06 12:53:58 - mmengine - INFO - Iter(train) [274000/640000] base_lr: 1.2317e-04 lr: 1.3015e-05 eta: 6 days, 6:38:16 time: 1.4783 data_time: 0.0263 memory: 25717 grad_norm: 3.1696 loss: 1.3039 detection_loss_cls: 0.0352 detection_loss_reg: 0.3429 caption_loss_cls: 2.2607 grounding_loss_reg: 2.7295 semantic_segmentation_loss_cls: 0.0087 instance_segmentation_loss_cls: 0.0328 instance_segmentation_loss_reg: 0.3349 instance_segmentation_loss_poly: 0.9119 +2024/01/06 12:53:58 - mmengine - INFO - Saving checkpoint at 274000 iterations +2024/01/06 13:06:19 - mmengine - INFO - Iter(train) [274500/640000] base_lr: 1.2293e-04 lr: 1.2994e-05 eta: 6 days, 6:25:49 time: 1.4760 data_time: 0.0265 memory: 25717 grad_norm: 3.2640 loss: 1.3198 detection_loss_cls: 0.0350 detection_loss_reg: 0.3421 caption_loss_cls: 2.2657 grounding_loss_reg: 2.7285 semantic_segmentation_loss_cls: 0.0087 instance_segmentation_loss_cls: 0.0328 instance_segmentation_loss_reg: 0.3356 instance_segmentation_loss_poly: 0.9120 +2024/01/06 13:19:08 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240105_135304 +2024/01/06 13:19:08 - mmengine - INFO - Iter(train) [275000/640000] base_lr: 1.2269e-04 lr: 1.2972e-05 eta: 6 days, 6:16:35 time: 1.4846 data_time: 0.0265 memory: 25717 grad_norm: 3.2561 loss: 1.3094 detection_loss_cls: 0.0349 detection_loss_reg: 0.3419 caption_loss_cls: 2.2665 grounding_loss_reg: 2.7272 semantic_segmentation_loss_cls: 0.0087 instance_segmentation_loss_cls: 0.0326 instance_segmentation_loss_reg: 0.3342 instance_segmentation_loss_poly: 0.9087 +2024/01/06 13:31:48 - mmengine - INFO - Iter(train) [275500/640000] base_lr: 1.2245e-04 lr: 1.2950e-05 eta: 6 days, 6:06:17 time: 1.4948 data_time: 0.0268 memory: 25717 grad_norm: 3.3597 loss: 1.3100 detection_loss_cls: 0.0349 detection_loss_reg: 0.3422 caption_loss_cls: 2.2676 grounding_loss_reg: 2.7292 semantic_segmentation_loss_cls: 0.0087 instance_segmentation_loss_cls: 0.0326 instance_segmentation_loss_reg: 0.3343 instance_segmentation_loss_poly: 0.9093 +2024/01/06 13:44:16 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240105_135304 +2024/01/06 13:44:16 - mmengine - INFO - Iter(train) [276000/640000] base_lr: 1.2222e-04 lr: 1.2929e-05 eta: 6 days, 5:54:38 time: 1.4997 data_time: 0.0269 memory: 25717 grad_norm: 3.3049 loss: 1.3005 detection_loss_cls: 0.0350 detection_loss_reg: 0.3424 caption_loss_cls: 2.2707 grounding_loss_reg: 2.7278 semantic_segmentation_loss_cls: 0.0087 instance_segmentation_loss_cls: 0.0325 instance_segmentation_loss_reg: 0.3342 instance_segmentation_loss_poly: 0.9101 +2024/01/06 13:44:16 - mmengine - INFO - Saving checkpoint at 276000 iterations +2024/01/06 14:09:08 - mmengine - INFO - Iter(train) [276500/640000] base_lr: 1.2198e-04 lr: 1.2907e-05 eta: 6 days, 4:35:31 time: 1.4907 data_time: 0.0218 memory: 25718 grad_norm: 3.3125 loss: 1.2952 detection_loss_cls: 0.0349 detection_loss_reg: 0.3423 caption_loss_cls: 2.2685 grounding_loss_reg: 2.7227 semantic_segmentation_loss_cls: 0.0087 instance_segmentation_loss_cls: 0.0325 instance_segmentation_loss_reg: 0.3354 instance_segmentation_loss_poly: 0.9132 +2024/01/06 14:21:36 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240106_135333 +2024/01/06 14:21:36 - mmengine - INFO - Iter(train) [277000/640000] base_lr: 1.2174e-04 lr: 1.2886e-05 eta: 6 days, 5:31:16 time: 1.4908 data_time: 0.0216 memory: 25717 grad_norm: 3.3106 loss: 1.3073 detection_loss_cls: 0.0348 detection_loss_reg: 0.3428 caption_loss_cls: 2.2669 grounding_loss_reg: 2.7207 semantic_segmentation_loss_cls: 0.0087 instance_segmentation_loss_cls: 0.0327 instance_segmentation_loss_reg: 0.3366 instance_segmentation_loss_poly: 0.9159 +2024/01/06 14:33:42 - mmengine - INFO - Iter(train) [277500/640000] base_lr: 1.2150e-04 lr: 1.2864e-05 eta: 6 days, 4:17:56 time: 1.4929 data_time: 0.0213 memory: 25717 grad_norm: 3.3444 loss: 1.3030 detection_loss_cls: 0.0347 detection_loss_reg: 0.3411 caption_loss_cls: 2.2636 grounding_loss_reg: 2.7180 semantic_segmentation_loss_cls: 0.0087 instance_segmentation_loss_cls: 0.0326 instance_segmentation_loss_reg: 0.3354 instance_segmentation_loss_poly: 0.9130 +2024/01/06 14:45:51 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240106_135333 +2024/01/06 14:45:51 - mmengine - INFO - Iter(train) [278000/640000] base_lr: 1.2127e-04 lr: 1.2842e-05 eta: 6 days, 3:42:06 time: 1.4885 data_time: 0.0211 memory: 25717 grad_norm: 3.3382 loss: 1.3072 detection_loss_cls: 0.0346 detection_loss_reg: 0.3415 caption_loss_cls: 2.2629 grounding_loss_reg: 2.7145 semantic_segmentation_loss_cls: 0.0087 instance_segmentation_loss_cls: 0.0327 instance_segmentation_loss_reg: 0.3358 instance_segmentation_loss_poly: 0.9146 +2024/01/06 14:45:51 - mmengine - INFO - Saving checkpoint at 278000 iterations +2024/01/06 14:58:28 - mmengine - INFO - Iter(train) [278500/640000] base_lr: 1.2103e-04 lr: 1.2821e-05 eta: 6 days, 4:23:22 time: 1.4927 data_time: 0.0206 memory: 25717 grad_norm: 3.2558 loss: 1.2964 detection_loss_cls: 0.0346 detection_loss_reg: 0.3414 caption_loss_cls: 2.2603 grounding_loss_reg: 2.7096 semantic_segmentation_loss_cls: 0.0087 instance_segmentation_loss_cls: 0.0326 instance_segmentation_loss_reg: 0.3363 instance_segmentation_loss_poly: 0.9155 +2024/01/06 15:10:37 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240106_135333 +2024/01/06 15:10:37 - mmengine - INFO - Iter(train) [279000/640000] base_lr: 1.2079e-04 lr: 1.2799e-05 eta: 6 days, 3:50:58 time: 1.4827 data_time: 0.0203 memory: 25717 grad_norm: 3.2574 loss: 1.3042 detection_loss_cls: 0.0347 detection_loss_reg: 0.3426 caption_loss_cls: 2.2613 grounding_loss_reg: 2.7041 semantic_segmentation_loss_cls: 0.0086 instance_segmentation_loss_cls: 0.0326 instance_segmentation_loss_reg: 0.3377 instance_segmentation_loss_poly: 0.9186 +2024/01/06 15:22:39 - mmengine - INFO - Iter(train) [279500/640000] base_lr: 1.2055e-04 lr: 1.2778e-05 eta: 6 days, 3:11:20 time: 1.4731 data_time: 0.0198 memory: 25717 grad_norm: 3.1140 loss: 1.3015 detection_loss_cls: 0.0347 detection_loss_reg: 0.3429 caption_loss_cls: 2.2599 grounding_loss_reg: 2.7012 semantic_segmentation_loss_cls: 0.0087 instance_segmentation_loss_cls: 0.0326 instance_segmentation_loss_reg: 0.3378 instance_segmentation_loss_poly: 0.9186 +2024/01/06 15:35:17 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240106_135333 +2024/01/06 15:35:17 - mmengine - INFO - Iter(train) [280000/640000] base_lr: 1.2031e-04 lr: 1.2756e-05 eta: 6 days, 3:33:52 time: 1.4756 data_time: 0.0196 memory: 25717 grad_norm: 3.1182 loss: 1.3074 detection_loss_cls: 0.0347 detection_loss_reg: 0.3432 caption_loss_cls: 2.2594 grounding_loss_reg: 2.7008 semantic_segmentation_loss_cls: 0.0086 instance_segmentation_loss_cls: 0.0326 instance_segmentation_loss_reg: 0.3373 instance_segmentation_loss_poly: 0.9174 +2024/01/06 15:35:17 - mmengine - INFO - Saving checkpoint at 280000 iterations +2024/01/06 15:47:31 - mmengine - INFO - Evaluating bbox... +2024/01/06 15:48:27 - mmengine - INFO - bbox_mAP_copypaste: 0.477 0.658 0.523 0.325 0.530 0.610 +2024/01/06 15:48:27 - mmengine - INFO - Evaluating segm... +2024/01/06 15:49:41 - mmengine - INFO - segm_mAP_copypaste: 0.317 0.575 0.304 0.177 0.365 0.482 +2024/01/06 15:58:50 - mmengine - INFO - per class results: +2024/01/06 15:58:50 - mmengine - INFO - ++---------------------+-------+-------+ +| Class | IoU | Acc | ++---------------------+-------+-------+ +| wall | 77.86 | 88.91 | +| building | 82.02 | 91.93 | +| sky | 93.55 | 97.47 | +| floor | 81.94 | 91.53 | +| tree | 73.31 | 87.73 | +| ceiling | 82.32 | 94.83 | +| road | 81.94 | 91.13 | +| bed | 89.16 | 94.9 | +| windowpane | 61.73 | 75.58 | +| grass | 64.13 | 78.2 | +| cabinet | 62.26 | 73.01 | +| sidewalk | 62.37 | 78.12 | +| person | 80.92 | 91.16 | +| earth | 37.27 | 48.36 | +| door | 52.05 | 65.97 | +| table | 63.95 | 79.66 | +| mountain | 60.08 | 68.78 | +| plant | 53.05 | 66.13 | +| curtain | 75.45 | 85.94 | +| chair | 58.45 | 70.66 | +| car | 83.43 | 92.4 | +| water | 53.89 | 71.2 | +| painting | 73.22 | 86.97 | +| sofa | 68.64 | 84.28 | +| shelf | 45.18 | 70.5 | +| house | 28.24 | 30.49 | +| sea | 50.32 | 69.62 | +| mirror | 67.26 | 73.35 | +| rug | 70.59 | 77.2 | +| field | 25.22 | 41.86 | +| armchair | 47.11 | 66.91 | +| seat | 61.92 | 74.53 | +| fence | 45.62 | 62.78 | +| desk | 44.65 | 68.05 | +| rock | 45.11 | 71.85 | +| wardrobe | 41.53 | 54.06 | +| lamp | 60.87 | 75.59 | +| bathtub | 76.23 | 79.31 | +| railing | 33.46 | 47.73 | +| cushion | 59.19 | 66.48 | +| base | 22.42 | 32.3 | +| box | 26.77 | 34.11 | +| column | 49.32 | 62.09 | +| signboard | 31.76 | 37.56 | +| chest of drawers | 41.94 | 60.89 | +| counter | 26.18 | 33.36 | +| sand | 47.01 | 58.27 | +| sink | 73.08 | 81.87 | +| skyscraper | 52.58 | 65.71 | +| fireplace | 73.56 | 86.76 | +| refrigerator | 74.22 | 77.21 | +| grandstand | 34.21 | 74.76 | +| path | 18.43 | 30.2 | +| stairs | 33.49 | 37.89 | +| runway | 66.69 | 95.77 | +| case | 58.72 | 83.99 | +| pool table | 91.18 | 94.66 | +| pillow | 61.56 | 76.85 | +| screen door | 84.1 | 87.11 | +| stairway | 39.64 | 52.89 | +| river | 15.51 | 30.59 | +| bridge | 66.56 | 86.96 | +| bookcase | 36.71 | 57.61 | +| blind | 48.44 | 69.8 | +| coffee table | 65.49 | 77.14 | +| toilet | 85.48 | 89.12 | +| flower | 35.35 | 47.85 | +| book | 49.15 | 68.49 | +| hill | 15.71 | 25.67 | +| bench | 55.2 | 67.27 | +| countertop | 57.96 | 67.3 | +| stove | 75.11 | 82.86 | +| palm | 43.35 | 64.14 | +| kitchen island | 43.97 | 73.5 | +| computer | 61.42 | 69.66 | +| swivel chair | 35.99 | 45.31 | +| boat | 58.46 | 64.68 | +| bar | 39.4 | 54.64 | +| arcade machine | 68.52 | 76.35 | +| hovel | 23.97 | 26.0 | +| bus | 90.72 | 95.39 | +| towel | 64.62 | 73.15 | +| light | 50.12 | 60.33 | +| truck | 38.74 | 57.52 | +| tower | 22.19 | 36.77 | +| chandelier | 57.53 | 65.62 | +| awning | 28.62 | 30.99 | +| streetlight | 33.56 | 46.74 | +| booth | 34.41 | 39.82 | +| television receiver | 67.59 | 78.88 | +| airplane | 57.23 | 65.19 | +| dirt track | 8.02 | 16.01 | +| apparel | 35.81 | 49.0 | +| pole | 26.62 | 38.17 | +| land | 4.45 | 8.86 | +| bannister | 14.82 | 20.64 | +| escalator | 15.68 | 15.98 | +| ottoman | 53.81 | 67.2 | +| bottle | 21.23 | 27.35 | +| buffet | 47.58 | 60.97 | +| poster | 26.07 | 47.97 | +| stage | 10.32 | 18.11 | +| van | 44.84 | 56.4 | +| ship | 7.72 | 9.94 | +| fountain | 4.95 | 5.01 | +| conveyer belt | 60.39 | 93.14 | +| canopy | 38.1 | 42.93 | +| washer | 65.68 | 66.31 | +| plaything | 35.15 | 48.06 | +| swimming pool | 58.79 | 82.16 | +| stool | 45.49 | 53.62 | +| barrel | 38.26 | 63.89 | +| basket | 30.75 | 42.99 | +| waterfall | 45.19 | 63.9 | +| tent | 88.73 | 97.12 | +| bag | 18.36 | 21.51 | +| minibike | 70.68 | 79.01 | +| cradle | 76.15 | 95.06 | +| oven | 59.01 | 75.03 | +| ball | 50.0 | 70.9 | +| food | 52.21 | 58.37 | +| step | 7.55 | 8.93 | +| tank | 33.81 | 41.64 | +| trade name | 32.15 | 45.19 | +| microwave | 85.03 | 94.45 | +| pot | 51.43 | 59.31 | +| animal | 57.9 | 61.18 | +| bicycle | 57.72 | 76.57 | +| lake | 57.05 | 63.05 | +| dishwasher | 57.84 | 72.62 | +| screen | 59.24 | 81.14 | +| blanket | 15.06 | 17.35 | +| sculpture | 39.73 | 62.41 | +| hood | 55.18 | 63.59 | +| sconce | 36.79 | 45.14 | +| vase | 44.39 | 52.79 | +| traffic light | 39.64 | 56.98 | +| tray | 8.1 | 10.96 | +| ashcan | 45.47 | 61.65 | +| fan | 52.84 | 59.71 | +| pier | 47.15 | 69.72 | +| crt screen | 5.78 | 6.14 | +| plate | 54.22 | 73.77 | +| monitor | 40.09 | 87.56 | +| bulletin board | 45.47 | 67.7 | +| shower | 5.35 | 6.19 | +| radiator | 55.61 | 61.22 | +| glass | 17.85 | 19.28 | +| clock | 24.84 | 30.05 | +| flag | 25.71 | 28.24 | ++---------------------+-------+-------+ +2024/01/06 15:59:08 - mmengine - INFO - Iter(val) [209/209] coco/bbox_mAP: 0.4770 coco/bbox_mAP_50: 0.6580 coco/bbox_mAP_75: 0.5230 coco/bbox_mAP_s: 0.3250 coco/bbox_mAP_m: 0.5300 coco/bbox_mAP_l: 0.6100 coco/segm_mAP: 0.3170 coco/segm_mAP_50: 0.5750 coco/segm_mAP_75: 0.3040 coco/segm_mAP_s: 0.1770 coco/segm_mAP_m: 0.3650 coco/segm_mAP_l: 0.4820 Bleu_1: 0.7426 Bleu_2: 0.5739 Bleu_3: 0.4301 Bleu_4: 0.3197 METEOR: 0.2620 ROUGE_L: 0.5439 CIDEr: 1.0330 SPICE: 0.1914 aAcc: 82.9900 mIoU: 48.8200 mAcc: 60.8300 visual-grounding/miou: 0.7925 visual-grounding/acc: 0.8611 data_time: 0.0097 time: 1.3524 +2024/01/06 16:10:25 - mmengine - INFO - Iter(train) [280500/640000] base_lr: 1.2008e-04 lr: 1.2734e-05 eta: 6 days, 2:04:38 time: 1.4617 data_time: 0.0205 memory: 25719 grad_norm: 3.1370 loss: 1.3188 detection_loss_cls: 0.0349 detection_loss_reg: 0.3451 caption_loss_cls: 2.2515 grounding_loss_reg: 2.6972 semantic_segmentation_loss_cls: 0.0086 instance_segmentation_loss_cls: 0.0327 instance_segmentation_loss_reg: 0.3383 instance_segmentation_loss_poly: 0.9193 +2024/01/06 16:23:03 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240106_135333 +2024/01/06 16:23:03 - mmengine - INFO - Iter(train) [281000/640000] base_lr: 1.1984e-04 lr: 1.2713e-05 eta: 6 days, 2:23:54 time: 1.4644 data_time: 0.0209 memory: 25719 grad_norm: 3.0263 loss: 1.3103 detection_loss_cls: 0.0349 detection_loss_reg: 0.3470 caption_loss_cls: 2.2493 grounding_loss_reg: 2.6968 semantic_segmentation_loss_cls: 0.0087 instance_segmentation_loss_cls: 0.0329 instance_segmentation_loss_reg: 0.3414 instance_segmentation_loss_poly: 0.9249 +2024/01/06 16:35:09 - mmengine - INFO - Iter(train) [281500/640000] base_lr: 1.1960e-04 lr: 1.2691e-05 eta: 6 days, 2:02:24 time: 1.4642 data_time: 0.0214 memory: 25719 grad_norm: 2.9860 loss: 1.3206 detection_loss_cls: 0.0348 detection_loss_reg: 0.3464 caption_loss_cls: 2.2498 grounding_loss_reg: 2.6918 semantic_segmentation_loss_cls: 0.0087 instance_segmentation_loss_cls: 0.0328 instance_segmentation_loss_reg: 0.3418 instance_segmentation_loss_poly: 0.9265 +2024/01/06 16:47:14 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240106_135333 +2024/01/06 16:47:14 - mmengine - INFO - Iter(train) [282000/640000] base_lr: 1.1936e-04 lr: 1.2669e-05 eta: 6 days, 1:41:58 time: 1.4633 data_time: 0.0217 memory: 25719 grad_norm: 3.0320 loss: 1.3197 detection_loss_cls: 0.0349 detection_loss_reg: 0.3473 caption_loss_cls: 2.2481 grounding_loss_reg: 2.6841 semantic_segmentation_loss_cls: 0.0086 instance_segmentation_loss_cls: 0.0328 instance_segmentation_loss_reg: 0.3418 instance_segmentation_loss_poly: 0.9260 +2024/01/06 16:47:14 - mmengine - INFO - Saving checkpoint at 282000 iterations +2024/01/06 16:59:06 - mmengine - INFO - Iter(train) [282500/640000] base_lr: 1.1912e-04 lr: 1.2647e-05 eta: 6 days, 1:10:05 time: 1.4519 data_time: 0.0223 memory: 25719 grad_norm: 3.0587 loss: 1.3294 detection_loss_cls: 0.0349 detection_loss_reg: 0.3475 caption_loss_cls: 2.2504 grounding_loss_reg: 2.6836 semantic_segmentation_loss_cls: 0.0086 instance_segmentation_loss_cls: 0.0327 instance_segmentation_loss_reg: 0.3423 instance_segmentation_loss_poly: 0.9271 +2024/01/06 17:11:04 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240106_135333 +2024/01/06 17:11:04 - mmengine - INFO - Iter(train) [283000/640000] base_lr: 1.1888e-04 lr: 1.2626e-05 eta: 6 days, 0:46:49 time: 1.4491 data_time: 0.0225 memory: 25719 grad_norm: 3.0461 loss: 1.3261 detection_loss_cls: 0.0348 detection_loss_reg: 0.3465 caption_loss_cls: 2.2488 grounding_loss_reg: 2.6808 semantic_segmentation_loss_cls: 0.0086 instance_segmentation_loss_cls: 0.0326 instance_segmentation_loss_reg: 0.3418 instance_segmentation_loss_poly: 0.9261 +2024/01/06 17:23:21 - mmengine - INFO - Iter(train) [283500/640000] base_lr: 1.1864e-04 lr: 1.2604e-05 eta: 6 days, 0:39:52 time: 1.4530 data_time: 0.0228 memory: 25719 grad_norm: 3.0344 loss: 1.3233 detection_loss_cls: 0.0347 detection_loss_reg: 0.3460 caption_loss_cls: 2.2445 grounding_loss_reg: 2.6817 semantic_segmentation_loss_cls: 0.0086 instance_segmentation_loss_cls: 0.0325 instance_segmentation_loss_reg: 0.3412 instance_segmentation_loss_poly: 0.9243 +2024/01/06 17:35:30 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240106_135333 +2024/01/06 17:35:30 - mmengine - INFO - Iter(train) [284000/640000] base_lr: 1.1840e-04 lr: 1.2582e-05 eta: 6 days, 0:26:35 time: 1.4457 data_time: 0.0229 memory: 25719 grad_norm: 3.0125 loss: 1.3322 detection_loss_cls: 0.0348 detection_loss_reg: 0.3464 caption_loss_cls: 2.2459 grounding_loss_reg: 2.6760 semantic_segmentation_loss_cls: 0.0086 instance_segmentation_loss_cls: 0.0324 instance_segmentation_loss_reg: 0.3402 instance_segmentation_loss_poly: 0.9221 +2024/01/06 17:35:30 - mmengine - INFO - Saving checkpoint at 284000 iterations +2024/01/06 17:47:49 - mmengine - INFO - Iter(train) [284500/640000] base_lr: 1.1817e-04 lr: 1.2560e-05 eta: 6 days, 0:20:17 time: 1.4604 data_time: 0.0271 memory: 25719 grad_norm: 2.9733 loss: 1.3198 detection_loss_cls: 0.0349 detection_loss_reg: 0.3475 caption_loss_cls: 2.2509 grounding_loss_reg: 2.6708 semantic_segmentation_loss_cls: 0.0086 instance_segmentation_loss_cls: 0.0324 instance_segmentation_loss_reg: 0.3407 instance_segmentation_loss_poly: 0.9230 +2024/01/06 17:59:52 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240106_135333 +2024/01/06 17:59:52 - mmengine - INFO - Iter(train) [285000/640000] base_lr: 1.1793e-04 lr: 1.2539e-05 eta: 6 days, 0:02:47 time: 1.4516 data_time: 0.0268 memory: 25719 grad_norm: 3.0190 loss: 1.3123 detection_loss_cls: 0.0346 detection_loss_reg: 0.3446 caption_loss_cls: 2.2484 grounding_loss_reg: 2.6718 semantic_segmentation_loss_cls: 0.0086 instance_segmentation_loss_cls: 0.0321 instance_segmentation_loss_reg: 0.3386 instance_segmentation_loss_poly: 0.9185 +2024/01/06 18:12:54 - mmengine - INFO - Iter(train) [285500/640000] base_lr: 1.1769e-04 lr: 1.2517e-05 eta: 6 days, 0:22:23 time: 1.4656 data_time: 0.0269 memory: 25719 grad_norm: 2.9604 loss: 1.2952 detection_loss_cls: 0.0346 detection_loss_reg: 0.3449 caption_loss_cls: 2.2418 grounding_loss_reg: 2.6683 semantic_segmentation_loss_cls: 0.0086 instance_segmentation_loss_cls: 0.0321 instance_segmentation_loss_reg: 0.3387 instance_segmentation_loss_poly: 0.9184 +2024/01/06 18:25:01 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240106_135333 +2024/01/06 18:25:01 - mmengine - INFO - Iter(train) [286000/640000] base_lr: 1.1745e-04 lr: 1.2495e-05 eta: 6 days, 0:06:17 time: 1.4660 data_time: 0.0269 memory: 25719 grad_norm: 2.9012 loss: 1.2944 detection_loss_cls: 0.0345 detection_loss_reg: 0.3448 caption_loss_cls: 2.2396 grounding_loss_reg: 2.6669 semantic_segmentation_loss_cls: 0.0086 instance_segmentation_loss_cls: 0.0321 instance_segmentation_loss_reg: 0.3391 instance_segmentation_loss_poly: 0.9196 +2024/01/06 18:25:01 - mmengine - INFO - Saving checkpoint at 286000 iterations +2024/01/06 18:38:00 - mmengine - INFO - Iter(train) [286500/640000] base_lr: 1.1721e-04 lr: 1.2473e-05 eta: 6 days, 0:20:03 time: 1.4830 data_time: 0.0266 memory: 25719 grad_norm: 2.8467 loss: 1.2671 detection_loss_cls: 0.0345 detection_loss_reg: 0.3442 caption_loss_cls: 2.2405 grounding_loss_reg: 2.6650 semantic_segmentation_loss_cls: 0.0086 instance_segmentation_loss_cls: 0.0319 instance_segmentation_loss_reg: 0.3370 instance_segmentation_loss_poly: 0.9153 +2024/01/06 18:50:39 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240106_135333 +2024/01/06 18:50:39 - mmengine - INFO - Iter(train) [287000/640000] base_lr: 1.1697e-04 lr: 1.2452e-05 eta: 6 days, 0:20:42 time: 1.4933 data_time: 0.0268 memory: 25719 grad_norm: 2.7928 loss: 1.2606 detection_loss_cls: 0.0345 detection_loss_reg: 0.3446 caption_loss_cls: 2.2395 grounding_loss_reg: 2.6637 semantic_segmentation_loss_cls: 0.0086 instance_segmentation_loss_cls: 0.0319 instance_segmentation_loss_reg: 0.3372 instance_segmentation_loss_poly: 0.9156 +2024/01/06 19:02:47 - mmengine - INFO - Iter(train) [287500/640000] base_lr: 1.1673e-04 lr: 1.2430e-05 eta: 6 days, 0:03:59 time: 1.4910 data_time: 0.0267 memory: 25719 grad_norm: 2.7694 loss: 1.2660 detection_loss_cls: 0.0345 detection_loss_reg: 0.3441 caption_loss_cls: 2.2373 grounding_loss_reg: 2.6650 semantic_segmentation_loss_cls: 0.0086 instance_segmentation_loss_cls: 0.0318 instance_segmentation_loss_reg: 0.3370 instance_segmentation_loss_poly: 0.9157 +2024/01/06 19:14:02 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240106_135333 +2024/01/06 19:14:02 - mmengine - INFO - Iter(train) [288000/640000] base_lr: 1.1649e-04 lr: 1.2408e-05 eta: 5 days, 23:21:55 time: 1.4774 data_time: 0.0266 memory: 25719 grad_norm: 2.7709 loss: 1.2697 detection_loss_cls: 0.0345 detection_loss_reg: 0.3445 caption_loss_cls: 2.2368 grounding_loss_reg: 2.6656 semantic_segmentation_loss_cls: 0.0086 instance_segmentation_loss_cls: 0.0317 instance_segmentation_loss_reg: 0.3369 instance_segmentation_loss_poly: 0.9168 +2024/01/06 19:14:02 - mmengine - INFO - Saving checkpoint at 288000 iterations +2024/01/06 19:26:32 - mmengine - INFO - Iter(train) [288500/640000] base_lr: 1.1625e-04 lr: 1.2386e-05 eta: 5 days, 23:17:33 time: 1.4802 data_time: 0.0268 memory: 25719 grad_norm: 2.7685 loss: 1.2769 detection_loss_cls: 0.0346 detection_loss_reg: 0.3450 caption_loss_cls: 2.2364 grounding_loss_reg: 2.6626 semantic_segmentation_loss_cls: 0.0086 instance_segmentation_loss_cls: 0.0318 instance_segmentation_loss_reg: 0.3373 instance_segmentation_loss_poly: 0.9169 +2024/01/06 19:37:59 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240106_135333 +2024/01/06 19:37:59 - mmengine - INFO - Iter(train) [289000/640000] base_lr: 1.1601e-04 lr: 1.2364e-05 eta: 5 days, 22:44:07 time: 1.4712 data_time: 0.0267 memory: 25719 grad_norm: 2.7818 loss: 1.2790 detection_loss_cls: 0.0345 detection_loss_reg: 0.3445 caption_loss_cls: 2.2296 grounding_loss_reg: 2.6596 semantic_segmentation_loss_cls: 0.0086 instance_segmentation_loss_cls: 0.0318 instance_segmentation_loss_reg: 0.3372 instance_segmentation_loss_poly: 0.9165 +2024/01/06 19:49:59 - mmengine - INFO - Iter(train) [289500/640000] base_lr: 1.1577e-04 lr: 1.2342e-05 eta: 5 days, 22:26:38 time: 1.4557 data_time: 0.0267 memory: 25719 grad_norm: 2.8334 loss: 1.3048 detection_loss_cls: 0.0344 detection_loss_reg: 0.3441 caption_loss_cls: 2.2335 grounding_loss_reg: 2.6579 semantic_segmentation_loss_cls: 0.0086 instance_segmentation_loss_cls: 0.0317 instance_segmentation_loss_reg: 0.3370 instance_segmentation_loss_poly: 0.9155 +2024/01/06 20:02:27 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240106_135333 +2024/01/06 20:02:27 - mmengine - INFO - Iter(train) [290000/640000] base_lr: 1.1553e-04 lr: 1.2321e-05 eta: 5 days, 22:21:03 time: 1.4609 data_time: 0.0268 memory: 25719 grad_norm: 2.8193 loss: 1.3064 detection_loss_cls: 0.0344 detection_loss_reg: 0.3435 caption_loss_cls: 2.2309 grounding_loss_reg: 2.6546 semantic_segmentation_loss_cls: 0.0086 instance_segmentation_loss_cls: 0.0318 instance_segmentation_loss_reg: 0.3370 instance_segmentation_loss_poly: 0.9159 +2024/01/06 20:02:27 - mmengine - INFO - Saving checkpoint at 290000 iterations +2024/01/06 20:14:36 - mmengine - INFO - Iter(train) [290500/640000] base_lr: 1.1529e-04 lr: 1.2299e-05 eta: 5 days, 22:07:53 time: 1.4486 data_time: 0.0269 memory: 25719 grad_norm: 2.8352 loss: 1.3329 detection_loss_cls: 0.0344 detection_loss_reg: 0.3438 caption_loss_cls: 2.2261 grounding_loss_reg: 2.6544 semantic_segmentation_loss_cls: 0.0086 instance_segmentation_loss_cls: 0.0319 instance_segmentation_loss_reg: 0.3367 instance_segmentation_loss_poly: 0.9135 +2024/01/06 20:26:32 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240106_135333 +2024/01/06 20:26:32 - mmengine - INFO - Iter(train) [291000/640000] base_lr: 1.1505e-04 lr: 1.2277e-05 eta: 5 days, 21:49:09 time: 1.4376 data_time: 0.0268 memory: 25719 grad_norm: 2.8661 loss: 1.3398 detection_loss_cls: 0.0344 detection_loss_reg: 0.3450 caption_loss_cls: 2.2231 grounding_loss_reg: 2.6517 semantic_segmentation_loss_cls: 0.0085 instance_segmentation_loss_cls: 0.0320 instance_segmentation_loss_reg: 0.3379 instance_segmentation_loss_poly: 0.9154 +2024/01/06 20:38:44 - mmengine - INFO - Iter(train) [291500/640000] base_lr: 1.1481e-04 lr: 1.2255e-05 eta: 5 days, 21:37:04 time: 1.4387 data_time: 0.0268 memory: 25719 grad_norm: 2.9026 loss: 1.3381 detection_loss_cls: 0.0343 detection_loss_reg: 0.3444 caption_loss_cls: 2.2218 grounding_loss_reg: 2.6509 semantic_segmentation_loss_cls: 0.0086 instance_segmentation_loss_cls: 0.0319 instance_segmentation_loss_reg: 0.3370 instance_segmentation_loss_poly: 0.9123 +2024/01/06 20:50:58 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240106_135333 +2024/01/06 20:50:58 - mmengine - INFO - Iter(train) [292000/640000] base_lr: 1.1456e-04 lr: 1.2233e-05 eta: 5 days, 21:25:54 time: 1.4536 data_time: 0.0269 memory: 25719 grad_norm: 2.8855 loss: 1.3306 detection_loss_cls: 0.0344 detection_loss_reg: 0.3445 caption_loss_cls: 2.2214 grounding_loss_reg: 2.6474 semantic_segmentation_loss_cls: 0.0086 instance_segmentation_loss_cls: 0.0320 instance_segmentation_loss_reg: 0.3376 instance_segmentation_loss_poly: 0.9136 +2024/01/06 20:50:59 - mmengine - INFO - Saving checkpoint at 292000 iterations +2024/01/06 21:03:11 - mmengine - INFO - Iter(train) [292500/640000] base_lr: 1.1432e-04 lr: 1.2211e-05 eta: 5 days, 21:13:50 time: 1.4491 data_time: 0.0264 memory: 25719 grad_norm: 2.8969 loss: 1.3248 detection_loss_cls: 0.0345 detection_loss_reg: 0.3450 caption_loss_cls: 2.2229 grounding_loss_reg: 2.6468 semantic_segmentation_loss_cls: 0.0086 instance_segmentation_loss_cls: 0.0320 instance_segmentation_loss_reg: 0.3379 instance_segmentation_loss_poly: 0.9142 +2024/01/06 21:16:12 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240106_135333 +2024/01/06 21:16:12 - mmengine - INFO - Iter(train) [293000/640000] base_lr: 1.1408e-04 lr: 1.2189e-05 eta: 5 days, 21:18:30 time: 1.4728 data_time: 0.0269 memory: 25719 grad_norm: 3.0742 loss: 1.3205 detection_loss_cls: 0.0346 detection_loss_reg: 0.3462 caption_loss_cls: 2.2186 grounding_loss_reg: 2.6426 semantic_segmentation_loss_cls: 0.0086 instance_segmentation_loss_cls: 0.0321 instance_segmentation_loss_reg: 0.3395 instance_segmentation_loss_poly: 0.9170 +2024/01/06 21:28:30 - mmengine - INFO - Iter(train) [293500/640000] base_lr: 1.1384e-04 lr: 1.2167e-05 eta: 5 days, 21:07:55 time: 1.4773 data_time: 0.0268 memory: 25719 grad_norm: 3.1232 loss: 1.3129 detection_loss_cls: 0.0347 detection_loss_reg: 0.3470 caption_loss_cls: 2.2149 grounding_loss_reg: 2.6414 semantic_segmentation_loss_cls: 0.0086 instance_segmentation_loss_cls: 0.0321 instance_segmentation_loss_reg: 0.3399 instance_segmentation_loss_poly: 0.9172 +2024/01/06 21:40:14 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240106_135333 +2024/01/06 21:40:14 - mmengine - INFO - Iter(train) [294000/640000] base_lr: 1.1360e-04 lr: 1.2146e-05 eta: 5 days, 20:46:07 time: 1.4663 data_time: 0.0265 memory: 25719 grad_norm: 3.1812 loss: 1.3168 detection_loss_cls: 0.0347 detection_loss_reg: 0.3473 caption_loss_cls: 2.2138 grounding_loss_reg: 2.6414 semantic_segmentation_loss_cls: 0.0086 instance_segmentation_loss_cls: 0.0321 instance_segmentation_loss_reg: 0.3405 instance_segmentation_loss_poly: 0.9181 +2024/01/06 21:40:14 - mmengine - INFO - Saving checkpoint at 294000 iterations +2024/01/06 21:52:12 - mmengine - INFO - Iter(train) [294500/640000] base_lr: 1.1336e-04 lr: 1.2124e-05 eta: 5 days, 20:29:22 time: 1.4633 data_time: 0.0260 memory: 25719 grad_norm: 3.2577 loss: 1.3163 detection_loss_cls: 0.0348 detection_loss_reg: 0.3476 caption_loss_cls: 2.2105 grounding_loss_reg: 2.6413 semantic_segmentation_loss_cls: 0.0086 instance_segmentation_loss_cls: 0.0321 instance_segmentation_loss_reg: 0.3407 instance_segmentation_loss_poly: 0.9181 +2024/01/06 22:04:56 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240106_135333 +2024/01/06 22:04:56 - mmengine - INFO - Iter(train) [295000/640000] base_lr: 1.1312e-04 lr: 1.2102e-05 eta: 5 days, 20:26:49 time: 1.4754 data_time: 0.0262 memory: 25719 grad_norm: 3.2596 loss: 1.3133 detection_loss_cls: 0.0348 detection_loss_reg: 0.3467 caption_loss_cls: 2.2117 grounding_loss_reg: 2.6369 semantic_segmentation_loss_cls: 0.0086 instance_segmentation_loss_cls: 0.0322 instance_segmentation_loss_reg: 0.3419 instance_segmentation_loss_poly: 0.9200 +2024/01/06 22:18:07 - mmengine - INFO - Iter(train) [295500/640000] base_lr: 1.1288e-04 lr: 1.2080e-05 eta: 5 days, 20:31:50 time: 1.4903 data_time: 0.0262 memory: 25719 grad_norm: 3.2502 loss: 1.3012 detection_loss_cls: 0.0347 detection_loss_reg: 0.3458 caption_loss_cls: 2.2135 grounding_loss_reg: 2.6359 semantic_segmentation_loss_cls: 0.0086 instance_segmentation_loss_cls: 0.0321 instance_segmentation_loss_reg: 0.3408 instance_segmentation_loss_poly: 0.9181 +2024/01/06 22:30:19 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240106_135333 +2024/01/06 22:30:19 - mmengine - INFO - Iter(train) [296000/640000] base_lr: 1.1264e-04 lr: 1.2058e-05 eta: 5 days, 20:18:42 time: 1.4895 data_time: 0.0262 memory: 25719 grad_norm: 3.3052 loss: 1.3037 detection_loss_cls: 0.0347 detection_loss_reg: 0.3455 caption_loss_cls: 2.2141 grounding_loss_reg: 2.6358 semantic_segmentation_loss_cls: 0.0086 instance_segmentation_loss_cls: 0.0320 instance_segmentation_loss_reg: 0.3401 instance_segmentation_loss_poly: 0.9159 +2024/01/06 22:30:19 - mmengine - INFO - Saving checkpoint at 296000 iterations +2024/01/06 22:43:12 - mmengine - INFO - Iter(train) [296500/640000] base_lr: 1.1240e-04 lr: 1.2036e-05 eta: 5 days, 20:17:11 time: 1.4997 data_time: 0.0262 memory: 25719 grad_norm: 3.3220 loss: 1.3024 detection_loss_cls: 0.0347 detection_loss_reg: 0.3458 caption_loss_cls: 2.2145 grounding_loss_reg: 2.6356 semantic_segmentation_loss_cls: 0.0086 instance_segmentation_loss_cls: 0.0320 instance_segmentation_loss_reg: 0.3399 instance_segmentation_loss_poly: 0.9144 +2024/01/06 22:55:06 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240106_135333 +2024/01/06 22:55:06 - mmengine - INFO - Iter(train) [297000/640000] base_lr: 1.1215e-04 lr: 1.2014e-05 eta: 5 days, 19:59:14 time: 1.4830 data_time: 0.0257 memory: 25719 grad_norm: 3.1654 loss: 1.3107 detection_loss_cls: 0.0347 detection_loss_reg: 0.3449 caption_loss_cls: 2.2139 grounding_loss_reg: 2.6347 semantic_segmentation_loss_cls: 0.0086 instance_segmentation_loss_cls: 0.0320 instance_segmentation_loss_reg: 0.3396 instance_segmentation_loss_poly: 0.9146 +2024/01/06 23:07:33 - mmengine - INFO - Iter(train) [297500/640000] base_lr: 1.1191e-04 lr: 1.1992e-05 eta: 5 days, 19:50:07 time: 1.4851 data_time: 0.0257 memory: 25719 grad_norm: 3.2047 loss: 1.3097 detection_loss_cls: 0.0347 detection_loss_reg: 0.3450 caption_loss_cls: 2.2174 grounding_loss_reg: 2.6327 semantic_segmentation_loss_cls: 0.0086 instance_segmentation_loss_cls: 0.0318 instance_segmentation_loss_reg: 0.3385 instance_segmentation_loss_poly: 0.9126 +2024/01/06 23:20:24 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240106_135333 +2024/01/06 23:20:24 - mmengine - INFO - Iter(train) [298000/640000] base_lr: 1.1167e-04 lr: 1.1970e-05 eta: 5 days, 19:47:07 time: 1.5019 data_time: 0.0260 memory: 25719 grad_norm: 3.1542 loss: 1.2994 detection_loss_cls: 0.0347 detection_loss_reg: 0.3442 caption_loss_cls: 2.2233 grounding_loss_reg: 2.6334 semantic_segmentation_loss_cls: 0.0086 instance_segmentation_loss_cls: 0.0318 instance_segmentation_loss_reg: 0.3383 instance_segmentation_loss_poly: 0.9128 +2024/01/06 23:20:24 - mmengine - INFO - Saving checkpoint at 298000 iterations +2024/01/06 23:32:52 - mmengine - INFO - Iter(train) [298500/640000] base_lr: 1.1143e-04 lr: 1.1948e-05 eta: 5 days, 19:37:55 time: 1.5095 data_time: 0.0260 memory: 25719 grad_norm: 3.1211 loss: 1.2893 detection_loss_cls: 0.0348 detection_loss_reg: 0.3444 caption_loss_cls: 2.2193 grounding_loss_reg: 2.6385 semantic_segmentation_loss_cls: 0.0086 instance_segmentation_loss_cls: 0.0318 instance_segmentation_loss_reg: 0.3379 instance_segmentation_loss_poly: 0.9117 +2024/01/06 23:44:41 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240106_135333 +2024/01/06 23:44:41 - mmengine - INFO - Iter(train) [299000/640000] base_lr: 1.1119e-04 lr: 1.1926e-05 eta: 5 days, 19:19:00 time: 1.4958 data_time: 0.0257 memory: 25719 grad_norm: 3.1366 loss: 1.2828 detection_loss_cls: 0.0347 detection_loss_reg: 0.3437 caption_loss_cls: 2.2180 grounding_loss_reg: 2.6400 semantic_segmentation_loss_cls: 0.0086 instance_segmentation_loss_cls: 0.0317 instance_segmentation_loss_reg: 0.3369 instance_segmentation_loss_poly: 0.9088 +2024/01/06 23:56:35 - mmengine - INFO - Iter(train) [299500/640000] base_lr: 1.1095e-04 lr: 1.1904e-05 eta: 5 days, 19:01:36 time: 1.4765 data_time: 0.0258 memory: 25719 grad_norm: 3.2150 loss: 1.2946 detection_loss_cls: 0.0347 detection_loss_reg: 0.3441 caption_loss_cls: 2.2155 grounding_loss_reg: 2.6376 semantic_segmentation_loss_cls: 0.0085 instance_segmentation_loss_cls: 0.0318 instance_segmentation_loss_reg: 0.3381 instance_segmentation_loss_poly: 0.9114 +2024/01/07 00:08:05 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240106_135333 +2024/01/07 00:08:05 - mmengine - INFO - Iter(train) [300000/640000] base_lr: 1.1070e-04 lr: 1.1882e-05 eta: 5 days, 18:38:32 time: 1.4660 data_time: 0.0256 memory: 25719 grad_norm: 3.2593 loss: 1.2986 detection_loss_cls: 0.0347 detection_loss_reg: 0.3442 caption_loss_cls: 2.2204 grounding_loss_reg: 2.6380 semantic_segmentation_loss_cls: 0.0085 instance_segmentation_loss_cls: 0.0318 instance_segmentation_loss_reg: 0.3380 instance_segmentation_loss_poly: 0.9112 +2024/01/07 00:08:05 - mmengine - INFO - Saving checkpoint at 300000 iterations +2024/01/07 00:20:59 - mmengine - INFO - Evaluating bbox... +2024/01/07 00:21:56 - mmengine - INFO - bbox_mAP_copypaste: 0.483 0.662 0.531 0.341 0.533 0.618 +2024/01/07 00:21:56 - mmengine - INFO - Evaluating segm... +2024/01/07 00:23:08 - mmengine - INFO - segm_mAP_copypaste: 0.315 0.577 0.307 0.185 0.363 0.468 +2024/01/07 00:30:47 - mmengine - INFO - per class results: +2024/01/07 00:30:47 - mmengine - INFO - ++---------------------+-------+-------+ +| Class | IoU | Acc | ++---------------------+-------+-------+ +| wall | 77.4 | 88.84 | +| building | 82.85 | 90.23 | +| sky | 93.26 | 97.41 | +| floor | 81.72 | 90.93 | +| tree | 73.49 | 89.79 | +| ceiling | 83.14 | 94.58 | +| road | 82.53 | 90.67 | +| bed | 88.94 | 93.34 | +| windowpane | 62.15 | 79.0 | +| grass | 67.55 | 82.35 | +| cabinet | 60.67 | 74.45 | +| sidewalk | 64.33 | 78.37 | +| person | 80.61 | 89.81 | +| earth | 39.11 | 54.51 | +| door | 51.78 | 65.62 | +| table | 62.52 | 76.58 | +| mountain | 59.94 | 73.32 | +| plant | 50.24 | 59.49 | +| curtain | 75.21 | 87.36 | +| chair | 56.6 | 66.49 | +| car | 83.37 | 92.01 | +| water | 55.16 | 68.56 | +| painting | 70.67 | 84.4 | +| sofa | 68.33 | 87.17 | +| shelf | 44.8 | 67.1 | +| house | 50.92 | 66.05 | +| sea | 52.67 | 73.4 | +| mirror | 66.82 | 79.32 | +| rug | 60.65 | 67.49 | +| field | 27.56 | 40.67 | +| armchair | 45.04 | 64.26 | +| seat | 64.36 | 81.29 | +| fence | 44.8 | 60.74 | +| desk | 48.49 | 65.53 | +| rock | 46.44 | 64.21 | +| wardrobe | 42.41 | 59.8 | +| lamp | 60.34 | 70.09 | +| bathtub | 76.7 | 83.32 | +| railing | 35.16 | 51.77 | +| cushion | 53.15 | 68.02 | +| base | 25.01 | 36.13 | +| box | 25.6 | 30.37 | +| column | 51.1 | 63.32 | +| signboard | 38.41 | 50.68 | +| chest of drawers | 38.68 | 54.01 | +| counter | 27.45 | 39.83 | +| sand | 41.43 | 52.77 | +| sink | 73.05 | 84.4 | +| skyscraper | 62.62 | 81.61 | +| fireplace | 73.28 | 84.98 | +| refrigerator | 74.05 | 85.56 | +| grandstand | 43.04 | 78.02 | +| path | 21.65 | 33.94 | +| stairs | 36.6 | 47.15 | +| runway | 72.9 | 90.89 | +| case | 50.83 | 55.33 | +| pool table | 91.5 | 94.38 | +| pillow | 55.5 | 68.16 | +| screen door | 78.56 | 84.42 | +| stairway | 33.94 | 39.93 | +| river | 14.13 | 30.76 | +| bridge | 69.03 | 83.65 | +| bookcase | 33.65 | 49.54 | +| blind | 42.93 | 46.87 | +| coffee table | 55.83 | 59.74 | +| toilet | 85.3 | 89.17 | +| flower | 39.38 | 58.27 | +| book | 50.25 | 74.75 | +| hill | 14.66 | 25.17 | +| bench | 53.93 | 73.38 | +| countertop | 56.19 | 62.01 | +| stove | 70.71 | 82.47 | +| palm | 44.99 | 74.65 | +| kitchen island | 44.34 | 80.07 | +| computer | 61.97 | 68.18 | +| swivel chair | 44.46 | 69.25 | +| boat | 61.16 | 66.49 | +| bar | 41.92 | 53.5 | +| arcade machine | 35.61 | 36.92 | +| hovel | 32.69 | 35.17 | +| bus | 90.96 | 95.89 | +| towel | 62.21 | 74.78 | +| light | 49.84 | 59.15 | +| truck | 38.59 | 56.45 | +| tower | 21.34 | 36.34 | +| chandelier | 58.83 | 67.1 | +| awning | 33.38 | 45.34 | +| streetlight | 28.02 | 35.79 | +| booth | 37.57 | 43.59 | +| television receiver | 67.07 | 89.35 | +| airplane | 55.33 | 69.16 | +| dirt track | 0.83 | 1.62 | +| apparel | 35.1 | 51.91 | +| pole | 24.82 | 33.24 | +| land | 4.74 | 6.71 | +| bannister | 19.05 | 23.98 | +| escalator | 23.14 | 24.35 | +| ottoman | 50.66 | 70.37 | +| bottle | 21.6 | 28.8 | +| buffet | 45.19 | 59.48 | +| poster | 30.85 | 49.88 | +| stage | 13.27 | 21.47 | +| van | 47.28 | 63.62 | +| ship | 6.48 | 8.19 | +| fountain | 15.07 | 16.81 | +| conveyer belt | 71.24 | 91.22 | +| canopy | 24.66 | 30.22 | +| washer | 67.56 | 68.81 | +| plaything | 33.43 | 38.15 | +| swimming pool | 48.8 | 49.76 | +| stool | 49.06 | 67.94 | +| barrel | 10.92 | 68.3 | +| basket | 28.2 | 38.22 | +| waterfall | 55.93 | 77.77 | +| tent | 61.61 | 97.56 | +| bag | 19.43 | 22.32 | +| minibike | 71.14 | 83.26 | +| cradle | 80.5 | 94.63 | +| oven | 38.64 | 53.92 | +| ball | 47.08 | 75.82 | +| food | 57.37 | 74.73 | +| step | 16.54 | 21.84 | +| tank | 37.73 | 53.02 | +| trade name | 30.43 | 41.52 | +| microwave | 79.29 | 89.56 | +| pot | 51.33 | 58.76 | +| animal | 61.73 | 65.65 | +| bicycle | 57.84 | 80.83 | +| lake | 59.99 | 63.02 | +| dishwasher | 51.32 | 64.39 | +| screen | 51.11 | 84.71 | +| blanket | 18.19 | 23.22 | +| sculpture | 56.68 | 63.19 | +| hood | 60.99 | 66.97 | +| sconce | 26.78 | 28.63 | +| vase | 40.0 | 59.76 | +| traffic light | 37.32 | 64.24 | +| tray | 6.74 | 9.56 | +| ashcan | 39.19 | 58.33 | +| fan | 61.1 | 74.02 | +| pier | 43.82 | 78.75 | +| crt screen | 10.27 | 25.96 | +| plate | 56.81 | 73.5 | +| monitor | 6.98 | 10.83 | +| bulletin board | 48.13 | 63.49 | +| shower | 2.5 | 2.76 | +| radiator | 52.22 | 56.98 | +| glass | 18.27 | 19.89 | +| clock | 24.79 | 31.39 | +| flag | 29.89 | 36.59 | ++---------------------+-------+-------+ +2024/01/07 00:31:05 - mmengine - INFO - Iter(val) [209/209] coco/bbox_mAP: 0.4830 coco/bbox_mAP_50: 0.6620 coco/bbox_mAP_75: 0.5310 coco/bbox_mAP_s: 0.3410 coco/bbox_mAP_m: 0.5330 coco/bbox_mAP_l: 0.6180 coco/segm_mAP: 0.3150 coco/segm_mAP_50: 0.5770 coco/segm_mAP_75: 0.3070 coco/segm_mAP_s: 0.1850 coco/segm_mAP_m: 0.3630 coco/segm_mAP_l: 0.4680 Bleu_1: 0.7452 Bleu_2: 0.5766 Bleu_3: 0.4313 Bleu_4: 0.3176 METEOR: 0.2579 ROUGE_L: 0.5439 CIDEr: 1.0177 SPICE: 0.1912 aAcc: 83.0400 mIoU: 48.3000 mAcc: 60.8800 visual-grounding/miou: 0.7983 visual-grounding/acc: 0.8675 data_time: 0.0058 time: 1.3479 +2024/01/07 00:43:06 - mmengine - INFO - Iter(train) [300500/640000] base_lr: 1.1046e-04 lr: 1.1860e-05 eta: 5 days, 18:23:59 time: 1.4538 data_time: 0.0220 memory: 25719 grad_norm: 3.2636 loss: 1.3025 detection_loss_cls: 0.0346 detection_loss_reg: 0.3436 caption_loss_cls: 2.2228 grounding_loss_reg: 2.6378 semantic_segmentation_loss_cls: 0.0085 instance_segmentation_loss_cls: 0.0317 instance_segmentation_loss_reg: 0.3369 instance_segmentation_loss_poly: 0.9078 +2024/01/07 00:55:41 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240106_135333 +2024/01/07 00:55:41 - mmengine - INFO - Iter(train) [301000/640000] base_lr: 1.1022e-04 lr: 1.1838e-05 eta: 5 days, 18:16:36 time: 1.4641 data_time: 0.0222 memory: 25719 grad_norm: 3.2234 loss: 1.2901 detection_loss_cls: 0.0345 detection_loss_reg: 0.3417 caption_loss_cls: 2.2202 grounding_loss_reg: 2.6342 semantic_segmentation_loss_cls: 0.0085 instance_segmentation_loss_cls: 0.0315 instance_segmentation_loss_reg: 0.3363 instance_segmentation_loss_poly: 0.9066 +2024/01/07 01:08:19 - mmengine - INFO - Iter(train) [301500/640000] base_lr: 1.0998e-04 lr: 1.1816e-05 eta: 5 days, 18:09:33 time: 1.4669 data_time: 0.0223 memory: 25719 grad_norm: 3.1191 loss: 1.2859 detection_loss_cls: 0.0344 detection_loss_reg: 0.3405 caption_loss_cls: 2.2260 grounding_loss_reg: 2.6360 semantic_segmentation_loss_cls: 0.0085 instance_segmentation_loss_cls: 0.0314 instance_segmentation_loss_reg: 0.3346 instance_segmentation_loss_poly: 0.9016 +2024/01/07 01:20:53 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240106_135333 +2024/01/07 01:20:53 - mmengine - INFO - Iter(train) [302000/640000] base_lr: 1.0974e-04 lr: 1.1794e-05 eta: 5 days, 18:01:22 time: 1.4626 data_time: 0.0223 memory: 25719 grad_norm: 3.1403 loss: 1.2836 detection_loss_cls: 0.0344 detection_loss_reg: 0.3405 caption_loss_cls: 2.2164 grounding_loss_reg: 2.6373 semantic_segmentation_loss_cls: 0.0085 instance_segmentation_loss_cls: 0.0313 instance_segmentation_loss_reg: 0.3332 instance_segmentation_loss_poly: 0.8992 +2024/01/07 01:20:53 - mmengine - INFO - Saving checkpoint at 302000 iterations +2024/01/07 01:33:47 - mmengine - INFO - Iter(train) [302500/640000] base_lr: 1.0949e-04 lr: 1.1772e-05 eta: 5 days, 17:57:24 time: 1.4691 data_time: 0.0226 memory: 25719 grad_norm: 3.0942 loss: 1.2828 detection_loss_cls: 0.0343 detection_loss_reg: 0.3403 caption_loss_cls: 2.2170 grounding_loss_reg: 2.6360 semantic_segmentation_loss_cls: 0.0085 instance_segmentation_loss_cls: 0.0314 instance_segmentation_loss_reg: 0.3346 instance_segmentation_loss_poly: 0.9014 +2024/01/07 01:46:33 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240106_135333 +2024/01/07 01:46:33 - mmengine - INFO - Iter(train) [303000/640000] base_lr: 1.0925e-04 lr: 1.1750e-05 eta: 5 days, 17:51:13 time: 1.4831 data_time: 0.0231 memory: 25719 grad_norm: 3.0477 loss: 1.2802 detection_loss_cls: 0.0343 detection_loss_reg: 0.3406 caption_loss_cls: 2.2173 grounding_loss_reg: 2.6329 semantic_segmentation_loss_cls: 0.0085 instance_segmentation_loss_cls: 0.0314 instance_segmentation_loss_reg: 0.3340 instance_segmentation_loss_poly: 0.8990 +2024/01/07 01:59:55 - mmengine - INFO - Iter(train) [303500/640000] base_lr: 1.0901e-04 lr: 1.1728e-05 eta: 5 days, 17:52:26 time: 1.5052 data_time: 0.0232 memory: 25719 grad_norm: 2.9409 loss: 1.2738 detection_loss_cls: 0.0343 detection_loss_reg: 0.3413 caption_loss_cls: 2.2191 grounding_loss_reg: 2.6328 semantic_segmentation_loss_cls: 0.0085 instance_segmentation_loss_cls: 0.0315 instance_segmentation_loss_reg: 0.3362 instance_segmentation_loss_poly: 0.9033 +2024/01/07 02:11:48 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240106_135333 +2024/01/07 02:11:48 - mmengine - INFO - Iter(train) [304000/640000] base_lr: 1.0877e-04 lr: 1.1706e-05 eta: 5 days, 17:35:09 time: 1.5111 data_time: 0.0234 memory: 25719 grad_norm: 2.8603 loss: 1.2687 detection_loss_cls: 0.0343 detection_loss_reg: 0.3416 caption_loss_cls: 2.2174 grounding_loss_reg: 2.6322 semantic_segmentation_loss_cls: 0.0085 instance_segmentation_loss_cls: 0.0315 instance_segmentation_loss_reg: 0.3366 instance_segmentation_loss_poly: 0.9044 +2024/01/07 02:11:48 - mmengine - INFO - Saving checkpoint at 304000 iterations +2024/01/07 02:24:14 - mmengine - INFO - Iter(train) [304500/640000] base_lr: 1.0853e-04 lr: 1.1684e-05 eta: 5 days, 17:24:28 time: 1.5164 data_time: 0.0270 memory: 25719 grad_norm: 2.8329 loss: 1.2697 detection_loss_cls: 0.0342 detection_loss_reg: 0.3421 caption_loss_cls: 2.2203 grounding_loss_reg: 2.6307 semantic_segmentation_loss_cls: 0.0085 instance_segmentation_loss_cls: 0.0314 instance_segmentation_loss_reg: 0.3358 instance_segmentation_loss_poly: 0.9021 +2024/01/07 02:36:40 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240106_135333 +2024/01/07 02:36:40 - mmengine - INFO - Iter(train) [305000/640000] base_lr: 1.0828e-04 lr: 1.1662e-05 eta: 5 days, 17:13:47 time: 1.5140 data_time: 0.0269 memory: 25719 grad_norm: 2.8213 loss: 1.2756 detection_loss_cls: 0.0343 detection_loss_reg: 0.3426 caption_loss_cls: 2.2234 grounding_loss_reg: 2.6292 semantic_segmentation_loss_cls: 0.0085 instance_segmentation_loss_cls: 0.0315 instance_segmentation_loss_reg: 0.3371 instance_segmentation_loss_poly: 0.9047 +2024/01/07 02:48:40 - mmengine - INFO - Iter(train) [305500/640000] base_lr: 1.0804e-04 lr: 1.1640e-05 eta: 5 days, 16:58:11 time: 1.5045 data_time: 0.0267 memory: 25719 grad_norm: 2.8517 loss: 1.2867 detection_loss_cls: 0.0343 detection_loss_reg: 0.3438 caption_loss_cls: 2.2296 grounding_loss_reg: 2.6261 semantic_segmentation_loss_cls: 0.0085 instance_segmentation_loss_cls: 0.0314 instance_segmentation_loss_reg: 0.3365 instance_segmentation_loss_poly: 0.9045 +2024/01/07 03:00:36 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240106_135333 +2024/01/07 03:00:36 - mmengine - INFO - Iter(train) [306000/640000] base_lr: 1.0780e-04 lr: 1.1618e-05 eta: 5 days, 16:42:03 time: 1.4953 data_time: 0.0265 memory: 25719 grad_norm: 2.8442 loss: 1.2881 detection_loss_cls: 0.0342 detection_loss_reg: 0.3422 caption_loss_cls: 2.2267 grounding_loss_reg: 2.6261 semantic_segmentation_loss_cls: 0.0085 instance_segmentation_loss_cls: 0.0313 instance_segmentation_loss_reg: 0.3358 instance_segmentation_loss_poly: 0.9028 +2024/01/07 03:00:36 - mmengine - INFO - Saving checkpoint at 306000 iterations +2024/01/07 03:13:29 - mmengine - INFO - Iter(train) [306500/640000] base_lr: 1.0756e-04 lr: 1.1596e-05 eta: 5 days, 16:36:20 time: 1.4949 data_time: 0.0264 memory: 25719 grad_norm: 2.8325 loss: 1.2904 detection_loss_cls: 0.0342 detection_loss_reg: 0.3428 caption_loss_cls: 2.2270 grounding_loss_reg: 2.6268 semantic_segmentation_loss_cls: 0.0084 instance_segmentation_loss_cls: 0.0315 instance_segmentation_loss_reg: 0.3376 instance_segmentation_loss_poly: 0.9076 +2024/01/07 03:25:00 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240106_135333 +2024/01/07 03:25:00 - mmengine - INFO - Iter(train) [307000/640000] base_lr: 1.0731e-04 lr: 1.1574e-05 eta: 5 days, 16:15:42 time: 1.4763 data_time: 0.0259 memory: 25719 grad_norm: 2.8743 loss: 1.3090 detection_loss_cls: 0.0340 detection_loss_reg: 0.3418 caption_loss_cls: 2.2311 grounding_loss_reg: 2.6250 semantic_segmentation_loss_cls: 0.0084 instance_segmentation_loss_cls: 0.0314 instance_segmentation_loss_reg: 0.3366 instance_segmentation_loss_poly: 0.9050 +2024/01/07 03:36:58 - mmengine - INFO - Iter(train) [307500/640000] base_lr: 1.0707e-04 lr: 1.1552e-05 eta: 5 days, 16:00:07 time: 1.4551 data_time: 0.0255 memory: 25719 grad_norm: 2.8881 loss: 1.3175 detection_loss_cls: 0.0340 detection_loss_reg: 0.3424 caption_loss_cls: 2.2326 grounding_loss_reg: 2.6229 semantic_segmentation_loss_cls: 0.0084 instance_segmentation_loss_cls: 0.0314 instance_segmentation_loss_reg: 0.3369 instance_segmentation_loss_poly: 0.9048 +2024/01/07 03:48:37 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240106_135333 +2024/01/07 03:48:37 - mmengine - INFO - Iter(train) [308000/640000] base_lr: 1.0683e-04 lr: 1.1530e-05 eta: 5 days, 15:41:21 time: 1.4517 data_time: 0.0254 memory: 25719 grad_norm: 3.9813 loss: 1.3185 detection_loss_cls: 0.0339 detection_loss_reg: 0.3419 caption_loss_cls: 2.2357 grounding_loss_reg: 2.6226 semantic_segmentation_loss_cls: 0.0084 instance_segmentation_loss_cls: 0.0313 instance_segmentation_loss_reg: 0.3358 instance_segmentation_loss_poly: 0.9012 +2024/01/07 03:48:37 - mmengine - INFO - Saving checkpoint at 308000 iterations +2024/01/07 04:00:26 - mmengine - INFO - Iter(train) [308500/640000] base_lr: 1.0659e-04 lr: 1.1508e-05 eta: 5 days, 15:24:32 time: 1.4426 data_time: 0.0250 memory: 25719 grad_norm: 4.0508 loss: 1.3129 detection_loss_cls: 0.0338 detection_loss_reg: 0.3409 caption_loss_cls: 2.2368 grounding_loss_reg: 2.6203 semantic_segmentation_loss_cls: 0.0084 instance_segmentation_loss_cls: 0.0312 instance_segmentation_loss_reg: 0.3347 instance_segmentation_loss_poly: 0.8990 +2024/01/07 04:12:23 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240106_135333 +2024/01/07 04:12:23 - mmengine - INFO - Iter(train) [309000/640000] base_lr: 1.0634e-04 lr: 1.1486e-05 eta: 5 days, 15:09:05 time: 1.4352 data_time: 0.0249 memory: 25719 grad_norm: 4.0997 loss: 1.3225 detection_loss_cls: 0.0336 detection_loss_reg: 0.3399 caption_loss_cls: 2.2384 grounding_loss_reg: 2.6226 semantic_segmentation_loss_cls: 0.0084 instance_segmentation_loss_cls: 0.0311 instance_segmentation_loss_reg: 0.3348 instance_segmentation_loss_poly: 0.8982 +2024/01/07 04:24:22 - mmengine - INFO - Iter(train) [309500/640000] base_lr: 1.0610e-04 lr: 1.1464e-05 eta: 5 days, 14:54:13 time: 1.4351 data_time: 0.0248 memory: 25719 grad_norm: 4.1159 loss: 1.3123 detection_loss_cls: 0.0336 detection_loss_reg: 0.3391 caption_loss_cls: 2.2376 grounding_loss_reg: 2.6203 semantic_segmentation_loss_cls: 0.0084 instance_segmentation_loss_cls: 0.0310 instance_segmentation_loss_reg: 0.3332 instance_segmentation_loss_poly: 0.8948 +2024/01/07 04:36:37 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240106_135333 +2024/01/07 04:36:37 - mmengine - INFO - Iter(train) [310000/640000] base_lr: 1.0586e-04 lr: 1.1442e-05 eta: 5 days, 14:42:03 time: 1.4398 data_time: 0.0248 memory: 25719 grad_norm: 4.1104 loss: 1.3097 detection_loss_cls: 0.0335 detection_loss_reg: 0.3384 caption_loss_cls: 2.2398 grounding_loss_reg: 2.6214 semantic_segmentation_loss_cls: 0.0084 instance_segmentation_loss_cls: 0.0311 instance_segmentation_loss_reg: 0.3328 instance_segmentation_loss_poly: 0.8936 +2024/01/07 04:36:37 - mmengine - INFO - Saving checkpoint at 310000 iterations +2024/01/07 04:49:07 - mmengine - INFO - Iter(train) [310500/640000] base_lr: 1.0562e-04 lr: 1.1420e-05 eta: 5 days, 14:32:03 time: 1.4338 data_time: 0.0248 memory: 25719 grad_norm: 4.1000 loss: 1.3078 detection_loss_cls: 0.0335 detection_loss_reg: 0.3384 caption_loss_cls: 2.2375 grounding_loss_reg: 2.6207 semantic_segmentation_loss_cls: 0.0085 instance_segmentation_loss_cls: 0.0310 instance_segmentation_loss_reg: 0.3330 instance_segmentation_loss_poly: 0.8941 +2024/01/07 05:01:32 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240106_135333 +2024/01/07 05:01:32 - mmengine - INFO - Iter(train) [311000/640000] base_lr: 1.0537e-04 lr: 1.1398e-05 eta: 5 days, 14:21:22 time: 1.4474 data_time: 0.0250 memory: 25719 grad_norm: 4.1318 loss: 1.2975 detection_loss_cls: 0.0337 detection_loss_reg: 0.3390 caption_loss_cls: 2.2372 grounding_loss_reg: 2.6134 semantic_segmentation_loss_cls: 0.0084 instance_segmentation_loss_cls: 0.0309 instance_segmentation_loss_reg: 0.3320 instance_segmentation_loss_poly: 0.8922 +2024/01/07 05:14:53 - mmengine - INFO - Iter(train) [311500/640000] base_lr: 1.0513e-04 lr: 1.1375e-05 eta: 5 days, 14:19:14 time: 1.4681 data_time: 0.0254 memory: 25719 grad_norm: 4.1057 loss: 1.2922 detection_loss_cls: 0.0336 detection_loss_reg: 0.3380 caption_loss_cls: 2.2414 grounding_loss_reg: 2.6131 semantic_segmentation_loss_cls: 0.0084 instance_segmentation_loss_cls: 0.0310 instance_segmentation_loss_reg: 0.3338 instance_segmentation_loss_poly: 0.8962 +2024/01/07 05:27:38 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240106_135333 +2024/01/07 05:27:38 - mmengine - INFO - Iter(train) [312000/640000] base_lr: 1.0489e-04 lr: 1.1353e-05 eta: 5 days, 14:11:23 time: 1.4847 data_time: 0.0255 memory: 25719 grad_norm: 2.9772 loss: 1.2823 detection_loss_cls: 0.0336 detection_loss_reg: 0.3375 caption_loss_cls: 2.2430 grounding_loss_reg: 2.6162 semantic_segmentation_loss_cls: 0.0084 instance_segmentation_loss_cls: 0.0308 instance_segmentation_loss_reg: 0.3321 instance_segmentation_loss_poly: 0.8915 +2024/01/07 05:27:38 - mmengine - INFO - Saving checkpoint at 312000 iterations +2024/01/07 05:39:34 - mmengine - INFO - Iter(train) [312500/640000] base_lr: 1.0464e-04 lr: 1.1331e-05 eta: 5 days, 13:56:00 time: 1.4864 data_time: 0.0258 memory: 25719 grad_norm: 2.9311 loss: 1.2826 detection_loss_cls: 0.0336 detection_loss_reg: 0.3375 caption_loss_cls: 2.2402 grounding_loss_reg: 2.6130 semantic_segmentation_loss_cls: 0.0084 instance_segmentation_loss_cls: 0.0309 instance_segmentation_loss_reg: 0.3319 instance_segmentation_loss_poly: 0.8902 +2024/01/07 05:51:30 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240106_135333 +2024/01/07 05:51:30 - mmengine - INFO - Iter(train) [313000/640000] base_lr: 1.0440e-04 lr: 1.1309e-05 eta: 5 days, 13:40:39 time: 1.4862 data_time: 0.0259 memory: 25719 grad_norm: 2.9255 loss: 1.2827 detection_loss_cls: 0.0335 detection_loss_reg: 0.3371 caption_loss_cls: 2.2454 grounding_loss_reg: 2.6096 semantic_segmentation_loss_cls: 0.0084 instance_segmentation_loss_cls: 0.0310 instance_segmentation_loss_reg: 0.3321 instance_segmentation_loss_poly: 0.8904 +2024/01/07 06:03:57 - mmengine - INFO - Iter(train) [313500/640000] base_lr: 1.0416e-04 lr: 1.1287e-05 eta: 5 days, 13:29:59 time: 1.4931 data_time: 0.0262 memory: 25719 grad_norm: 2.9059 loss: 1.2860 detection_loss_cls: 0.0335 detection_loss_reg: 0.3377 caption_loss_cls: 2.2468 grounding_loss_reg: 2.6089 semantic_segmentation_loss_cls: 0.0084 instance_segmentation_loss_cls: 0.0310 instance_segmentation_loss_reg: 0.3321 instance_segmentation_loss_poly: 0.8903 +2024/01/07 06:15:55 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240106_135333 +2024/01/07 06:15:55 - mmengine - INFO - Iter(train) [314000/640000] base_lr: 1.0392e-04 lr: 1.1265e-05 eta: 5 days, 13:15:08 time: 1.4888 data_time: 0.0263 memory: 25719 grad_norm: 2.9322 loss: 1.3035 detection_loss_cls: 0.0334 detection_loss_reg: 0.3378 caption_loss_cls: 2.2494 grounding_loss_reg: 2.6081 semantic_segmentation_loss_cls: 0.0084 instance_segmentation_loss_cls: 0.0310 instance_segmentation_loss_reg: 0.3324 instance_segmentation_loss_poly: 0.8904 +2024/01/07 06:15:55 - mmengine - INFO - Saving checkpoint at 314000 iterations +2024/01/07 06:29:00 - mmengine - INFO - Iter(train) [314500/640000] base_lr: 1.0367e-04 lr: 1.1243e-05 eta: 5 days, 13:09:48 time: 1.4978 data_time: 0.0264 memory: 25719 grad_norm: 2.9165 loss: 1.2945 detection_loss_cls: 0.0333 detection_loss_reg: 0.3372 caption_loss_cls: 2.2464 grounding_loss_reg: 2.6028 semantic_segmentation_loss_cls: 0.0083 instance_segmentation_loss_cls: 0.0310 instance_segmentation_loss_reg: 0.3322 instance_segmentation_loss_poly: 0.8903 +2024/01/07 06:41:10 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240106_135333 +2024/01/07 06:41:10 - mmengine - INFO - Iter(train) [315000/640000] base_lr: 1.0343e-04 lr: 1.1221e-05 eta: 5 days, 12:56:38 time: 1.4941 data_time: 0.0264 memory: 25719 grad_norm: 2.9133 loss: 1.2992 detection_loss_cls: 0.0334 detection_loss_reg: 0.3381 caption_loss_cls: 2.2434 grounding_loss_reg: 2.6037 semantic_segmentation_loss_cls: 0.0083 instance_segmentation_loss_cls: 0.0310 instance_segmentation_loss_reg: 0.3322 instance_segmentation_loss_poly: 0.8894 +2024/01/07 06:53:26 - mmengine - INFO - Iter(train) [315500/640000] base_lr: 1.0319e-04 lr: 1.1199e-05 eta: 5 days, 12:44:12 time: 1.4777 data_time: 0.0260 memory: 25719 grad_norm: 2.9196 loss: 1.2928 detection_loss_cls: 0.0334 detection_loss_reg: 0.3385 caption_loss_cls: 2.2391 grounding_loss_reg: 2.6052 semantic_segmentation_loss_cls: 0.0083 instance_segmentation_loss_cls: 0.0310 instance_segmentation_loss_reg: 0.3327 instance_segmentation_loss_poly: 0.8909 +2024/01/07 07:06:05 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240106_135333 +2024/01/07 07:06:05 - mmengine - INFO - Iter(train) [316000/640000] base_lr: 1.0294e-04 lr: 1.1177e-05 eta: 5 days, 12:35:03 time: 1.4763 data_time: 0.0261 memory: 25719 grad_norm: 2.9000 loss: 1.2921 detection_loss_cls: 0.0333 detection_loss_reg: 0.3383 caption_loss_cls: 2.2375 grounding_loss_reg: 2.6071 semantic_segmentation_loss_cls: 0.0083 instance_segmentation_loss_cls: 0.0311 instance_segmentation_loss_reg: 0.3340 instance_segmentation_loss_poly: 0.8932 +2024/01/07 07:06:05 - mmengine - INFO - Saving checkpoint at 316000 iterations +2024/01/07 07:18:58 - mmengine - INFO - Iter(train) [316500/640000] base_lr: 1.0270e-04 lr: 1.1155e-05 eta: 5 days, 12:27:35 time: 1.4905 data_time: 0.0264 memory: 25719 grad_norm: 2.8488 loss: 1.2892 detection_loss_cls: 0.0333 detection_loss_reg: 0.3376 caption_loss_cls: 2.2384 grounding_loss_reg: 2.6052 semantic_segmentation_loss_cls: 0.0083 instance_segmentation_loss_cls: 0.0311 instance_segmentation_loss_reg: 0.3329 instance_segmentation_loss_poly: 0.8913 +2024/01/07 07:31:38 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240106_135333 +2024/01/07 07:31:38 - mmengine - INFO - Iter(train) [317000/640000] base_lr: 1.0246e-04 lr: 1.1133e-05 eta: 5 days, 12:18:12 time: 1.5015 data_time: 0.0264 memory: 25719 grad_norm: 2.7786 loss: 1.2742 detection_loss_cls: 0.0334 detection_loss_reg: 0.3386 caption_loss_cls: 2.2389 grounding_loss_reg: 2.6042 semantic_segmentation_loss_cls: 0.0083 instance_segmentation_loss_cls: 0.0311 instance_segmentation_loss_reg: 0.3331 instance_segmentation_loss_poly: 0.8912 +2024/01/07 07:43:50 - mmengine - INFO - Iter(train) [317500/640000] base_lr: 1.0222e-04 lr: 1.1110e-05 eta: 5 days, 12:05:15 time: 1.4979 data_time: 0.0264 memory: 25719 grad_norm: 2.7690 loss: 1.2827 detection_loss_cls: 0.0335 detection_loss_reg: 0.3401 caption_loss_cls: 2.2289 grounding_loss_reg: 2.6063 semantic_segmentation_loss_cls: 0.0083 instance_segmentation_loss_cls: 0.0313 instance_segmentation_loss_reg: 0.3347 instance_segmentation_loss_poly: 0.8935 +2024/01/07 07:56:07 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240106_135333 +2024/01/07 07:56:07 - mmengine - INFO - Iter(train) [318000/640000] base_lr: 1.0197e-04 lr: 1.1088e-05 eta: 5 days, 11:52:51 time: 1.5025 data_time: 0.0265 memory: 25719 grad_norm: 2.7479 loss: 1.2668 detection_loss_cls: 0.0333 detection_loss_reg: 0.3392 caption_loss_cls: 2.2339 grounding_loss_reg: 2.6068 semantic_segmentation_loss_cls: 0.0083 instance_segmentation_loss_cls: 0.0312 instance_segmentation_loss_reg: 0.3346 instance_segmentation_loss_poly: 0.8918 +2024/01/07 07:56:07 - mmengine - INFO - Saving checkpoint at 318000 iterations +2024/01/07 08:08:56 - mmengine - INFO - Iter(train) [318500/640000] base_lr: 1.0173e-04 lr: 1.1066e-05 eta: 5 days, 11:44:35 time: 1.4985 data_time: 0.0266 memory: 25719 grad_norm: 2.7821 loss: 1.2694 detection_loss_cls: 0.0333 detection_loss_reg: 0.3396 caption_loss_cls: 2.2324 grounding_loss_reg: 2.6050 semantic_segmentation_loss_cls: 0.0083 instance_segmentation_loss_cls: 0.0312 instance_segmentation_loss_reg: 0.3348 instance_segmentation_loss_poly: 0.8920 +2024/01/07 08:21:06 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240106_135333 +2024/01/07 08:21:06 - mmengine - INFO - Iter(train) [319000/640000] base_lr: 1.0149e-04 lr: 1.1044e-05 eta: 5 days, 11:31:20 time: 1.4985 data_time: 0.0266 memory: 25719 grad_norm: 2.7623 loss: 1.2637 detection_loss_cls: 0.0333 detection_loss_reg: 0.3395 caption_loss_cls: 2.2304 grounding_loss_reg: 2.6030 semantic_segmentation_loss_cls: 0.0083 instance_segmentation_loss_cls: 0.0312 instance_segmentation_loss_reg: 0.3348 instance_segmentation_loss_poly: 0.8923 +2024/01/07 08:33:43 - mmengine - INFO - Iter(train) [319500/640000] base_lr: 1.0124e-04 lr: 1.1022e-05 eta: 5 days, 11:21:21 time: 1.5038 data_time: 0.0267 memory: 25719 grad_norm: 2.7693 loss: 1.2681 detection_loss_cls: 0.0333 detection_loss_reg: 0.3403 caption_loss_cls: 2.2244 grounding_loss_reg: 2.5995 semantic_segmentation_loss_cls: 0.0083 instance_segmentation_loss_cls: 0.0310 instance_segmentation_loss_reg: 0.3338 instance_segmentation_loss_poly: 0.8903 +2024/01/07 08:45:27 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240106_135333 +2024/01/07 08:45:27 - mmengine - INFO - Iter(train) [320000/640000] base_lr: 1.0100e-04 lr: 1.1000e-05 eta: 5 days, 11:04:55 time: 1.4898 data_time: 0.0265 memory: 25719 grad_norm: 2.8484 loss: 1.2832 detection_loss_cls: 0.0333 detection_loss_reg: 0.3405 caption_loss_cls: 2.2233 grounding_loss_reg: 2.6015 semantic_segmentation_loss_cls: 0.0083 instance_segmentation_loss_cls: 0.0311 instance_segmentation_loss_reg: 0.3341 instance_segmentation_loss_poly: 0.8923 +2024/01/07 08:45:27 - mmengine - INFO - Saving checkpoint at 320000 iterations +2024/01/07 08:57:59 - mmengine - INFO - Evaluating bbox... +2024/01/07 08:58:56 - mmengine - INFO - bbox_mAP_copypaste: 0.488 0.668 0.532 0.334 0.538 0.624 +2024/01/07 08:58:56 - mmengine - INFO - Evaluating segm... +2024/01/07 09:00:09 - mmengine - INFO - segm_mAP_copypaste: 0.320 0.579 0.308 0.178 0.368 0.490 +2024/01/07 09:07:17 - mmengine - INFO - per class results: +2024/01/07 09:07:17 - mmengine - INFO - ++---------------------+-------+-------+ +| Class | IoU | Acc | ++---------------------+-------+-------+ +| wall | 77.86 | 89.49 | +| building | 82.13 | 90.85 | +| sky | 93.48 | 96.54 | +| floor | 83.22 | 90.71 | +| tree | 73.06 | 91.66 | +| ceiling | 85.07 | 92.21 | +| road | 82.49 | 88.88 | +| bed | 88.81 | 94.83 | +| windowpane | 62.1 | 75.56 | +| grass | 66.58 | 79.57 | +| cabinet | 60.56 | 73.13 | +| sidewalk | 64.58 | 79.88 | +| person | 80.58 | 92.64 | +| earth | 38.82 | 51.59 | +| door | 50.84 | 60.76 | +| table | 62.82 | 78.56 | +| mountain | 59.78 | 78.38 | +| plant | 50.73 | 60.56 | +| curtain | 71.22 | 88.33 | +| chair | 57.8 | 67.13 | +| car | 84.52 | 93.12 | +| water | 56.33 | 72.74 | +| painting | 71.73 | 87.41 | +| sofa | 70.36 | 85.07 | +| shelf | 45.67 | 77.35 | +| house | 47.36 | 60.23 | +| sea | 53.78 | 65.54 | +| mirror | 66.42 | 75.54 | +| rug | 73.83 | 83.37 | +| field | 31.32 | 51.14 | +| armchair | 45.59 | 63.23 | +| seat | 61.71 | 83.76 | +| fence | 45.33 | 70.69 | +| desk | 48.81 | 67.93 | +| rock | 36.54 | 51.51 | +| wardrobe | 44.61 | 68.17 | +| lamp | 60.44 | 75.67 | +| bathtub | 79.94 | 83.55 | +| railing | 37.07 | 51.66 | +| cushion | 59.63 | 71.95 | +| base | 23.43 | 38.39 | +| box | 23.2 | 27.81 | +| column | 43.15 | 48.21 | +| signboard | 36.34 | 53.69 | +| chest of drawers | 40.75 | 62.52 | +| counter | 27.54 | 39.31 | +| sand | 45.04 | 62.54 | +| sink | 71.96 | 84.01 | +| skyscraper | 47.7 | 58.93 | +| fireplace | 77.74 | 84.7 | +| refrigerator | 73.3 | 77.69 | +| grandstand | 43.26 | 73.01 | +| path | 18.98 | 29.8 | +| stairs | 28.71 | 32.68 | +| runway | 78.45 | 83.99 | +| case | 59.01 | 69.12 | +| pool table | 90.58 | 95.14 | +| pillow | 61.09 | 77.51 | +| screen door | 79.2 | 80.69 | +| stairway | 31.53 | 44.33 | +| river | 8.15 | 17.84 | +| bridge | 58.23 | 72.89 | +| bookcase | 38.57 | 56.97 | +| blind | 32.79 | 37.23 | +| coffee table | 66.13 | 76.13 | +| toilet | 86.95 | 90.2 | +| flower | 40.31 | 65.85 | +| book | 47.33 | 64.17 | +| hill | 13.61 | 26.42 | +| bench | 55.63 | 64.5 | +| countertop | 57.85 | 73.18 | +| stove | 76.24 | 80.47 | +| palm | 48.39 | 72.18 | +| kitchen island | 42.41 | 92.66 | +| computer | 72.19 | 84.62 | +| swivel chair | 48.18 | 70.84 | +| boat | 64.0 | 70.1 | +| bar | 40.4 | 54.08 | +| arcade machine | 68.45 | 76.68 | +| hovel | 47.09 | 53.25 | +| bus | 92.38 | 94.81 | +| towel | 64.18 | 83.93 | +| light | 51.35 | 62.15 | +| truck | 41.55 | 57.68 | +| tower | 24.83 | 49.74 | +| chandelier | 61.2 | 71.99 | +| awning | 30.23 | 33.15 | +| streetlight | 31.32 | 44.91 | +| booth | 61.25 | 69.69 | +| television receiver | 70.26 | 79.42 | +| airplane | 59.29 | 69.49 | +| dirt track | 6.66 | 24.45 | +| apparel | 33.77 | 43.72 | +| pole | 25.49 | 35.83 | +| land | 2.85 | 4.14 | +| bannister | 16.68 | 23.21 | +| escalator | 7.69 | 7.72 | +| ottoman | 50.56 | 71.97 | +| bottle | 17.62 | 19.85 | +| buffet | 35.69 | 41.48 | +| poster | 32.84 | 41.09 | +| stage | 5.75 | 8.07 | +| van | 43.2 | 55.18 | +| ship | 7.68 | 8.81 | +| fountain | 13.0 | 13.15 | +| conveyer belt | 68.68 | 91.48 | +| canopy | 11.14 | 13.77 | +| washer | 71.4 | 76.88 | +| plaything | 40.71 | 49.86 | +| swimming pool | 52.68 | 77.91 | +| stool | 45.0 | 62.46 | +| barrel | 54.39 | 61.78 | +| basket | 29.08 | 38.94 | +| waterfall | 47.6 | 70.54 | +| tent | 93.84 | 96.16 | +| bag | 17.08 | 19.66 | +| minibike | 70.27 | 88.54 | +| cradle | 79.85 | 92.37 | +| oven | 49.26 | 57.65 | +| ball | 44.3 | 71.17 | +| food | 45.77 | 51.0 | +| step | 12.13 | 18.01 | +| tank | 34.11 | 47.57 | +| trade name | 28.33 | 38.38 | +| microwave | 80.88 | 87.89 | +| pot | 50.35 | 58.67 | +| animal | 53.38 | 55.82 | +| bicycle | 57.09 | 75.63 | +| lake | 50.49 | 65.79 | +| dishwasher | 53.23 | 64.24 | +| screen | 62.44 | 76.85 | +| blanket | 20.7 | 23.66 | +| sculpture | 55.62 | 77.04 | +| hood | 54.22 | 67.65 | +| sconce | 42.8 | 52.53 | +| vase | 42.85 | 54.14 | +| traffic light | 39.37 | 66.1 | +| tray | 6.03 | 9.59 | +| ashcan | 40.11 | 55.11 | +| fan | 60.46 | 70.95 | +| pier | 39.18 | 68.28 | +| crt screen | 12.18 | 22.41 | +| plate | 55.27 | 69.65 | +| monitor | 31.73 | 40.33 | +| bulletin board | 16.14 | 18.01 | +| shower | 5.55 | 7.18 | +| radiator | 34.36 | 35.89 | +| glass | 18.71 | 20.68 | +| clock | 26.06 | 35.29 | +| flag | 33.41 | 38.41 | ++---------------------+-------+-------+ +2024/01/07 09:07:34 - mmengine - INFO - Iter(val) [209/209] coco/bbox_mAP: 0.4880 coco/bbox_mAP_50: 0.6680 coco/bbox_mAP_75: 0.5320 coco/bbox_mAP_s: 0.3340 coco/bbox_mAP_m: 0.5380 coco/bbox_mAP_l: 0.6240 coco/segm_mAP: 0.3200 coco/segm_mAP_50: 0.5790 coco/segm_mAP_75: 0.3080 coco/segm_mAP_s: 0.1780 coco/segm_mAP_m: 0.3680 coco/segm_mAP_l: 0.4900 Bleu_1: 0.7465 Bleu_2: 0.5795 Bleu_3: 0.4345 Bleu_4: 0.3242 METEOR: 0.2613 ROUGE_L: 0.5474 CIDEr: 1.0395 SPICE: 0.1968 aAcc: 83.1300 mIoU: 49.0200 mAcc: 60.9500 visual-grounding/miou: 0.7998 visual-grounding/acc: 0.8698 data_time: 0.0043 time: 1.3425 +2024/01/07 09:20:56 - mmengine - INFO - Iter(train) [320500/640000] base_lr: 1.0076e-04 lr: 1.0978e-05 eta: 5 days, 11:00:40 time: 1.4978 data_time: 0.0230 memory: 25719 grad_norm: 2.8119 loss: 1.2773 detection_loss_cls: 0.0333 detection_loss_reg: 0.3401 caption_loss_cls: 2.2246 grounding_loss_reg: 2.6008 semantic_segmentation_loss_cls: 0.0083 instance_segmentation_loss_cls: 0.0312 instance_segmentation_loss_reg: 0.3343 instance_segmentation_loss_poly: 0.8924 +2024/01/07 09:33:51 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240106_135333 +2024/01/07 09:33:51 - mmengine - INFO - Iter(train) [321000/640000] base_lr: 1.0051e-04 lr: 1.0956e-05 eta: 5 days, 10:52:41 time: 1.5017 data_time: 0.0232 memory: 25719 grad_norm: 2.8169 loss: 1.2831 detection_loss_cls: 0.0333 detection_loss_reg: 0.3407 caption_loss_cls: 2.2218 grounding_loss_reg: 2.5987 semantic_segmentation_loss_cls: 0.0083 instance_segmentation_loss_cls: 0.0313 instance_segmentation_loss_reg: 0.3347 instance_segmentation_loss_poly: 0.8937 +2024/01/07 09:46:06 - mmengine - INFO - Iter(train) [321500/640000] base_lr: 1.0027e-04 lr: 1.0934e-05 eta: 5 days, 10:39:57 time: 1.5023 data_time: 0.0230 memory: 25719 grad_norm: 2.8229 loss: 1.2723 detection_loss_cls: 0.0332 detection_loss_reg: 0.3402 caption_loss_cls: 2.2253 grounding_loss_reg: 2.5987 semantic_segmentation_loss_cls: 0.0083 instance_segmentation_loss_cls: 0.0313 instance_segmentation_loss_reg: 0.3340 instance_segmentation_loss_poly: 0.8914 +2024/01/07 09:58:29 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240106_135333 +2024/01/07 09:58:29 - mmengine - INFO - Iter(train) [322000/640000] base_lr: 1.0003e-04 lr: 1.0912e-05 eta: 5 days, 10:28:11 time: 1.5040 data_time: 0.0230 memory: 25719 grad_norm: 2.8151 loss: 1.2686 detection_loss_cls: 0.0333 detection_loss_reg: 0.3402 caption_loss_cls: 2.2254 grounding_loss_reg: 2.5937 semantic_segmentation_loss_cls: 0.0083 instance_segmentation_loss_cls: 0.0312 instance_segmentation_loss_reg: 0.3329 instance_segmentation_loss_poly: 0.8887 +2024/01/07 09:58:29 - mmengine - INFO - Saving checkpoint at 322000 iterations +2024/01/07 10:10:44 - mmengine - INFO - Iter(train) [322500/640000] base_lr: 9.9786e-05 lr: 1.0890e-05 eta: 5 days, 10:15:24 time: 1.4953 data_time: 0.0227 memory: 25719 grad_norm: 2.8186 loss: 1.2793 detection_loss_cls: 0.0332 detection_loss_reg: 0.3395 caption_loss_cls: 2.2246 grounding_loss_reg: 2.5926 semantic_segmentation_loss_cls: 0.0083 instance_segmentation_loss_cls: 0.0313 instance_segmentation_loss_reg: 0.3334 instance_segmentation_loss_poly: 0.8901 +2024/01/07 10:23:29 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240106_135333 +2024/01/07 10:23:29 - mmengine - INFO - Iter(train) [323000/640000] base_lr: 9.9543e-05 lr: 1.0868e-05 eta: 5 days, 10:06:00 time: 1.5039 data_time: 0.0227 memory: 25719 grad_norm: 2.7654 loss: 1.2680 detection_loss_cls: 0.0331 detection_loss_reg: 0.3387 caption_loss_cls: 2.2271 grounding_loss_reg: 2.5917 semantic_segmentation_loss_cls: 0.0083 instance_segmentation_loss_cls: 0.0311 instance_segmentation_loss_reg: 0.3314 instance_segmentation_loss_poly: 0.8855 +2024/01/07 10:35:18 - mmengine - INFO - Iter(train) [323500/640000] base_lr: 9.9300e-05 lr: 1.0845e-05 eta: 5 days, 9:50:23 time: 1.4921 data_time: 0.0224 memory: 25719 grad_norm: 2.7843 loss: 1.2701 detection_loss_cls: 0.0330 detection_loss_reg: 0.3382 caption_loss_cls: 2.2280 grounding_loss_reg: 2.5871 semantic_segmentation_loss_cls: 0.0083 instance_segmentation_loss_cls: 0.0311 instance_segmentation_loss_reg: 0.3317 instance_segmentation_loss_poly: 0.8858 +2024/01/07 10:47:22 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240106_135333 +2024/01/07 10:47:22 - mmengine - INFO - Iter(train) [324000/640000] base_lr: 9.9057e-05 lr: 1.0823e-05 eta: 5 days, 9:36:27 time: 1.4971 data_time: 0.0224 memory: 25719 grad_norm: 2.7729 loss: 1.2586 detection_loss_cls: 0.0331 detection_loss_reg: 0.3382 caption_loss_cls: 2.2284 grounding_loss_reg: 2.5884 semantic_segmentation_loss_cls: 0.0083 instance_segmentation_loss_cls: 0.0310 instance_segmentation_loss_reg: 0.3306 instance_segmentation_loss_poly: 0.8833 +2024/01/07 10:47:22 - mmengine - INFO - Saving checkpoint at 324000 iterations +2024/01/07 10:59:51 - mmengine - INFO - Iter(train) [324500/640000] base_lr: 9.8814e-05 lr: 1.0801e-05 eta: 5 days, 9:25:15 time: 1.4831 data_time: 0.0258 memory: 25719 grad_norm: 2.8265 loss: 1.2629 detection_loss_cls: 0.0331 detection_loss_reg: 0.3387 caption_loss_cls: 2.2217 grounding_loss_reg: 2.5850 semantic_segmentation_loss_cls: 0.0083 instance_segmentation_loss_cls: 0.0310 instance_segmentation_loss_reg: 0.3309 instance_segmentation_loss_poly: 0.8837 +2024/01/07 11:12:35 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240106_135333 +2024/01/07 11:12:35 - mmengine - INFO - Iter(train) [325000/640000] base_lr: 9.8571e-05 lr: 1.0779e-05 eta: 5 days, 9:15:44 time: 1.4805 data_time: 0.0257 memory: 25719 grad_norm: 2.8385 loss: 1.2644 detection_loss_cls: 0.0329 detection_loss_reg: 0.3372 caption_loss_cls: 2.2183 grounding_loss_reg: 2.5876 semantic_segmentation_loss_cls: 0.0083 instance_segmentation_loss_cls: 0.0310 instance_segmentation_loss_reg: 0.3313 instance_segmentation_loss_poly: 0.8844 +2024/01/07 11:25:04 - mmengine - INFO - Iter(train) [325500/640000] base_lr: 9.8328e-05 lr: 1.0757e-05 eta: 5 days, 9:04:25 time: 1.4838 data_time: 0.0257 memory: 25719 grad_norm: 2.8180 loss: 1.2623 detection_loss_cls: 0.0329 detection_loss_reg: 0.3376 caption_loss_cls: 2.2187 grounding_loss_reg: 2.5875 semantic_segmentation_loss_cls: 0.0083 instance_segmentation_loss_cls: 0.0310 instance_segmentation_loss_reg: 0.3307 instance_segmentation_loss_poly: 0.8820 +2024/01/07 11:37:23 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240106_135333 +2024/01/07 11:37:23 - mmengine - INFO - Iter(train) [326000/640000] base_lr: 9.8085e-05 lr: 1.0735e-05 eta: 5 days, 8:52:11 time: 1.4829 data_time: 0.0257 memory: 25719 grad_norm: 2.8014 loss: 1.2636 detection_loss_cls: 0.0329 detection_loss_reg: 0.3372 caption_loss_cls: 2.2181 grounding_loss_reg: 2.5867 semantic_segmentation_loss_cls: 0.0083 instance_segmentation_loss_cls: 0.0310 instance_segmentation_loss_reg: 0.3310 instance_segmentation_loss_poly: 0.8823 +2024/01/07 11:37:23 - mmengine - INFO - Saving checkpoint at 326000 iterations +2024/01/07 11:49:56 - mmengine - INFO - Iter(train) [326500/640000] base_lr: 9.7842e-05 lr: 1.0713e-05 eta: 5 days, 8:41:16 time: 1.4874 data_time: 0.0256 memory: 25719 grad_norm: 2.7573 loss: 1.2520 detection_loss_cls: 0.0329 detection_loss_reg: 0.3369 caption_loss_cls: 2.2147 grounding_loss_reg: 2.5867 semantic_segmentation_loss_cls: 0.0082 instance_segmentation_loss_cls: 0.0309 instance_segmentation_loss_reg: 0.3317 instance_segmentation_loss_poly: 0.8833 +2024/01/07 12:02:06 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240106_135333 +2024/01/07 12:02:06 - mmengine - INFO - Iter(train) [327000/640000] base_lr: 9.7599e-05 lr: 1.0691e-05 eta: 5 days, 8:28:01 time: 1.4787 data_time: 0.0256 memory: 25719 grad_norm: 2.7737 loss: 1.2596 detection_loss_cls: 0.0328 detection_loss_reg: 0.3364 caption_loss_cls: 2.2131 grounding_loss_reg: 2.5859 semantic_segmentation_loss_cls: 0.0082 instance_segmentation_loss_cls: 0.0309 instance_segmentation_loss_reg: 0.3315 instance_segmentation_loss_poly: 0.8826 +2024/01/07 12:14:01 - mmengine - INFO - Iter(train) [327500/640000] base_lr: 9.7357e-05 lr: 1.0669e-05 eta: 5 days, 8:13:19 time: 1.4803 data_time: 0.0257 memory: 25719 grad_norm: 2.7913 loss: 1.2576 detection_loss_cls: 0.0328 detection_loss_reg: 0.3365 caption_loss_cls: 2.2074 grounding_loss_reg: 2.5820 semantic_segmentation_loss_cls: 0.0082 instance_segmentation_loss_cls: 0.0310 instance_segmentation_loss_reg: 0.3320 instance_segmentation_loss_poly: 0.8841 +2024/01/07 12:26:07 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240106_135333 +2024/01/07 12:26:07 - mmengine - INFO - Iter(train) [328000/640000] base_lr: 9.7114e-05 lr: 1.0647e-05 eta: 5 days, 7:59:41 time: 1.4807 data_time: 0.0258 memory: 25719 grad_norm: 2.7627 loss: 1.2559 detection_loss_cls: 0.0327 detection_loss_reg: 0.3364 caption_loss_cls: 2.2054 grounding_loss_reg: 2.5799 semantic_segmentation_loss_cls: 0.0082 instance_segmentation_loss_cls: 0.0310 instance_segmentation_loss_reg: 0.3325 instance_segmentation_loss_poly: 0.8855 +2024/01/07 12:26:07 - mmengine - INFO - Saving checkpoint at 328000 iterations +2024/01/07 12:38:55 - mmengine - INFO - Iter(train) [328500/640000] base_lr: 9.6871e-05 lr: 1.0625e-05 eta: 5 days, 7:50:18 time: 1.4856 data_time: 0.0257 memory: 25719 grad_norm: 2.7627 loss: 1.2536 detection_loss_cls: 0.0326 detection_loss_reg: 0.3353 caption_loss_cls: 2.2022 grounding_loss_reg: 2.5784 semantic_segmentation_loss_cls: 0.0081 instance_segmentation_loss_cls: 0.0310 instance_segmentation_loss_reg: 0.3323 instance_segmentation_loss_poly: 0.8849 +2024/01/07 12:51:22 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240106_135333 +2024/01/07 12:51:22 - mmengine - INFO - Iter(train) [329000/640000] base_lr: 9.6628e-05 lr: 1.0603e-05 eta: 5 days, 7:38:42 time: 1.4810 data_time: 0.0255 memory: 25719 grad_norm: 2.7967 loss: 1.2448 detection_loss_cls: 0.0326 detection_loss_reg: 0.3357 caption_loss_cls: 2.1967 grounding_loss_reg: 2.5756 semantic_segmentation_loss_cls: 0.0081 instance_segmentation_loss_cls: 0.0309 instance_segmentation_loss_reg: 0.3319 instance_segmentation_loss_poly: 0.8840 +2024/01/07 13:03:16 - mmengine - INFO - Iter(train) [329500/640000] base_lr: 9.6385e-05 lr: 1.0580e-05 eta: 5 days, 7:24:00 time: 1.4725 data_time: 0.0253 memory: 25719 grad_norm: 2.8018 loss: 1.2399 detection_loss_cls: 0.0326 detection_loss_reg: 0.3368 caption_loss_cls: 2.2002 grounding_loss_reg: 2.5725 semantic_segmentation_loss_cls: 0.0081 instance_segmentation_loss_cls: 0.0308 instance_segmentation_loss_reg: 0.3318 instance_segmentation_loss_poly: 0.8833 +2024/01/07 13:15:38 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240106_135333 +2024/01/07 13:15:38 - mmengine - INFO - Iter(train) [330000/640000] base_lr: 9.6143e-05 lr: 1.0558e-05 eta: 5 days, 7:12:00 time: 1.4731 data_time: 0.0253 memory: 25719 grad_norm: 2.8259 loss: 1.2446 detection_loss_cls: 0.0327 detection_loss_reg: 0.3375 caption_loss_cls: 2.2005 grounding_loss_reg: 2.5708 semantic_segmentation_loss_cls: 0.0081 instance_segmentation_loss_cls: 0.0307 instance_segmentation_loss_reg: 0.3308 instance_segmentation_loss_poly: 0.8824 +2024/01/07 13:15:38 - mmengine - INFO - Saving checkpoint at 330000 iterations +2024/01/07 14:11:28 - mmengine - INFO - Iter(train) [330500/640000] base_lr: 9.5900e-05 lr: 1.0536e-05 eta: 5 days, 6:05:49 time: 1.4684 data_time: 0.0207 memory: 25718 grad_norm: 2.8491 loss: 1.2487 detection_loss_cls: 0.0326 detection_loss_reg: 0.3380 caption_loss_cls: 2.2000 grounding_loss_reg: 2.5719 semantic_segmentation_loss_cls: 0.0081 instance_segmentation_loss_cls: 0.0307 instance_segmentation_loss_reg: 0.3313 instance_segmentation_loss_poly: 0.8838 +2024/01/07 14:23:55 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240107_135549 +2024/01/07 14:23:55 - mmengine - INFO - Iter(train) [331000/640000] base_lr: 9.5657e-05 lr: 1.0514e-05 eta: 5 days, 6:59:54 time: 1.4725 data_time: 0.0207 memory: 25718 grad_norm: 2.9305 loss: 1.2540 detection_loss_cls: 0.0325 detection_loss_reg: 0.3378 caption_loss_cls: 2.1935 grounding_loss_reg: 2.5679 semantic_segmentation_loss_cls: 0.0081 instance_segmentation_loss_cls: 0.0306 instance_segmentation_loss_reg: 0.3307 instance_segmentation_loss_poly: 0.8828 +2024/01/07 14:36:06 - mmengine - INFO - Iter(train) [331500/640000] base_lr: 9.5415e-05 lr: 1.0492e-05 eta: 5 days, 6:16:11 time: 1.4763 data_time: 0.0205 memory: 25718 grad_norm: 2.9226 loss: 1.2439 detection_loss_cls: 0.0324 detection_loss_reg: 0.3374 caption_loss_cls: 2.1892 grounding_loss_reg: 2.5669 semantic_segmentation_loss_cls: 0.0081 instance_segmentation_loss_cls: 0.0305 instance_segmentation_loss_reg: 0.3308 instance_segmentation_loss_poly: 0.8828 +2024/01/07 14:48:12 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240107_135549 +2024/01/07 14:48:12 - mmengine - INFO - Iter(train) [332000/640000] base_lr: 9.5172e-05 lr: 1.0470e-05 eta: 5 days, 5:36:22 time: 1.4765 data_time: 0.0202 memory: 25718 grad_norm: 2.9361 loss: 1.2477 detection_loss_cls: 0.0323 detection_loss_reg: 0.3387 caption_loss_cls: 2.1874 grounding_loss_reg: 2.5631 semantic_segmentation_loss_cls: 0.0081 instance_segmentation_loss_cls: 0.0305 instance_segmentation_loss_reg: 0.3318 instance_segmentation_loss_poly: 0.8854 +2024/01/07 14:48:12 - mmengine - INFO - Saving checkpoint at 332000 iterations +2024/01/07 15:00:53 - mmengine - INFO - Iter(train) [332500/640000] base_lr: 9.4930e-05 lr: 1.0448e-05 eta: 5 days, 6:17:40 time: 1.4746 data_time: 0.0205 memory: 25718 grad_norm: 2.9432 loss: 1.2599 detection_loss_cls: 0.0322 detection_loss_reg: 0.3387 caption_loss_cls: 2.1903 grounding_loss_reg: 2.5594 semantic_segmentation_loss_cls: 0.0081 instance_segmentation_loss_cls: 0.0303 instance_segmentation_loss_reg: 0.3309 instance_segmentation_loss_poly: 0.8842 +2024/01/07 15:13:00 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240107_135549 +2024/01/07 15:13:00 - mmengine - INFO - Iter(train) [333000/640000] base_lr: 9.4687e-05 lr: 1.0426e-05 eta: 5 days, 5:45:09 time: 1.4699 data_time: 0.0203 memory: 25718 grad_norm: 2.9363 loss: 1.2665 detection_loss_cls: 0.0323 detection_loss_reg: 0.3392 caption_loss_cls: 2.1866 grounding_loss_reg: 2.5599 semantic_segmentation_loss_cls: 0.0081 instance_segmentation_loss_cls: 0.0303 instance_segmentation_loss_reg: 0.3311 instance_segmentation_loss_poly: 0.8853 +2024/01/07 15:24:59 - mmengine - INFO - Iter(train) [333500/640000] base_lr: 9.4445e-05 lr: 1.0404e-05 eta: 5 days, 5:05:50 time: 1.4711 data_time: 0.0203 memory: 25718 grad_norm: 2.9890 loss: 1.2727 detection_loss_cls: 0.0321 detection_loss_reg: 0.3385 caption_loss_cls: 2.1870 grounding_loss_reg: 2.5587 semantic_segmentation_loss_cls: 0.0081 instance_segmentation_loss_cls: 0.0302 instance_segmentation_loss_reg: 0.3299 instance_segmentation_loss_poly: 0.8828 +2024/01/07 15:37:29 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240107_135549 +2024/01/07 15:37:29 - mmengine - INFO - Iter(train) [334000/640000] base_lr: 9.4202e-05 lr: 1.0382e-05 eta: 5 days, 5:12:54 time: 1.4731 data_time: 0.0201 memory: 25718 grad_norm: 2.9897 loss: 1.2568 detection_loss_cls: 0.0320 detection_loss_reg: 0.3366 caption_loss_cls: 2.1796 grounding_loss_reg: 2.5545 semantic_segmentation_loss_cls: 0.0081 instance_segmentation_loss_cls: 0.0300 instance_segmentation_loss_reg: 0.3285 instance_segmentation_loss_poly: 0.8806 +2024/01/07 15:37:29 - mmengine - INFO - Saving checkpoint at 334000 iterations +2024/01/07 15:49:17 - mmengine - INFO - Iter(train) [334500/640000] base_lr: 9.3960e-05 lr: 1.0360e-05 eta: 5 days, 4:27:15 time: 1.4665 data_time: 0.0246 memory: 25718 grad_norm: 3.0266 loss: 1.2701 detection_loss_cls: 0.0321 detection_loss_reg: 0.3381 caption_loss_cls: 2.1766 grounding_loss_reg: 2.5533 semantic_segmentation_loss_cls: 0.0081 instance_segmentation_loss_cls: 0.0301 instance_segmentation_loss_reg: 0.3303 instance_segmentation_loss_poly: 0.8849 +2024/01/07 16:02:00 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240107_135549 +2024/01/07 16:02:00 - mmengine - INFO - Iter(train) [335000/640000] base_lr: 9.3718e-05 lr: 1.0338e-05 eta: 5 days, 4:45:27 time: 1.4708 data_time: 0.0246 memory: 25718 grad_norm: 2.9263 loss: 1.2591 detection_loss_cls: 0.0320 detection_loss_reg: 0.3367 caption_loss_cls: 2.1747 grounding_loss_reg: 2.5500 semantic_segmentation_loss_cls: 0.0081 instance_segmentation_loss_cls: 0.0300 instance_segmentation_loss_reg: 0.3297 instance_segmentation_loss_poly: 0.8842 +2024/01/07 16:14:16 - mmengine - INFO - Iter(train) [335500/640000] base_lr: 9.3475e-05 lr: 1.0316e-05 eta: 5 days, 4:32:00 time: 1.4719 data_time: 0.0247 memory: 25718 grad_norm: 2.9254 loss: 1.2622 detection_loss_cls: 0.0320 detection_loss_reg: 0.3378 caption_loss_cls: 2.1710 grounding_loss_reg: 2.5453 semantic_segmentation_loss_cls: 0.0080 instance_segmentation_loss_cls: 0.0298 instance_segmentation_loss_reg: 0.3287 instance_segmentation_loss_poly: 0.8824 +2024/01/07 16:26:34 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240107_135549 +2024/01/07 16:26:34 - mmengine - INFO - Iter(train) [336000/640000] base_lr: 9.3233e-05 lr: 1.0294e-05 eta: 5 days, 4:21:25 time: 1.4749 data_time: 0.0248 memory: 25718 grad_norm: 2.9378 loss: 1.2636 detection_loss_cls: 0.0318 detection_loss_reg: 0.3368 caption_loss_cls: 2.1721 grounding_loss_reg: 2.5395 semantic_segmentation_loss_cls: 0.0080 instance_segmentation_loss_cls: 0.0297 instance_segmentation_loss_reg: 0.3282 instance_segmentation_loss_poly: 0.8819 +2024/01/07 16:26:34 - mmengine - INFO - Saving checkpoint at 336000 iterations +2024/01/07 16:38:33 - mmengine - INFO - Iter(train) [336500/640000] base_lr: 9.2991e-05 lr: 1.0272e-05 eta: 5 days, 3:55:31 time: 1.4646 data_time: 0.0243 memory: 25718 grad_norm: 2.9584 loss: 1.2612 detection_loss_cls: 0.0319 detection_loss_reg: 0.3374 caption_loss_cls: 2.1736 grounding_loss_reg: 2.5380 semantic_segmentation_loss_cls: 0.0081 instance_segmentation_loss_cls: 0.0296 instance_segmentation_loss_reg: 0.3282 instance_segmentation_loss_poly: 0.8818 +2024/01/07 16:50:38 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240107_135549 +2024/01/07 16:50:38 - mmengine - INFO - Iter(train) [337000/640000] base_lr: 9.2749e-05 lr: 1.0250e-05 eta: 5 days, 3:35:56 time: 1.4639 data_time: 0.0243 memory: 25718 grad_norm: 2.9534 loss: 1.2546 detection_loss_cls: 0.0319 detection_loss_reg: 0.3369 caption_loss_cls: 2.1698 grounding_loss_reg: 2.5336 semantic_segmentation_loss_cls: 0.0080 instance_segmentation_loss_cls: 0.0296 instance_segmentation_loss_reg: 0.3279 instance_segmentation_loss_poly: 0.8807 +2024/01/07 17:03:03 - mmengine - INFO - Iter(train) [337500/640000] base_lr: 9.2507e-05 lr: 1.0228e-05 eta: 5 days, 3:30:10 time: 1.4702 data_time: 0.0245 memory: 25718 grad_norm: 2.9015 loss: 1.2562 detection_loss_cls: 0.0317 detection_loss_reg: 0.3355 caption_loss_cls: 2.1715 grounding_loss_reg: 2.5314 semantic_segmentation_loss_cls: 0.0080 instance_segmentation_loss_cls: 0.0295 instance_segmentation_loss_reg: 0.3275 instance_segmentation_loss_poly: 0.8795 +2024/01/07 17:15:15 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240107_135549 +2024/01/07 17:15:15 - mmengine - INFO - Iter(train) [338000/640000] base_lr: 9.2264e-05 lr: 1.0206e-05 eta: 5 days, 3:16:31 time: 1.4659 data_time: 0.0246 memory: 25718 grad_norm: 2.9173 loss: 1.2716 detection_loss_cls: 0.0316 detection_loss_reg: 0.3350 caption_loss_cls: 2.1680 grounding_loss_reg: 2.5267 semantic_segmentation_loss_cls: 0.0080 instance_segmentation_loss_cls: 0.0295 instance_segmentation_loss_reg: 0.3262 instance_segmentation_loss_poly: 0.8773 +2024/01/07 17:15:15 - mmengine - INFO - Saving checkpoint at 338000 iterations +2024/01/07 17:27:38 - mmengine - INFO - Iter(train) [338500/640000] base_lr: 9.2022e-05 lr: 1.0184e-05 eta: 5 days, 3:08:50 time: 1.4747 data_time: 0.0244 memory: 25718 grad_norm: 2.8684 loss: 1.2446 detection_loss_cls: 0.0315 detection_loss_reg: 0.3340 caption_loss_cls: 2.1676 grounding_loss_reg: 2.5224 semantic_segmentation_loss_cls: 0.0080 instance_segmentation_loss_cls: 0.0293 instance_segmentation_loss_reg: 0.3258 instance_segmentation_loss_poly: 0.8758 +2024/01/07 17:39:48 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240107_135549 +2024/01/07 17:39:48 - mmengine - INFO - Iter(train) [339000/640000] base_lr: 9.1781e-05 lr: 1.0162e-05 eta: 5 days, 2:53:13 time: 1.4662 data_time: 0.0243 memory: 25718 grad_norm: 2.9052 loss: 1.2466 detection_loss_cls: 0.0315 detection_loss_reg: 0.3340 caption_loss_cls: 2.1641 grounding_loss_reg: 2.5195 semantic_segmentation_loss_cls: 0.0081 instance_segmentation_loss_cls: 0.0292 instance_segmentation_loss_reg: 0.3250 instance_segmentation_loss_poly: 0.8739 +2024/01/07 17:52:58 - mmengine - INFO - Iter(train) [339500/640000] base_lr: 9.1539e-05 lr: 1.0140e-05 eta: 5 days, 3:10:02 time: 1.4800 data_time: 0.0244 memory: 25718 grad_norm: 2.8586 loss: 1.2408 detection_loss_cls: 0.0313 detection_loss_reg: 0.3334 caption_loss_cls: 2.1651 grounding_loss_reg: 2.5207 semantic_segmentation_loss_cls: 0.0080 instance_segmentation_loss_cls: 0.0292 instance_segmentation_loss_reg: 0.3245 instance_segmentation_loss_poly: 0.8731 +2024/01/07 18:05:09 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240107_135549 +2024/01/07 18:05:09 - mmengine - INFO - Iter(train) [340000/640000] base_lr: 9.1297e-05 lr: 1.0118e-05 eta: 5 days, 2:54:13 time: 1.4781 data_time: 0.0245 memory: 25718 grad_norm: 2.8529 loss: 1.2367 detection_loss_cls: 0.0313 detection_loss_reg: 0.3336 caption_loss_cls: 2.1612 grounding_loss_reg: 2.5200 semantic_segmentation_loss_cls: 0.0080 instance_segmentation_loss_cls: 0.0291 instance_segmentation_loss_reg: 0.3253 instance_segmentation_loss_poly: 0.8737 +2024/01/07 18:05:09 - mmengine - INFO - Saving checkpoint at 340000 iterations +2024/01/07 18:17:28 - mmengine - INFO - Evaluating bbox... +2024/01/07 18:18:24 - mmengine - INFO - bbox_mAP_copypaste: 0.497 0.674 0.545 0.337 0.549 0.625 +2024/01/07 18:18:24 - mmengine - INFO - Evaluating segm... +2024/01/07 18:19:36 - mmengine - INFO - segm_mAP_copypaste: 0.331 0.586 0.331 0.184 0.377 0.496 +2024/01/07 18:26:54 - mmengine - INFO - per class results: +2024/01/07 18:26:54 - mmengine - INFO - ++---------------------+-------+-------+ +| Class | IoU | Acc | ++---------------------+-------+-------+ +| wall | 78.02 | 87.78 | +| building | 82.91 | 91.96 | +| sky | 93.45 | 97.67 | +| floor | 82.52 | 89.9 | +| tree | 74.08 | 87.07 | +| ceiling | 84.56 | 92.94 | +| road | 82.69 | 90.72 | +| bed | 89.15 | 96.13 | +| windowpane | 62.38 | 82.17 | +| grass | 65.16 | 83.64 | +| cabinet | 59.84 | 69.15 | +| sidewalk | 65.74 | 79.82 | +| person | 81.53 | 91.61 | +| earth | 35.88 | 45.48 | +| door | 55.41 | 68.1 | +| table | 63.56 | 76.02 | +| mountain | 62.15 | 76.43 | +| plant | 52.45 | 65.59 | +| curtain | 75.89 | 87.24 | +| chair | 59.31 | 71.5 | +| car | 84.79 | 92.2 | +| water | 56.94 | 70.9 | +| painting | 69.87 | 87.44 | +| sofa | 69.64 | 81.94 | +| shelf | 47.16 | 69.44 | +| house | 42.66 | 57.62 | +| sea | 59.19 | 75.98 | +| mirror | 67.86 | 74.75 | +| rug | 71.32 | 79.34 | +| field | 26.61 | 39.39 | +| armchair | 48.05 | 69.99 | +| seat | 63.05 | 84.94 | +| fence | 47.46 | 67.87 | +| desk | 47.26 | 73.91 | +| rock | 46.07 | 65.69 | +| wardrobe | 46.83 | 67.39 | +| lamp | 60.43 | 77.02 | +| bathtub | 79.54 | 87.13 | +| railing | 39.57 | 62.86 | +| cushion | 59.08 | 72.85 | +| base | 27.44 | 42.69 | +| box | 28.56 | 41.88 | +| column | 49.69 | 65.0 | +| signboard | 38.72 | 56.22 | +| chest of drawers | 37.39 | 62.21 | +| counter | 33.07 | 51.42 | +| sand | 43.96 | 56.15 | +| sink | 72.88 | 80.81 | +| skyscraper | 62.37 | 81.38 | +| fireplace | 70.27 | 92.46 | +| refrigerator | 73.18 | 78.67 | +| grandstand | 43.41 | 70.33 | +| path | 20.2 | 33.33 | +| stairs | 24.87 | 33.99 | +| runway | 72.4 | 91.96 | +| case | 53.21 | 66.57 | +| pool table | 90.34 | 97.19 | +| pillow | 61.29 | 74.63 | +| screen door | 79.21 | 84.53 | +| stairway | 34.88 | 46.42 | +| river | 13.54 | 29.94 | +| bridge | 72.62 | 87.72 | +| bookcase | 39.65 | 60.49 | +| blind | 41.06 | 44.83 | +| coffee table | 65.88 | 83.28 | +| toilet | 86.19 | 90.1 | +| flower | 39.52 | 54.38 | +| book | 49.61 | 67.18 | +| hill | 15.02 | 28.5 | +| bench | 55.8 | 71.85 | +| countertop | 52.99 | 65.78 | +| stove | 79.1 | 88.52 | +| palm | 45.45 | 65.87 | +| kitchen island | 40.78 | 83.58 | +| computer | 71.69 | 84.3 | +| swivel chair | 40.47 | 56.51 | +| boat | 59.25 | 68.56 | +| bar | 53.59 | 66.52 | +| arcade machine | 52.15 | 56.13 | +| hovel | 21.94 | 23.85 | +| bus | 91.48 | 94.96 | +| towel | 58.92 | 70.26 | +| light | 51.74 | 63.57 | +| truck | 41.95 | 54.95 | +| tower | 29.71 | 52.04 | +| chandelier | 61.01 | 77.62 | +| awning | 33.27 | 40.38 | +| streetlight | 30.24 | 39.53 | +| booth | 35.83 | 40.62 | +| television receiver | 72.27 | 85.62 | +| airplane | 59.46 | 71.33 | +| dirt track | 9.5 | 30.13 | +| apparel | 35.42 | 54.82 | +| pole | 25.74 | 36.76 | +| land | 2.63 | 6.59 | +| bannister | 14.6 | 18.43 | +| escalator | 11.17 | 11.54 | +| ottoman | 47.63 | 67.12 | +| bottle | 21.06 | 26.02 | +| buffet | 57.73 | 84.4 | +| poster | 29.12 | 35.9 | +| stage | 14.04 | 23.39 | +| van | 43.67 | 55.97 | +| ship | 5.54 | 6.87 | +| fountain | 23.47 | 24.0 | +| conveyer belt | 66.07 | 92.19 | +| canopy | 29.38 | 48.85 | +| washer | 67.25 | 69.2 | +| plaything | 30.41 | 42.45 | +| swimming pool | 52.34 | 68.62 | +| stool | 47.11 | 60.21 | +| barrel | 18.69 | 63.68 | +| basket | 33.5 | 47.88 | +| waterfall | 58.08 | 87.44 | +| tent | 92.47 | 97.09 | +| bag | 19.66 | 26.7 | +| minibike | 72.57 | 79.53 | +| cradle | 76.49 | 96.64 | +| oven | 48.52 | 62.77 | +| ball | 54.66 | 78.22 | +| food | 58.89 | 70.18 | +| step | 4.43 | 4.7 | +| tank | 38.21 | 41.43 | +| trade name | 25.36 | 30.2 | +| microwave | 82.26 | 89.89 | +| pot | 52.89 | 63.73 | +| animal | 61.28 | 65.62 | +| bicycle | 57.71 | 70.81 | +| lake | 54.45 | 65.96 | +| dishwasher | 44.96 | 51.46 | +| screen | 51.68 | 71.14 | +| blanket | 11.02 | 12.63 | +| sculpture | 51.33 | 73.98 | +| hood | 56.84 | 72.27 | +| sconce | 43.03 | 56.13 | +| vase | 41.58 | 56.26 | +| traffic light | 40.01 | 63.8 | +| tray | 7.61 | 10.08 | +| ashcan | 45.44 | 57.42 | +| fan | 58.2 | 72.78 | +| pier | 36.26 | 43.54 | +| crt screen | 13.6 | 37.5 | +| plate | 55.67 | 73.31 | +| monitor | 17.22 | 25.82 | +| bulletin board | 18.64 | 20.56 | +| shower | 3.09 | 6.07 | +| radiator | 53.07 | 57.83 | +| glass | 18.72 | 19.92 | +| clock | 24.63 | 30.66 | +| flag | 27.34 | 31.81 | ++---------------------+-------+-------+ +2024/01/07 18:27:13 - mmengine - INFO - Iter(val) [209/209] coco/bbox_mAP: 0.4970 coco/bbox_mAP_50: 0.6740 coco/bbox_mAP_75: 0.5450 coco/bbox_mAP_s: 0.3370 coco/bbox_mAP_m: 0.5490 coco/bbox_mAP_l: 0.6250 coco/segm_mAP: 0.3310 coco/segm_mAP_50: 0.5860 coco/segm_mAP_75: 0.3310 coco/segm_mAP_s: 0.1840 coco/segm_mAP_m: 0.3770 coco/segm_mAP_l: 0.4960 Bleu_1: 0.7450 Bleu_2: 0.5749 Bleu_3: 0.4323 Bleu_4: 0.3222 METEOR: 0.2644 ROUGE_L: 0.5477 CIDEr: 1.0509 SPICE: 0.1979 aAcc: 83.3900 mIoU: 49.2200 mAcc: 62.1100 visual-grounding/miou: 0.7996 visual-grounding/acc: 0.8697 data_time: 0.0099 time: 1.3605 +2024/01/07 18:39:53 - mmengine - INFO - Iter(train) [340500/640000] base_lr: 9.1055e-05 lr: 1.0096e-05 eta: 5 days, 2:53:47 time: 1.4890 data_time: 0.0210 memory: 25719 grad_norm: 2.8120 loss: 1.2153 detection_loss_cls: 0.0312 detection_loss_reg: 0.3327 caption_loss_cls: 2.1609 grounding_loss_reg: 2.5174 semantic_segmentation_loss_cls: 0.0080 instance_segmentation_loss_cls: 0.0290 instance_segmentation_loss_reg: 0.3243 instance_segmentation_loss_poly: 0.8720 +2024/01/07 18:52:29 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240107_135549 +2024/01/07 18:52:29 - mmengine - INFO - Iter(train) [341000/640000] base_lr: 9.0813e-05 lr: 1.0074e-05 eta: 5 days, 2:49:23 time: 1.4968 data_time: 0.0214 memory: 25719 grad_norm: 2.7941 loss: 1.2096 detection_loss_cls: 0.0312 detection_loss_reg: 0.3324 caption_loss_cls: 2.1584 grounding_loss_reg: 2.5151 semantic_segmentation_loss_cls: 0.0080 instance_segmentation_loss_cls: 0.0290 instance_segmentation_loss_reg: 0.3247 instance_segmentation_loss_poly: 0.8730 +2024/01/07 19:04:34 - mmengine - INFO - Iter(train) [341500/640000] base_lr: 9.0572e-05 lr: 1.0052e-05 eta: 5 days, 2:30:43 time: 1.4921 data_time: 0.0214 memory: 25719 grad_norm: 2.8751 loss: 1.2106 detection_loss_cls: 0.0313 detection_loss_reg: 0.3330 caption_loss_cls: 2.1617 grounding_loss_reg: 2.5131 semantic_segmentation_loss_cls: 0.0080 instance_segmentation_loss_cls: 0.0289 instance_segmentation_loss_reg: 0.3242 instance_segmentation_loss_poly: 0.8718 +2024/01/07 19:15:48 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240107_135549 +2024/01/07 19:15:48 - mmengine - INFO - Iter(train) [342000/640000] base_lr: 9.0330e-05 lr: 1.0030e-05 eta: 5 days, 1:51:24 time: 1.4773 data_time: 0.0214 memory: 25719 grad_norm: 2.9018 loss: 1.2108 detection_loss_cls: 0.0312 detection_loss_reg: 0.3329 caption_loss_cls: 2.1569 grounding_loss_reg: 2.5137 semantic_segmentation_loss_cls: 0.0080 instance_segmentation_loss_cls: 0.0290 instance_segmentation_loss_reg: 0.3251 instance_segmentation_loss_poly: 0.8740 +2024/01/07 19:15:48 - mmengine - INFO - Saving checkpoint at 342000 iterations +2024/01/07 19:28:23 - mmengine - INFO - Iter(train) [342500/640000] base_lr: 9.0088e-05 lr: 1.0008e-05 eta: 5 days, 1:46:28 time: 1.4803 data_time: 0.0225 memory: 25719 grad_norm: 2.9372 loss: 1.2274 detection_loss_cls: 0.0313 detection_loss_reg: 0.3336 caption_loss_cls: 2.1575 grounding_loss_reg: 2.5134 semantic_segmentation_loss_cls: 0.0080 instance_segmentation_loss_cls: 0.0289 instance_segmentation_loss_reg: 0.3252 instance_segmentation_loss_poly: 0.8732 +2024/01/07 19:39:49 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240107_135549 +2024/01/07 19:39:49 - mmengine - INFO - Iter(train) [343000/640000] base_lr: 8.9847e-05 lr: 9.9861e-06 eta: 5 days, 1:14:48 time: 1.4695 data_time: 0.0226 memory: 25719 grad_norm: 2.9622 loss: 1.2375 detection_loss_cls: 0.0314 detection_loss_reg: 0.3343 caption_loss_cls: 2.1564 grounding_loss_reg: 2.5107 semantic_segmentation_loss_cls: 0.0080 instance_segmentation_loss_cls: 0.0290 instance_segmentation_loss_reg: 0.3256 instance_segmentation_loss_poly: 0.8740 +2024/01/07 19:51:48 - mmengine - INFO - Iter(train) [343500/640000] base_lr: 8.9606e-05 lr: 9.9641e-06 eta: 5 days, 0:56:44 time: 1.4517 data_time: 0.0228 memory: 25719 grad_norm: 3.0051 loss: 1.2521 detection_loss_cls: 0.0313 detection_loss_reg: 0.3336 caption_loss_cls: 2.1502 grounding_loss_reg: 2.5149 semantic_segmentation_loss_cls: 0.0080 instance_segmentation_loss_cls: 0.0289 instance_segmentation_loss_reg: 0.3259 instance_segmentation_loss_poly: 0.8747 +2024/01/07 20:04:15 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240107_135549 +2024/01/07 20:04:15 - mmengine - INFO - Iter(train) [344000/640000] base_lr: 8.9364e-05 lr: 9.9422e-06 eta: 5 days, 0:48:40 time: 1.4555 data_time: 0.0231 memory: 25719 grad_norm: 2.9952 loss: 1.2578 detection_loss_cls: 0.0314 detection_loss_reg: 0.3345 caption_loss_cls: 2.1545 grounding_loss_reg: 2.5155 semantic_segmentation_loss_cls: 0.0080 instance_segmentation_loss_cls: 0.0290 instance_segmentation_loss_reg: 0.3268 instance_segmentation_loss_poly: 0.8768 +2024/01/07 20:04:15 - mmengine - INFO - Saving checkpoint at 344000 iterations +2024/01/07 20:16:23 - mmengine - INFO - Iter(train) [344500/640000] base_lr: 8.9123e-05 lr: 9.9203e-06 eta: 5 days, 0:34:08 time: 1.4469 data_time: 0.0270 memory: 25719 grad_norm: 3.0392 loss: 1.2761 detection_loss_cls: 0.0313 detection_loss_reg: 0.3335 caption_loss_cls: 2.1549 grounding_loss_reg: 2.5138 semantic_segmentation_loss_cls: 0.0080 instance_segmentation_loss_cls: 0.0290 instance_segmentation_loss_reg: 0.3265 instance_segmentation_loss_poly: 0.8757 +2024/01/07 20:28:19 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240107_135549 +2024/01/07 20:28:19 - mmengine - INFO - Iter(train) [345000/640000] base_lr: 8.8882e-05 lr: 9.8983e-06 eta: 5 days, 0:15:35 time: 1.4367 data_time: 0.0268 memory: 25719 grad_norm: 3.0503 loss: 1.2863 detection_loss_cls: 0.0312 detection_loss_reg: 0.3326 caption_loss_cls: 2.1523 grounding_loss_reg: 2.5138 semantic_segmentation_loss_cls: 0.0080 instance_segmentation_loss_cls: 0.0290 instance_segmentation_loss_reg: 0.3254 instance_segmentation_loss_poly: 0.8735 +2024/01/07 20:40:26 - mmengine - INFO - Iter(train) [345500/640000] base_lr: 8.8641e-05 lr: 9.8764e-06 eta: 5 days, 0:01:13 time: 1.4373 data_time: 0.0269 memory: 25719 grad_norm: 3.0087 loss: 1.2892 detection_loss_cls: 0.0313 detection_loss_reg: 0.3334 caption_loss_cls: 2.1564 grounding_loss_reg: 2.5133 semantic_segmentation_loss_cls: 0.0079 instance_segmentation_loss_cls: 0.0292 instance_segmentation_loss_reg: 0.3259 instance_segmentation_loss_poly: 0.8735 +2024/01/07 20:52:38 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240107_135549 +2024/01/07 20:52:38 - mmengine - INFO - Iter(train) [346000/640000] base_lr: 8.8400e-05 lr: 9.8545e-06 eta: 4 days, 23:48:33 time: 1.4519 data_time: 0.0270 memory: 25719 grad_norm: 2.9693 loss: 1.2854 detection_loss_cls: 0.0312 detection_loss_reg: 0.3334 caption_loss_cls: 2.1569 grounding_loss_reg: 2.5096 semantic_segmentation_loss_cls: 0.0080 instance_segmentation_loss_cls: 0.0293 instance_segmentation_loss_reg: 0.3268 instance_segmentation_loss_poly: 0.8764 +2024/01/07 20:52:38 - mmengine - INFO - Saving checkpoint at 346000 iterations +2024/01/07 21:04:56 - mmengine - INFO - Iter(train) [346500/640000] base_lr: 8.8159e-05 lr: 9.8326e-06 eta: 4 days, 23:37:20 time: 1.4475 data_time: 0.0265 memory: 25719 grad_norm: 2.9478 loss: 1.2760 detection_loss_cls: 0.0312 detection_loss_reg: 0.3341 caption_loss_cls: 2.1559 grounding_loss_reg: 2.5072 semantic_segmentation_loss_cls: 0.0079 instance_segmentation_loss_cls: 0.0292 instance_segmentation_loss_reg: 0.3258 instance_segmentation_loss_poly: 0.8748 +2024/01/07 21:17:56 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240107_135549 +2024/01/07 21:17:56 - mmengine - INFO - Iter(train) [347000/640000] base_lr: 8.7918e-05 lr: 9.8107e-06 eta: 4 days, 23:38:32 time: 1.4712 data_time: 0.0270 memory: 25719 grad_norm: 2.9070 loss: 1.2694 detection_loss_cls: 0.0314 detection_loss_reg: 0.3354 caption_loss_cls: 2.1527 grounding_loss_reg: 2.5059 semantic_segmentation_loss_cls: 0.0080 instance_segmentation_loss_cls: 0.0293 instance_segmentation_loss_reg: 0.3268 instance_segmentation_loss_poly: 0.8762 +2024/01/07 21:30:14 - mmengine - INFO - Iter(train) [347500/640000] base_lr: 8.7677e-05 lr: 9.7888e-06 eta: 4 days, 23:26:52 time: 1.4757 data_time: 0.0270 memory: 25719 grad_norm: 2.9040 loss: 1.2648 detection_loss_cls: 0.0313 detection_loss_reg: 0.3347 caption_loss_cls: 2.1540 grounding_loss_reg: 2.5037 semantic_segmentation_loss_cls: 0.0080 instance_segmentation_loss_cls: 0.0293 instance_segmentation_loss_reg: 0.3266 instance_segmentation_loss_poly: 0.8755 +2024/01/07 21:42:04 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240107_135549 +2024/01/07 21:42:04 - mmengine - INFO - Iter(train) [348000/640000] base_lr: 8.7436e-05 lr: 9.7669e-06 eta: 4 days, 23:07:54 time: 1.4667 data_time: 0.0267 memory: 25719 grad_norm: 2.9092 loss: 1.2651 detection_loss_cls: 0.0313 detection_loss_reg: 0.3337 caption_loss_cls: 2.1583 grounding_loss_reg: 2.5039 semantic_segmentation_loss_cls: 0.0080 instance_segmentation_loss_cls: 0.0292 instance_segmentation_loss_reg: 0.3258 instance_segmentation_loss_poly: 0.8736 +2024/01/07 21:42:04 - mmengine - INFO - Saving checkpoint at 348000 iterations +2024/01/07 21:54:02 - mmengine - INFO - Iter(train) [348500/640000] base_lr: 8.7196e-05 lr: 9.7451e-06 eta: 4 days, 22:51:19 time: 1.4642 data_time: 0.0268 memory: 25719 grad_norm: 2.9303 loss: 1.2764 detection_loss_cls: 0.0315 detection_loss_reg: 0.3358 caption_loss_cls: 2.1607 grounding_loss_reg: 2.5036 semantic_segmentation_loss_cls: 0.0080 instance_segmentation_loss_cls: 0.0292 instance_segmentation_loss_reg: 0.3259 instance_segmentation_loss_poly: 0.8747 +2024/01/07 22:06:52 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240107_135549 +2024/01/07 22:06:52 - mmengine - INFO - Iter(train) [349000/640000] base_lr: 8.6955e-05 lr: 9.7232e-06 eta: 4 days, 22:48:06 time: 1.4777 data_time: 0.0271 memory: 25719 grad_norm: 2.9358 loss: 1.2690 detection_loss_cls: 0.0316 detection_loss_reg: 0.3363 caption_loss_cls: 2.1545 grounding_loss_reg: 2.5018 semantic_segmentation_loss_cls: 0.0080 instance_segmentation_loss_cls: 0.0294 instance_segmentation_loss_reg: 0.3274 instance_segmentation_loss_poly: 0.8777 +2024/01/07 22:20:05 - mmengine - INFO - Iter(train) [349500/640000] base_lr: 8.6715e-05 lr: 9.7013e-06 eta: 4 days, 22:50:19 time: 1.4942 data_time: 0.0273 memory: 25719 grad_norm: 2.8730 loss: 1.2471 detection_loss_cls: 0.0315 detection_loss_reg: 0.3358 caption_loss_cls: 2.1525 grounding_loss_reg: 2.4992 semantic_segmentation_loss_cls: 0.0080 instance_segmentation_loss_cls: 0.0295 instance_segmentation_loss_reg: 0.3277 instance_segmentation_loss_poly: 0.8789 +2024/01/07 22:32:19 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240107_135549 +2024/01/07 22:32:19 - mmengine - INFO - Iter(train) [350000/640000] base_lr: 8.6474e-05 lr: 9.6795e-06 eta: 4 days, 22:37:14 time: 1.4944 data_time: 0.0274 memory: 25719 grad_norm: 2.8869 loss: 1.2567 detection_loss_cls: 0.0314 detection_loss_reg: 0.3355 caption_loss_cls: 2.1530 grounding_loss_reg: 2.5003 semantic_segmentation_loss_cls: 0.0080 instance_segmentation_loss_cls: 0.0295 instance_segmentation_loss_reg: 0.3279 instance_segmentation_loss_poly: 0.8791 +2024/01/07 22:32:19 - mmengine - INFO - Saving checkpoint at 350000 iterations +2024/01/07 22:45:15 - mmengine - INFO - Iter(train) [350500/640000] base_lr: 8.6234e-05 lr: 9.6576e-06 eta: 4 days, 22:34:25 time: 1.5043 data_time: 0.0277 memory: 25719 grad_norm: 2.8590 loss: 1.2581 detection_loss_cls: 0.0314 detection_loss_reg: 0.3352 caption_loss_cls: 2.1543 grounding_loss_reg: 2.4956 semantic_segmentation_loss_cls: 0.0080 instance_segmentation_loss_cls: 0.0296 instance_segmentation_loss_reg: 0.3290 instance_segmentation_loss_poly: 0.8801 +2024/01/07 22:57:10 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240107_135549 +2024/01/07 22:57:10 - mmengine - INFO - Iter(train) [351000/640000] base_lr: 8.5994e-05 lr: 9.6358e-06 eta: 4 days, 22:16:53 time: 1.4878 data_time: 0.0272 memory: 25719 grad_norm: 3.0195 loss: 1.2592 detection_loss_cls: 0.0314 detection_loss_reg: 0.3342 caption_loss_cls: 2.1554 grounding_loss_reg: 2.4964 semantic_segmentation_loss_cls: 0.0080 instance_segmentation_loss_cls: 0.0295 instance_segmentation_loss_reg: 0.3275 instance_segmentation_loss_poly: 0.8771 +2024/01/07 23:09:42 - mmengine - INFO - Iter(train) [351500/640000] base_lr: 8.5754e-05 lr: 9.6140e-06 eta: 4 days, 22:07:52 time: 1.4914 data_time: 0.0275 memory: 25719 grad_norm: 3.0184 loss: 1.2629 detection_loss_cls: 0.0314 detection_loss_reg: 0.3345 caption_loss_cls: 2.1542 grounding_loss_reg: 2.4986 semantic_segmentation_loss_cls: 0.0080 instance_segmentation_loss_cls: 0.0295 instance_segmentation_loss_reg: 0.3272 instance_segmentation_loss_poly: 0.8772 +2024/01/07 23:22:32 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240107_135549 +2024/01/07 23:22:32 - mmengine - INFO - Iter(train) [352000/640000] base_lr: 8.5513e-05 lr: 9.5921e-06 eta: 4 days, 22:02:49 time: 1.5064 data_time: 0.0277 memory: 25719 grad_norm: 2.9749 loss: 1.2387 detection_loss_cls: 0.0315 detection_loss_reg: 0.3343 caption_loss_cls: 2.1489 grounding_loss_reg: 2.4971 semantic_segmentation_loss_cls: 0.0080 instance_segmentation_loss_cls: 0.0295 instance_segmentation_loss_reg: 0.3269 instance_segmentation_loss_poly: 0.8763 +2024/01/07 23:22:32 - mmengine - INFO - Saving checkpoint at 352000 iterations +2024/01/07 23:35:08 - mmengine - INFO - Iter(train) [352500/640000] base_lr: 8.5274e-05 lr: 9.5703e-06 eta: 4 days, 21:54:23 time: 1.5159 data_time: 0.0279 memory: 25719 grad_norm: 2.9576 loss: 1.2282 detection_loss_cls: 0.0314 detection_loss_reg: 0.3335 caption_loss_cls: 2.1488 grounding_loss_reg: 2.4946 semantic_segmentation_loss_cls: 0.0080 instance_segmentation_loss_cls: 0.0295 instance_segmentation_loss_reg: 0.3265 instance_segmentation_loss_poly: 0.8745 +2024/01/07 23:46:57 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240107_135549 +2024/01/07 23:46:57 - mmengine - INFO - Iter(train) [353000/640000] base_lr: 8.5034e-05 lr: 9.5485e-06 eta: 4 days, 21:35:53 time: 1.5007 data_time: 0.0276 memory: 25719 grad_norm: 2.9312 loss: 1.2308 detection_loss_cls: 0.0314 detection_loss_reg: 0.3335 caption_loss_cls: 2.1524 grounding_loss_reg: 2.4938 semantic_segmentation_loss_cls: 0.0080 instance_segmentation_loss_cls: 0.0295 instance_segmentation_loss_reg: 0.3272 instance_segmentation_loss_poly: 0.8755 +2024/01/07 23:58:52 - mmengine - INFO - Iter(train) [353500/640000] base_lr: 8.4794e-05 lr: 9.5267e-06 eta: 4 days, 21:18:58 time: 1.4811 data_time: 0.0272 memory: 25719 grad_norm: 3.2474 loss: 1.2408 detection_loss_cls: 0.0313 detection_loss_reg: 0.3321 caption_loss_cls: 2.1543 grounding_loss_reg: 2.4946 semantic_segmentation_loss_cls: 0.0080 instance_segmentation_loss_cls: 0.0294 instance_segmentation_loss_reg: 0.3252 instance_segmentation_loss_poly: 0.8709 +2024/01/08 00:10:25 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240107_135549 +2024/01/08 00:10:25 - mmengine - INFO - Iter(train) [354000/640000] base_lr: 8.4554e-05 lr: 9.5049e-06 eta: 4 days, 20:57:42 time: 1.4708 data_time: 0.0269 memory: 25719 grad_norm: 3.2723 loss: 1.2416 detection_loss_cls: 0.0314 detection_loss_reg: 0.3329 caption_loss_cls: 2.1569 grounding_loss_reg: 2.4995 semantic_segmentation_loss_cls: 0.0080 instance_segmentation_loss_cls: 0.0294 instance_segmentation_loss_reg: 0.3260 instance_segmentation_loss_poly: 0.8729 +2024/01/08 00:10:25 - mmengine - INFO - Saving checkpoint at 354000 iterations +2024/01/08 00:22:45 - mmengine - INFO - Iter(train) [354500/640000] base_lr: 8.4315e-05 lr: 9.4832e-06 eta: 4 days, 20:46:08 time: 1.4616 data_time: 0.0267 memory: 25719 grad_norm: 3.3553 loss: 1.2472 detection_loss_cls: 0.0312 detection_loss_reg: 0.3311 caption_loss_cls: 2.1540 grounding_loss_reg: 2.4949 semantic_segmentation_loss_cls: 0.0080 instance_segmentation_loss_cls: 0.0295 instance_segmentation_loss_reg: 0.3269 instance_segmentation_loss_poly: 0.8747 +2024/01/08 00:35:24 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240107_135549 +2024/01/08 00:35:24 - mmengine - INFO - Iter(train) [355000/640000] base_lr: 8.4075e-05 lr: 9.4614e-06 eta: 4 days, 20:38:12 time: 1.4728 data_time: 0.0269 memory: 25719 grad_norm: 3.2298 loss: 1.2387 detection_loss_cls: 0.0313 detection_loss_reg: 0.3316 caption_loss_cls: 2.1553 grounding_loss_reg: 2.4945 semantic_segmentation_loss_cls: 0.0080 instance_segmentation_loss_cls: 0.0294 instance_segmentation_loss_reg: 0.3249 instance_segmentation_loss_poly: 0.8705 +2024/01/08 00:48:07 - mmengine - INFO - Iter(train) [355500/640000] base_lr: 8.3836e-05 lr: 9.4396e-06 eta: 4 days, 20:30:47 time: 1.4757 data_time: 0.0268 memory: 25719 grad_norm: 3.2364 loss: 1.2286 detection_loss_cls: 0.0313 detection_loss_reg: 0.3325 caption_loss_cls: 2.1553 grounding_loss_reg: 2.4957 semantic_segmentation_loss_cls: 0.0080 instance_segmentation_loss_cls: 0.0294 instance_segmentation_loss_reg: 0.3252 instance_segmentation_loss_poly: 0.8706 +2024/01/08 01:00:44 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240107_135549 +2024/01/08 01:00:44 - mmengine - INFO - Iter(train) [356000/640000] base_lr: 8.3597e-05 lr: 9.4179e-06 eta: 4 days, 20:22:03 time: 1.4723 data_time: 0.0270 memory: 25719 grad_norm: 3.2966 loss: 1.2443 detection_loss_cls: 0.0312 detection_loss_reg: 0.3317 caption_loss_cls: 2.1492 grounding_loss_reg: 2.4963 semantic_segmentation_loss_cls: 0.0080 instance_segmentation_loss_cls: 0.0295 instance_segmentation_loss_reg: 0.3262 instance_segmentation_loss_poly: 0.8724 +2024/01/08 01:00:44 - mmengine - INFO - Saving checkpoint at 356000 iterations +2024/01/08 01:13:40 - mmengine - INFO - Iter(train) [356500/640000] base_lr: 8.3358e-05 lr: 9.3961e-06 eta: 4 days, 20:16:36 time: 1.4773 data_time: 0.0269 memory: 25719 grad_norm: 3.2925 loss: 1.2323 detection_loss_cls: 0.0311 detection_loss_reg: 0.3318 caption_loss_cls: 2.1497 grounding_loss_reg: 2.4952 semantic_segmentation_loss_cls: 0.0080 instance_segmentation_loss_cls: 0.0294 instance_segmentation_loss_reg: 0.3255 instance_segmentation_loss_poly: 0.8701 +2024/01/08 01:26:27 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240107_135549 +2024/01/08 01:26:27 - mmengine - INFO - Iter(train) [357000/640000] base_lr: 8.3118e-05 lr: 9.3744e-06 eta: 4 days, 20:09:09 time: 1.4917 data_time: 0.0271 memory: 25719 grad_norm: 3.3042 loss: 1.2294 detection_loss_cls: 0.0311 detection_loss_reg: 0.3315 caption_loss_cls: 2.1481 grounding_loss_reg: 2.4965 semantic_segmentation_loss_cls: 0.0080 instance_segmentation_loss_cls: 0.0294 instance_segmentation_loss_reg: 0.3255 instance_segmentation_loss_poly: 0.8704 +2024/01/08 01:39:52 - mmengine - INFO - Iter(train) [357500/640000] base_lr: 8.2880e-05 lr: 9.3527e-06 eta: 4 days, 20:08:10 time: 1.5142 data_time: 0.0277 memory: 25719 grad_norm: 3.0051 loss: 1.2246 detection_loss_cls: 0.0309 detection_loss_reg: 0.3310 caption_loss_cls: 2.1512 grounding_loss_reg: 2.4998 semantic_segmentation_loss_cls: 0.0080 instance_segmentation_loss_cls: 0.0293 instance_segmentation_loss_reg: 0.3249 instance_segmentation_loss_poly: 0.8696 +2024/01/08 01:51:48 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240107_135549 +2024/01/08 01:51:48 - mmengine - INFO - Iter(train) [358000/640000] base_lr: 8.2641e-05 lr: 9.3310e-06 eta: 4 days, 19:51:50 time: 1.5203 data_time: 0.0278 memory: 25719 grad_norm: 2.9997 loss: 1.2220 detection_loss_cls: 0.0309 detection_loss_reg: 0.3310 caption_loss_cls: 2.1568 grounding_loss_reg: 2.4969 semantic_segmentation_loss_cls: 0.0080 instance_segmentation_loss_cls: 0.0293 instance_segmentation_loss_reg: 0.3250 instance_segmentation_loss_poly: 0.8700 +2024/01/08 01:51:48 - mmengine - INFO - Saving checkpoint at 358000 iterations +2024/01/08 02:04:15 - mmengine - INFO - Iter(train) [358500/640000] base_lr: 8.2402e-05 lr: 9.3093e-06 eta: 4 days, 19:40:38 time: 1.5220 data_time: 0.0279 memory: 25719 grad_norm: 2.9752 loss: 1.2193 detection_loss_cls: 0.0311 detection_loss_reg: 0.3331 caption_loss_cls: 2.1580 grounding_loss_reg: 2.4963 semantic_segmentation_loss_cls: 0.0080 instance_segmentation_loss_cls: 0.0294 instance_segmentation_loss_reg: 0.3265 instance_segmentation_loss_poly: 0.8734 +2024/01/08 02:16:54 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240107_135549 +2024/01/08 02:16:54 - mmengine - INFO - Iter(train) [359000/640000] base_lr: 8.2163e-05 lr: 9.2876e-06 eta: 4 days, 19:31:25 time: 1.5220 data_time: 0.0279 memory: 25719 grad_norm: 2.9968 loss: 1.2234 detection_loss_cls: 0.0310 detection_loss_reg: 0.3327 caption_loss_cls: 2.1575 grounding_loss_reg: 2.5003 semantic_segmentation_loss_cls: 0.0080 instance_segmentation_loss_cls: 0.0294 instance_segmentation_loss_reg: 0.3262 instance_segmentation_loss_poly: 0.8720 +2024/01/08 02:28:55 - mmengine - INFO - Iter(train) [359500/640000] base_lr: 8.1925e-05 lr: 9.2659e-06 eta: 4 days, 19:15:54 time: 1.5113 data_time: 0.0277 memory: 25719 grad_norm: 3.0436 loss: 1.2314 detection_loss_cls: 0.0311 detection_loss_reg: 0.3332 caption_loss_cls: 2.1564 grounding_loss_reg: 2.4994 semantic_segmentation_loss_cls: 0.0079 instance_segmentation_loss_cls: 0.0294 instance_segmentation_loss_reg: 0.3264 instance_segmentation_loss_poly: 0.8720 +2024/01/08 02:40:52 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240107_135549 +2024/01/08 02:40:52 - mmengine - INFO - Iter(train) [360000/640000] base_lr: 8.1687e-05 lr: 9.2442e-06 eta: 4 days, 19:00:07 time: 1.5014 data_time: 0.0274 memory: 25719 grad_norm: 3.0336 loss: 1.2292 detection_loss_cls: 0.0309 detection_loss_reg: 0.3315 caption_loss_cls: 2.1611 grounding_loss_reg: 2.4946 semantic_segmentation_loss_cls: 0.0079 instance_segmentation_loss_cls: 0.0294 instance_segmentation_loss_reg: 0.3250 instance_segmentation_loss_poly: 0.8694 +2024/01/08 02:40:52 - mmengine - INFO - Saving checkpoint at 360000 iterations +2024/01/08 02:53:42 - mmengine - INFO - Evaluating bbox... +2024/01/08 02:54:40 - mmengine - INFO - bbox_mAP_copypaste: 0.495 0.677 0.542 0.335 0.545 0.636 +2024/01/08 02:54:40 - mmengine - INFO - Evaluating segm... +2024/01/08 02:55:53 - mmengine - INFO - segm_mAP_copypaste: 0.333 0.593 0.330 0.186 0.383 0.506 +2024/01/08 03:02:53 - mmengine - INFO - per class results: +2024/01/08 03:02:53 - mmengine - INFO - ++---------------------+-------+-------+ +| Class | IoU | Acc | ++---------------------+-------+-------+ +| wall | 78.24 | 89.14 | +| building | 81.48 | 90.81 | +| sky | 92.86 | 98.22 | +| floor | 82.45 | 89.23 | +| tree | 71.78 | 79.4 | +| ceiling | 84.09 | 94.32 | +| road | 82.42 | 89.54 | +| bed | 88.15 | 95.17 | +| windowpane | 61.68 | 76.8 | +| grass | 66.49 | 81.42 | +| cabinet | 59.32 | 70.42 | +| sidewalk | 65.11 | 77.9 | +| person | 80.33 | 91.52 | +| earth | 37.43 | 48.09 | +| door | 53.39 | 64.25 | +| table | 63.14 | 77.53 | +| mountain | 60.51 | 74.73 | +| plant | 52.68 | 67.61 | +| curtain | 72.53 | 87.46 | +| chair | 60.15 | 75.83 | +| car | 83.83 | 91.64 | +| water | 55.93 | 71.33 | +| painting | 73.31 | 85.53 | +| sofa | 70.6 | 81.52 | +| shelf | 42.54 | 71.17 | +| house | 41.37 | 61.51 | +| sea | 52.72 | 65.56 | +| mirror | 68.37 | 79.03 | +| rug | 72.0 | 79.3 | +| field | 29.49 | 57.14 | +| armchair | 50.76 | 72.08 | +| seat | 60.61 | 72.85 | +| fence | 45.02 | 59.16 | +| desk | 52.16 | 71.67 | +| rock | 46.76 | 74.01 | +| wardrobe | 32.8 | 45.86 | +| lamp | 61.95 | 73.53 | +| bathtub | 79.12 | 84.58 | +| railing | 35.47 | 48.38 | +| cushion | 58.48 | 69.9 | +| base | 25.02 | 38.66 | +| box | 26.23 | 37.46 | +| column | 49.93 | 63.87 | +| signboard | 38.97 | 52.65 | +| chest of drawers | 34.2 | 64.9 | +| counter | 41.22 | 48.37 | +| sand | 44.73 | 71.02 | +| sink | 71.27 | 82.34 | +| skyscraper | 68.5 | 92.77 | +| fireplace | 68.36 | 90.98 | +| refrigerator | 75.75 | 82.5 | +| grandstand | 31.05 | 77.4 | +| path | 23.87 | 43.66 | +| stairs | 27.04 | 32.06 | +| runway | 67.76 | 93.08 | +| case | 54.54 | 69.31 | +| pool table | 86.79 | 96.81 | +| pillow | 57.14 | 69.63 | +| screen door | 78.33 | 84.1 | +| stairway | 29.36 | 47.21 | +| river | 12.87 | 31.1 | +| bridge | 57.71 | 88.13 | +| bookcase | 36.39 | 56.91 | +| blind | 40.07 | 49.77 | +| coffee table | 64.38 | 85.8 | +| toilet | 86.67 | 89.93 | +| flower | 40.16 | 51.95 | +| book | 48.61 | 69.82 | +| hill | 13.77 | 22.85 | +| bench | 52.37 | 61.33 | +| countertop | 60.12 | 73.25 | +| stove | 76.25 | 81.84 | +| palm | 47.82 | 69.49 | +| kitchen island | 45.88 | 90.9 | +| computer | 73.6 | 84.23 | +| swivel chair | 43.95 | 61.02 | +| boat | 58.29 | 62.06 | +| bar | 44.34 | 52.89 | +| arcade machine | 56.26 | 60.08 | +| hovel | 23.64 | 49.06 | +| bus | 91.46 | 95.6 | +| towel | 61.68 | 70.29 | +| light | 48.3 | 54.95 | +| truck | 40.15 | 58.62 | +| tower | 21.01 | 46.97 | +| chandelier | 64.37 | 77.94 | +| awning | 32.51 | 39.66 | +| streetlight | 29.86 | 41.16 | +| booth | 33.45 | 38.83 | +| television receiver | 70.77 | 83.07 | +| airplane | 59.11 | 67.62 | +| dirt track | 9.16 | 16.6 | +| apparel | 32.4 | 44.22 | +| pole | 26.69 | 35.12 | +| land | 4.27 | 5.44 | +| bannister | 17.73 | 22.6 | +| escalator | 37.65 | 43.94 | +| ottoman | 51.42 | 63.34 | +| bottle | 23.07 | 28.48 | +| buffet | 36.03 | 43.19 | +| poster | 31.78 | 37.31 | +| stage | 10.11 | 22.21 | +| van | 46.07 | 57.76 | +| ship | 7.34 | 10.02 | +| fountain | 15.41 | 16.43 | +| conveyer belt | 85.1 | 90.17 | +| canopy | 18.31 | 26.62 | +| washer | 72.56 | 73.49 | +| plaything | 21.54 | 22.77 | +| swimming pool | 59.83 | 73.0 | +| stool | 52.65 | 64.93 | +| barrel | 12.89 | 66.23 | +| basket | 35.7 | 54.53 | +| waterfall | 49.1 | 77.38 | +| tent | 92.03 | 96.77 | +| bag | 20.91 | 27.52 | +| minibike | 72.89 | 81.6 | +| cradle | 70.63 | 97.19 | +| oven | 53.92 | 65.6 | +| ball | 50.74 | 70.43 | +| food | 49.32 | 52.37 | +| step | 9.61 | 13.45 | +| tank | 43.25 | 55.05 | +| trade name | 21.86 | 23.99 | +| microwave | 86.28 | 91.83 | +| pot | 54.13 | 65.68 | +| animal | 60.67 | 65.22 | +| bicycle | 57.22 | 74.32 | +| lake | 44.39 | 47.76 | +| dishwasher | 56.6 | 65.6 | +| screen | 52.53 | 69.21 | +| blanket | 13.43 | 15.26 | +| sculpture | 55.17 | 69.74 | +| hood | 57.06 | 67.09 | +| sconce | 37.5 | 43.01 | +| vase | 43.33 | 59.4 | +| traffic light | 39.42 | 51.26 | +| tray | 7.23 | 14.17 | +| ashcan | 45.96 | 58.45 | +| fan | 56.37 | 70.78 | +| pier | 33.64 | 41.02 | +| crt screen | 13.12 | 42.41 | +| plate | 54.9 | 76.91 | +| monitor | 13.3 | 17.47 | +| bulletin board | 32.21 | 40.19 | +| shower | 3.19 | 7.59 | +| radiator | 61.39 | 69.56 | +| glass | 18.62 | 20.29 | +| clock | 26.46 | 30.44 | +| flag | 24.65 | 27.71 | ++---------------------+-------+-------+ +2024/01/08 03:03:10 - mmengine - INFO - Iter(val) [209/209] coco/bbox_mAP: 0.4950 coco/bbox_mAP_50: 0.6770 coco/bbox_mAP_75: 0.5420 coco/bbox_mAP_s: 0.3350 coco/bbox_mAP_m: 0.5450 coco/bbox_mAP_l: 0.6360 coco/segm_mAP: 0.3330 coco/segm_mAP_50: 0.5930 coco/segm_mAP_75: 0.3300 coco/segm_mAP_s: 0.1860 coco/segm_mAP_m: 0.3830 coco/segm_mAP_l: 0.5060 Bleu_1: 0.7484 Bleu_2: 0.5762 Bleu_3: 0.4317 Bleu_4: 0.3206 METEOR: 0.2626 ROUGE_L: 0.5456 CIDEr: 1.0434 SPICE: 0.1962 aAcc: 82.9000 mIoU: 48.8900 mAcc: 61.4900 visual-grounding/miou: 0.8055 visual-grounding/acc: 0.8733 data_time: 0.0046 time: 1.3566 +2024/01/08 03:15:49 - mmengine - INFO - Iter(train) [360500/640000] base_lr: 8.1448e-05 lr: 9.2226e-06 eta: 4 days, 18:50:59 time: 1.4975 data_time: 0.0233 memory: 25719 grad_norm: 3.0274 loss: 1.2367 detection_loss_cls: 0.0310 detection_loss_reg: 0.3329 caption_loss_cls: 2.1584 grounding_loss_reg: 2.4940 semantic_segmentation_loss_cls: 0.0079 instance_segmentation_loss_cls: 0.0295 instance_segmentation_loss_reg: 0.3259 instance_segmentation_loss_poly: 0.8706 +2024/01/08 03:27:26 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240107_135549 +2024/01/08 03:27:26 - mmengine - INFO - Iter(train) [361000/640000] base_lr: 8.1210e-05 lr: 9.2009e-06 eta: 4 days, 18:32:15 time: 1.4802 data_time: 0.0230 memory: 25719 grad_norm: 3.0681 loss: 1.2469 detection_loss_cls: 0.0310 detection_loss_reg: 0.3330 caption_loss_cls: 2.1554 grounding_loss_reg: 2.4945 semantic_segmentation_loss_cls: 0.0079 instance_segmentation_loss_cls: 0.0294 instance_segmentation_loss_reg: 0.3259 instance_segmentation_loss_poly: 0.8699 +2024/01/08 03:39:30 - mmengine - INFO - Iter(train) [361500/640000] base_lr: 8.0972e-05 lr: 9.1793e-06 eta: 4 days, 18:17:39 time: 1.4599 data_time: 0.0226 memory: 25719 grad_norm: 3.1421 loss: 1.2464 detection_loss_cls: 0.0309 detection_loss_reg: 0.3322 caption_loss_cls: 2.1528 grounding_loss_reg: 2.4935 semantic_segmentation_loss_cls: 0.0079 instance_segmentation_loss_cls: 0.0293 instance_segmentation_loss_reg: 0.3253 instance_segmentation_loss_poly: 0.8682 +2024/01/08 03:51:11 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240107_135549 +2024/01/08 03:51:11 - mmengine - INFO - Iter(train) [362000/640000] base_lr: 8.0734e-05 lr: 9.1577e-06 eta: 4 days, 17:59:51 time: 1.4560 data_time: 0.0225 memory: 25719 grad_norm: 3.1416 loss: 1.2448 detection_loss_cls: 0.0308 detection_loss_reg: 0.3325 caption_loss_cls: 2.1542 grounding_loss_reg: 2.4910 semantic_segmentation_loss_cls: 0.0079 instance_segmentation_loss_cls: 0.0294 instance_segmentation_loss_reg: 0.3253 instance_segmentation_loss_poly: 0.8684 +2024/01/08 03:51:11 - mmengine - INFO - Saving checkpoint at 362000 iterations +2024/01/08 04:03:05 - mmengine - INFO - Iter(train) [362500/640000] base_lr: 8.0496e-05 lr: 9.1360e-06 eta: 4 days, 17:44:03 time: 1.4478 data_time: 0.0223 memory: 25719 grad_norm: 3.1536 loss: 1.2458 detection_loss_cls: 0.0307 detection_loss_reg: 0.3323 caption_loss_cls: 2.1520 grounding_loss_reg: 2.4914 semantic_segmentation_loss_cls: 0.0079 instance_segmentation_loss_cls: 0.0293 instance_segmentation_loss_reg: 0.3249 instance_segmentation_loss_poly: 0.8684 +2024/01/08 04:15:01 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240107_135549 +2024/01/08 04:15:01 - mmengine - INFO - Iter(train) [363000/640000] base_lr: 8.0259e-05 lr: 9.1144e-06 eta: 4 days, 17:28:41 time: 1.4370 data_time: 0.0222 memory: 25719 grad_norm: 3.1360 loss: 1.2553 detection_loss_cls: 0.0306 detection_loss_reg: 0.3324 caption_loss_cls: 2.1524 grounding_loss_reg: 2.4918 semantic_segmentation_loss_cls: 0.0079 instance_segmentation_loss_cls: 0.0293 instance_segmentation_loss_reg: 0.3243 instance_segmentation_loss_poly: 0.8674 +2024/01/08 04:27:03 - mmengine - INFO - Iter(train) [363500/640000] base_lr: 8.0021e-05 lr: 9.0928e-06 eta: 4 days, 17:14:19 time: 1.4376 data_time: 0.0222 memory: 25719 grad_norm: 3.1081 loss: 1.2579 detection_loss_cls: 0.0306 detection_loss_reg: 0.3324 caption_loss_cls: 2.1505 grounding_loss_reg: 2.4902 semantic_segmentation_loss_cls: 0.0079 instance_segmentation_loss_cls: 0.0294 instance_segmentation_loss_reg: 0.3254 instance_segmentation_loss_poly: 0.8695 +2024/01/08 04:39:25 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240107_135549 +2024/01/08 04:39:25 - mmengine - INFO - Iter(train) [364000/640000] base_lr: 7.9784e-05 lr: 9.0713e-06 eta: 4 days, 17:02:38 time: 1.4437 data_time: 0.0222 memory: 25719 grad_norm: 3.0758 loss: 1.2569 detection_loss_cls: 0.0307 detection_loss_reg: 0.3327 caption_loss_cls: 2.1549 grounding_loss_reg: 2.4870 semantic_segmentation_loss_cls: 0.0078 instance_segmentation_loss_cls: 0.0293 instance_segmentation_loss_reg: 0.3245 instance_segmentation_loss_poly: 0.8679 +2024/01/08 04:39:25 - mmengine - INFO - Saving checkpoint at 364000 iterations +2024/01/08 04:51:55 - mmengine - INFO - Iter(train) [364500/640000] base_lr: 7.9547e-05 lr: 9.0497e-06 eta: 4 days, 16:51:57 time: 1.4409 data_time: 0.0263 memory: 25719 grad_norm: 3.0528 loss: 1.2625 detection_loss_cls: 0.0307 detection_loss_reg: 0.3334 caption_loss_cls: 2.1540 grounding_loss_reg: 2.4882 semantic_segmentation_loss_cls: 0.0078 instance_segmentation_loss_cls: 0.0294 instance_segmentation_loss_reg: 0.3260 instance_segmentation_loss_poly: 0.8709 +2024/01/08 05:04:21 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240107_135549 +2024/01/08 05:04:21 - mmengine - INFO - Iter(train) [365000/640000] base_lr: 7.9309e-05 lr: 9.0281e-06 eta: 4 days, 16:40:45 time: 1.4531 data_time: 0.0266 memory: 25719 grad_norm: 3.0750 loss: 1.2612 detection_loss_cls: 0.0308 detection_loss_reg: 0.3346 caption_loss_cls: 2.1533 grounding_loss_reg: 2.4851 semantic_segmentation_loss_cls: 0.0078 instance_segmentation_loss_cls: 0.0294 instance_segmentation_loss_reg: 0.3266 instance_segmentation_loss_poly: 0.8728 +2024/01/08 05:17:46 - mmengine - INFO - Iter(train) [365500/640000] base_lr: 7.9072e-05 lr: 9.0066e-06 eta: 4 days, 16:37:06 time: 1.4734 data_time: 0.0271 memory: 25719 grad_norm: 2.9924 loss: 1.2608 detection_loss_cls: 0.0308 detection_loss_reg: 0.3343 caption_loss_cls: 2.1476 grounding_loss_reg: 2.4844 semantic_segmentation_loss_cls: 0.0078 instance_segmentation_loss_cls: 0.0293 instance_segmentation_loss_reg: 0.3276 instance_segmentation_loss_poly: 0.8747 +2024/01/08 05:30:32 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240107_135549 +2024/01/08 05:30:32 - mmengine - INFO - Iter(train) [366000/640000] base_lr: 7.8836e-05 lr: 8.9851e-06 eta: 4 days, 16:28:14 time: 1.4896 data_time: 0.0274 memory: 25719 grad_norm: 2.9302 loss: 1.2544 detection_loss_cls: 0.0309 detection_loss_reg: 0.3349 caption_loss_cls: 2.1505 grounding_loss_reg: 2.4831 semantic_segmentation_loss_cls: 0.0078 instance_segmentation_loss_cls: 0.0293 instance_segmentation_loss_reg: 0.3278 instance_segmentation_loss_poly: 0.8739 +2024/01/08 05:30:32 - mmengine - INFO - Saving checkpoint at 366000 iterations +2024/01/08 05:42:33 - mmengine - INFO - Iter(train) [366500/640000] base_lr: 7.8599e-05 lr: 8.9635e-06 eta: 4 days, 16:13:41 time: 1.4915 data_time: 0.0276 memory: 25719 grad_norm: 2.9152 loss: 1.2561 detection_loss_cls: 0.0309 detection_loss_reg: 0.3345 caption_loss_cls: 2.1511 grounding_loss_reg: 2.4836 semantic_segmentation_loss_cls: 0.0078 instance_segmentation_loss_cls: 0.0293 instance_segmentation_loss_reg: 0.3284 instance_segmentation_loss_poly: 0.8745 +2024/01/08 05:54:36 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240107_135549 +2024/01/08 05:54:36 - mmengine - INFO - Iter(train) [367000/640000] base_lr: 7.8362e-05 lr: 8.9420e-06 eta: 4 days, 15:59:20 time: 1.4931 data_time: 0.0284 memory: 25719 grad_norm: 2.9287 loss: 1.2592 detection_loss_cls: 0.0308 detection_loss_reg: 0.3335 caption_loss_cls: 2.1506 grounding_loss_reg: 2.4858 semantic_segmentation_loss_cls: 0.0078 instance_segmentation_loss_cls: 0.0293 instance_segmentation_loss_reg: 0.3277 instance_segmentation_loss_poly: 0.8721 +2024/01/08 06:07:11 - mmengine - INFO - Iter(train) [367500/640000] base_lr: 7.8126e-05 lr: 8.9205e-06 eta: 4 days, 15:49:02 time: 1.5012 data_time: 0.0284 memory: 25719 grad_norm: 2.9028 loss: 1.2529 detection_loss_cls: 0.0308 detection_loss_reg: 0.3339 caption_loss_cls: 2.1505 grounding_loss_reg: 2.4829 semantic_segmentation_loss_cls: 0.0078 instance_segmentation_loss_cls: 0.0293 instance_segmentation_loss_reg: 0.3274 instance_segmentation_loss_poly: 0.8729 +2024/01/08 06:19:12 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240107_135549 +2024/01/08 06:19:12 - mmengine - INFO - Iter(train) [368000/640000] base_lr: 7.7889e-05 lr: 8.8990e-06 eta: 4 days, 15:34:36 time: 1.4960 data_time: 0.0286 memory: 25719 grad_norm: 2.9489 loss: 1.2617 detection_loss_cls: 0.0309 detection_loss_reg: 0.3351 caption_loss_cls: 2.1478 grounding_loss_reg: 2.4803 semantic_segmentation_loss_cls: 0.0078 instance_segmentation_loss_cls: 0.0295 instance_segmentation_loss_reg: 0.3291 instance_segmentation_loss_poly: 0.8765 +2024/01/08 06:19:12 - mmengine - INFO - Saving checkpoint at 368000 iterations +2024/01/08 06:32:22 - mmengine - INFO - Iter(train) [368500/640000] base_lr: 7.7653e-05 lr: 8.8776e-06 eta: 4 days, 15:28:22 time: 1.5062 data_time: 0.0287 memory: 25719 grad_norm: 2.9526 loss: 1.2523 detection_loss_cls: 0.0307 detection_loss_reg: 0.3340 caption_loss_cls: 2.1503 grounding_loss_reg: 2.4777 semantic_segmentation_loss_cls: 0.0078 instance_segmentation_loss_cls: 0.0292 instance_segmentation_loss_reg: 0.3284 instance_segmentation_loss_poly: 0.8738 +2024/01/08 06:44:35 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240107_135549 +2024/01/08 06:44:35 - mmengine - INFO - Iter(train) [369000/640000] base_lr: 7.7417e-05 lr: 8.8561e-06 eta: 4 days, 15:15:14 time: 1.5028 data_time: 0.0286 memory: 25719 grad_norm: 2.9199 loss: 1.2488 detection_loss_cls: 0.0307 detection_loss_reg: 0.3337 caption_loss_cls: 2.1496 grounding_loss_reg: 2.4764 semantic_segmentation_loss_cls: 0.0078 instance_segmentation_loss_cls: 0.0292 instance_segmentation_loss_reg: 0.3281 instance_segmentation_loss_poly: 0.8735 +2024/01/08 06:56:57 - mmengine - INFO - Iter(train) [369500/640000] base_lr: 7.7181e-05 lr: 8.8347e-06 eta: 4 days, 15:03:19 time: 1.4872 data_time: 0.0281 memory: 25719 grad_norm: 2.9394 loss: 1.2443 detection_loss_cls: 0.0307 detection_loss_reg: 0.3334 caption_loss_cls: 2.1472 grounding_loss_reg: 2.4769 semantic_segmentation_loss_cls: 0.0078 instance_segmentation_loss_cls: 0.0292 instance_segmentation_loss_reg: 0.3279 instance_segmentation_loss_poly: 0.8729 +2024/01/08 07:09:39 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240107_135549 +2024/01/08 07:09:39 - mmengine - INFO - Iter(train) [370000/640000] base_lr: 7.6945e-05 lr: 8.8132e-06 eta: 4 days, 14:53:28 time: 1.4860 data_time: 0.0279 memory: 25719 grad_norm: 2.9245 loss: 1.2395 detection_loss_cls: 0.0307 detection_loss_reg: 0.3335 caption_loss_cls: 2.1505 grounding_loss_reg: 2.4760 semantic_segmentation_loss_cls: 0.0078 instance_segmentation_loss_cls: 0.0292 instance_segmentation_loss_reg: 0.3277 instance_segmentation_loss_poly: 0.8724 +2024/01/08 07:09:39 - mmengine - INFO - Saving checkpoint at 370000 iterations +2024/01/08 07:22:33 - mmengine - INFO - Iter(train) [370500/640000] base_lr: 7.6710e-05 lr: 8.7918e-06 eta: 4 days, 14:44:57 time: 1.4992 data_time: 0.0282 memory: 25719 grad_norm: 2.8907 loss: 1.2301 detection_loss_cls: 0.0305 detection_loss_reg: 0.3326 caption_loss_cls: 2.1473 grounding_loss_reg: 2.4729 semantic_segmentation_loss_cls: 0.0078 instance_segmentation_loss_cls: 0.0291 instance_segmentation_loss_reg: 0.3275 instance_segmentation_loss_poly: 0.8723 +2024/01/08 07:35:13 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240107_135549 +2024/01/08 07:35:13 - mmengine - INFO - Iter(train) [371000/640000] base_lr: 7.6474e-05 lr: 8.7704e-06 eta: 4 days, 14:34:49 time: 1.5086 data_time: 0.0275 memory: 25719 grad_norm: 2.8315 loss: 1.2153 detection_loss_cls: 0.0306 detection_loss_reg: 0.3336 caption_loss_cls: 2.1469 grounding_loss_reg: 2.4733 semantic_segmentation_loss_cls: 0.0078 instance_segmentation_loss_cls: 0.0291 instance_segmentation_loss_reg: 0.3286 instance_segmentation_loss_poly: 0.8737 +2024/01/08 07:47:22 - mmengine - INFO - Iter(train) [371500/640000] base_lr: 7.6239e-05 lr: 8.7490e-06 eta: 4 days, 14:21:19 time: 1.5022 data_time: 0.0275 memory: 25719 grad_norm: 2.8551 loss: 1.2267 detection_loss_cls: 0.0308 detection_loss_reg: 0.3349 caption_loss_cls: 2.1511 grounding_loss_reg: 2.4711 semantic_segmentation_loss_cls: 0.0078 instance_segmentation_loss_cls: 0.0291 instance_segmentation_loss_reg: 0.3281 instance_segmentation_loss_poly: 0.8722 +2024/01/08 07:59:43 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240107_135549 +2024/01/08 07:59:43 - mmengine - INFO - Iter(train) [372000/640000] base_lr: 7.6004e-05 lr: 8.7276e-06 eta: 4 days, 14:09:06 time: 1.5072 data_time: 0.0275 memory: 25719 grad_norm: 2.8225 loss: 1.2144 detection_loss_cls: 0.0307 detection_loss_reg: 0.3345 caption_loss_cls: 2.1506 grounding_loss_reg: 2.4707 semantic_segmentation_loss_cls: 0.0078 instance_segmentation_loss_cls: 0.0292 instance_segmentation_loss_reg: 0.3298 instance_segmentation_loss_poly: 0.8752 +2024/01/08 07:59:43 - mmengine - INFO - Saving checkpoint at 372000 iterations +2024/01/08 08:12:37 - mmengine - INFO - Iter(train) [372500/640000] base_lr: 7.5769e-05 lr: 8.7063e-06 eta: 4 days, 14:00:20 time: 1.5031 data_time: 0.0275 memory: 25719 grad_norm: 2.8507 loss: 1.2140 detection_loss_cls: 0.0308 detection_loss_reg: 0.3348 caption_loss_cls: 2.1447 grounding_loss_reg: 2.4701 semantic_segmentation_loss_cls: 0.0077 instance_segmentation_loss_cls: 0.0292 instance_segmentation_loss_reg: 0.3297 instance_segmentation_loss_poly: 0.8746 +2024/01/08 08:24:52 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240107_135549 +2024/01/08 08:24:52 - mmengine - INFO - Iter(train) [373000/640000] base_lr: 7.5534e-05 lr: 8.6849e-06 eta: 4 days, 13:47:25 time: 1.5038 data_time: 0.0276 memory: 25719 grad_norm: 2.8531 loss: 1.2212 detection_loss_cls: 0.0308 detection_loss_reg: 0.3350 caption_loss_cls: 2.1474 grounding_loss_reg: 2.4706 semantic_segmentation_loss_cls: 0.0077 instance_segmentation_loss_cls: 0.0293 instance_segmentation_loss_reg: 0.3301 instance_segmentation_loss_poly: 0.8759 +2024/01/08 08:37:30 - mmengine - INFO - Iter(train) [373500/640000] base_lr: 7.5299e-05 lr: 8.6636e-06 eta: 4 days, 13:36:50 time: 1.5075 data_time: 0.0278 memory: 25719 grad_norm: 2.8569 loss: 1.2312 detection_loss_cls: 0.0309 detection_loss_reg: 0.3360 caption_loss_cls: 2.1509 grounding_loss_reg: 2.4674 semantic_segmentation_loss_cls: 0.0077 instance_segmentation_loss_cls: 0.0293 instance_segmentation_loss_reg: 0.3303 instance_segmentation_loss_poly: 0.8759 +2024/01/08 08:49:17 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240107_135549 +2024/01/08 08:49:17 - mmengine - INFO - Iter(train) [374000/640000] base_lr: 7.5065e-05 lr: 8.6422e-06 eta: 4 days, 13:21:05 time: 1.4939 data_time: 0.0278 memory: 25719 grad_norm: 2.9492 loss: 1.2470 detection_loss_cls: 0.0309 detection_loss_reg: 0.3360 caption_loss_cls: 2.1502 grounding_loss_reg: 2.4656 semantic_segmentation_loss_cls: 0.0077 instance_segmentation_loss_cls: 0.0292 instance_segmentation_loss_reg: 0.3302 instance_segmentation_loss_poly: 0.8750 +2024/01/08 08:49:17 - mmengine - INFO - Saving checkpoint at 374000 iterations +2024/01/08 09:02:56 - mmengine - INFO - Iter(train) [374500/640000] base_lr: 7.4830e-05 lr: 8.6209e-06 eta: 4 days, 13:16:37 time: 1.5052 data_time: 0.0279 memory: 25719 grad_norm: 2.9324 loss: 1.2436 detection_loss_cls: 0.0309 detection_loss_reg: 0.3362 caption_loss_cls: 2.1522 grounding_loss_reg: 2.4620 semantic_segmentation_loss_cls: 0.0077 instance_segmentation_loss_cls: 0.0293 instance_segmentation_loss_reg: 0.3313 instance_segmentation_loss_poly: 0.8766 +2024/01/08 09:15:50 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240107_135549 +2024/01/08 09:15:50 - mmengine - INFO - Iter(train) [375000/640000] base_lr: 7.4596e-05 lr: 8.5996e-06 eta: 4 days, 13:07:28 time: 1.5087 data_time: 0.0279 memory: 25719 grad_norm: 2.9989 loss: 1.2477 detection_loss_cls: 0.0309 detection_loss_reg: 0.3358 caption_loss_cls: 2.1510 grounding_loss_reg: 2.4658 semantic_segmentation_loss_cls: 0.0077 instance_segmentation_loss_cls: 0.0293 instance_segmentation_loss_reg: 0.3310 instance_segmentation_loss_poly: 0.8767 +2024/01/08 09:28:02 - mmengine - INFO - Iter(train) [375500/640000] base_lr: 7.4362e-05 lr: 8.5783e-06 eta: 4 days, 12:54:09 time: 1.5093 data_time: 0.0280 memory: 25719 grad_norm: 3.0133 loss: 1.2401 detection_loss_cls: 0.0309 detection_loss_reg: 0.3366 caption_loss_cls: 2.1517 grounding_loss_reg: 2.4630 semantic_segmentation_loss_cls: 0.0077 instance_segmentation_loss_cls: 0.0292 instance_segmentation_loss_reg: 0.3298 instance_segmentation_loss_poly: 0.8733 +2024/01/08 09:40:27 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240107_135549 +2024/01/08 09:40:27 - mmengine - INFO - Iter(train) [376000/640000] base_lr: 7.4128e-05 lr: 8.5571e-06 eta: 4 days, 12:42:11 time: 1.5103 data_time: 0.0279 memory: 25719 grad_norm: 3.0397 loss: 1.2418 detection_loss_cls: 0.0308 detection_loss_reg: 0.3356 caption_loss_cls: 2.1529 grounding_loss_reg: 2.4646 semantic_segmentation_loss_cls: 0.0076 instance_segmentation_loss_cls: 0.0293 instance_segmentation_loss_reg: 0.3303 instance_segmentation_loss_poly: 0.8746 +2024/01/08 09:40:27 - mmengine - INFO - Saving checkpoint at 376000 iterations +2024/01/08 09:52:40 - mmengine - INFO - Iter(train) [376500/640000] base_lr: 7.3894e-05 lr: 8.5358e-06 eta: 4 days, 12:29:01 time: 1.5000 data_time: 0.0277 memory: 25719 grad_norm: 3.0583 loss: 1.2525 detection_loss_cls: 0.0308 detection_loss_reg: 0.3355 caption_loss_cls: 2.1567 grounding_loss_reg: 2.4638 semantic_segmentation_loss_cls: 0.0076 instance_segmentation_loss_cls: 0.0293 instance_segmentation_loss_reg: 0.3306 instance_segmentation_loss_poly: 0.8748 +2024/01/08 10:05:23 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240107_135549 +2024/01/08 10:05:23 - mmengine - INFO - Iter(train) [377000/640000] base_lr: 7.3660e-05 lr: 8.5146e-06 eta: 4 days, 12:18:40 time: 1.5069 data_time: 0.0278 memory: 25719 grad_norm: 3.0254 loss: 1.2399 detection_loss_cls: 0.0308 detection_loss_reg: 0.3360 caption_loss_cls: 2.1578 grounding_loss_reg: 2.4636 semantic_segmentation_loss_cls: 0.0076 instance_segmentation_loss_cls: 0.0294 instance_segmentation_loss_reg: 0.3319 instance_segmentation_loss_poly: 0.8768 +2024/01/08 10:17:11 - mmengine - INFO - Iter(train) [377500/640000] base_lr: 7.3427e-05 lr: 8.4934e-06 eta: 4 days, 12:03:15 time: 1.4946 data_time: 0.0276 memory: 25719 grad_norm: 3.0417 loss: 1.2429 detection_loss_cls: 0.0308 detection_loss_reg: 0.3366 caption_loss_cls: 2.1516 grounding_loss_reg: 2.4626 semantic_segmentation_loss_cls: 0.0076 instance_segmentation_loss_cls: 0.0295 instance_segmentation_loss_reg: 0.3324 instance_segmentation_loss_poly: 0.8781 +2024/01/08 10:29:13 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240107_135549 +2024/01/08 10:29:13 - mmengine - INFO - Iter(train) [378000/640000] base_lr: 7.3194e-05 lr: 8.4722e-06 eta: 4 days, 11:49:07 time: 1.4984 data_time: 0.0276 memory: 25719 grad_norm: 2.9958 loss: 1.2282 detection_loss_cls: 0.0308 detection_loss_reg: 0.3363 caption_loss_cls: 2.1422 grounding_loss_reg: 2.4602 semantic_segmentation_loss_cls: 0.0076 instance_segmentation_loss_cls: 0.0294 instance_segmentation_loss_reg: 0.3323 instance_segmentation_loss_poly: 0.8772 +2024/01/08 10:29:13 - mmengine - INFO - Saving checkpoint at 378000 iterations +2024/01/08 10:41:46 - mmengine - INFO - Iter(train) [378500/640000] base_lr: 7.2961e-05 lr: 8.4510e-06 eta: 4 days, 11:37:50 time: 1.4817 data_time: 0.0274 memory: 25719 grad_norm: 3.0199 loss: 1.2370 detection_loss_cls: 0.0309 detection_loss_reg: 0.3368 caption_loss_cls: 2.1474 grounding_loss_reg: 2.4586 semantic_segmentation_loss_cls: 0.0076 instance_segmentation_loss_cls: 0.0294 instance_segmentation_loss_reg: 0.3320 instance_segmentation_loss_poly: 0.8774 +2024/01/08 10:55:30 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240107_135549 +2024/01/08 10:55:30 - mmengine - INFO - Iter(train) [379000/640000] base_lr: 7.2728e-05 lr: 8.4298e-06 eta: 4 days, 11:32:48 time: 1.4942 data_time: 0.0276 memory: 25719 grad_norm: 2.9924 loss: 1.2425 detection_loss_cls: 0.0308 detection_loss_reg: 0.3356 caption_loss_cls: 2.1531 grounding_loss_reg: 2.4577 semantic_segmentation_loss_cls: 0.0076 instance_segmentation_loss_cls: 0.0294 instance_segmentation_loss_reg: 0.3329 instance_segmentation_loss_poly: 0.8806 +2024/01/08 11:08:00 - mmengine - INFO - Iter(train) [379500/640000] base_lr: 7.2495e-05 lr: 8.4086e-06 eta: 4 days, 11:21:12 time: 1.4989 data_time: 0.0276 memory: 25719 grad_norm: 2.9632 loss: 1.2377 detection_loss_cls: 0.0308 detection_loss_reg: 0.3364 caption_loss_cls: 2.1493 grounding_loss_reg: 2.4561 semantic_segmentation_loss_cls: 0.0076 instance_segmentation_loss_cls: 0.0294 instance_segmentation_loss_reg: 0.3334 instance_segmentation_loss_poly: 0.8817 +2024/01/08 11:20:17 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240107_135549 +2024/01/08 11:20:17 - mmengine - INFO - Iter(train) [380000/640000] base_lr: 7.2262e-05 lr: 8.3875e-06 eta: 4 days, 11:08:20 time: 1.4966 data_time: 0.0275 memory: 25719 grad_norm: 2.9757 loss: 1.2331 detection_loss_cls: 0.0309 detection_loss_reg: 0.3365 caption_loss_cls: 2.1469 grounding_loss_reg: 2.4576 semantic_segmentation_loss_cls: 0.0076 instance_segmentation_loss_cls: 0.0293 instance_segmentation_loss_reg: 0.3326 instance_segmentation_loss_poly: 0.8795 +2024/01/08 11:20:17 - mmengine - INFO - Saving checkpoint at 380000 iterations +2024/01/08 11:33:25 - mmengine - INFO - Evaluating bbox... +2024/01/08 11:34:22 - mmengine - INFO - bbox_mAP_copypaste: 0.497 0.677 0.543 0.343 0.549 0.638 +2024/01/08 11:34:22 - mmengine - INFO - Evaluating segm... +2024/01/08 11:35:33 - mmengine - INFO - segm_mAP_copypaste: 0.333 0.596 0.326 0.187 0.384 0.507 +2024/01/08 11:42:48 - mmengine - INFO - per class results: +2024/01/08 11:42:48 - mmengine - INFO - ++---------------------+-------+-------+ +| Class | IoU | Acc | ++---------------------+-------+-------+ +| wall | 77.12 | 88.93 | +| building | 82.38 | 91.47 | +| sky | 93.0 | 97.99 | +| floor | 82.66 | 90.26 | +| tree | 73.26 | 86.82 | +| ceiling | 81.7 | 88.58 | +| road | 81.58 | 91.61 | +| bed | 89.24 | 95.65 | +| windowpane | 62.96 | 82.63 | +| grass | 64.87 | 83.14 | +| cabinet | 64.54 | 76.64 | +| sidewalk | 59.56 | 69.0 | +| person | 80.47 | 91.76 | +| earth | 37.93 | 48.26 | +| door | 51.84 | 70.49 | +| table | 64.37 | 75.18 | +| mountain | 58.0 | 67.69 | +| plant | 50.56 | 60.57 | +| curtain | 72.42 | 86.86 | +| chair | 59.49 | 71.44 | +| car | 83.91 | 91.74 | +| water | 50.5 | 63.51 | +| painting | 70.53 | 87.34 | +| sofa | 70.52 | 80.73 | +| shelf | 45.53 | 64.28 | +| house | 44.66 | 57.95 | +| sea | 49.3 | 75.47 | +| mirror | 66.28 | 80.25 | +| rug | 68.15 | 76.04 | +| field | 30.16 | 52.62 | +| armchair | 49.15 | 71.58 | +| seat | 64.51 | 81.85 | +| fence | 44.13 | 59.37 | +| desk | 48.63 | 61.43 | +| rock | 49.99 | 70.61 | +| wardrobe | 46.95 | 55.85 | +| lamp | 61.97 | 71.78 | +| bathtub | 80.54 | 86.39 | +| railing | 38.2 | 52.19 | +| cushion | 60.68 | 76.05 | +| base | 28.7 | 49.44 | +| box | 26.44 | 35.56 | +| column | 49.19 | 66.67 | +| signboard | 37.05 | 51.98 | +| chest of drawers | 40.24 | 59.3 | +| counter | 36.37 | 45.98 | +| sand | 42.82 | 62.14 | +| sink | 72.29 | 82.09 | +| skyscraper | 64.26 | 82.67 | +| fireplace | 71.55 | 88.86 | +| refrigerator | 72.59 | 80.18 | +| grandstand | 40.6 | 77.81 | +| path | 25.13 | 48.4 | +| stairs | 32.71 | 44.24 | +| runway | 66.52 | 79.82 | +| case | 55.41 | 67.09 | +| pool table | 86.31 | 96.87 | +| pillow | 54.57 | 63.59 | +| screen door | 76.3 | 81.42 | +| stairway | 33.11 | 49.52 | +| river | 16.43 | 27.89 | +| bridge | 66.77 | 83.63 | +| bookcase | 39.02 | 56.71 | +| blind | 31.08 | 33.13 | +| coffee table | 67.96 | 85.27 | +| toilet | 85.31 | 89.75 | +| flower | 36.81 | 59.93 | +| book | 49.56 | 68.71 | +| hill | 13.83 | 28.01 | +| bench | 53.23 | 70.29 | +| countertop | 55.98 | 70.3 | +| stove | 78.22 | 85.4 | +| palm | 48.39 | 68.89 | +| kitchen island | 46.36 | 85.35 | +| computer | 74.42 | 86.35 | +| swivel chair | 46.63 | 65.15 | +| boat | 47.92 | 50.49 | +| bar | 40.21 | 48.9 | +| arcade machine | 62.6 | 67.13 | +| hovel | 22.15 | 23.85 | +| bus | 92.34 | 95.43 | +| towel | 64.91 | 72.07 | +| light | 49.63 | 56.74 | +| truck | 42.43 | 57.69 | +| tower | 27.72 | 59.11 | +| chandelier | 65.81 | 81.3 | +| awning | 34.08 | 40.05 | +| streetlight | 27.18 | 33.87 | +| booth | 47.95 | 49.04 | +| television receiver | 72.46 | 84.3 | +| airplane | 62.26 | 72.96 | +| dirt track | 9.37 | 17.2 | +| apparel | 27.87 | 38.11 | +| pole | 27.11 | 41.0 | +| land | 3.51 | 4.23 | +| bannister | 14.78 | 17.97 | +| escalator | 22.35 | 23.79 | +| ottoman | 52.13 | 71.58 | +| bottle | 22.87 | 28.85 | +| buffet | 47.96 | 64.41 | +| poster | 28.13 | 36.03 | +| stage | 9.81 | 15.88 | +| van | 39.85 | 52.06 | +| ship | 6.77 | 10.1 | +| fountain | 22.75 | 25.14 | +| conveyer belt | 82.72 | 90.86 | +| canopy | 19.56 | 33.31 | +| washer | 68.58 | 69.11 | +| plaything | 31.5 | 41.77 | +| swimming pool | 69.24 | 72.0 | +| stool | 48.85 | 65.88 | +| barrel | 17.85 | 62.85 | +| basket | 32.5 | 48.48 | +| waterfall | 58.84 | 92.38 | +| tent | 83.67 | 97.36 | +| bag | 20.26 | 26.36 | +| minibike | 69.88 | 82.25 | +| cradle | 73.47 | 96.33 | +| oven | 61.05 | 70.79 | +| ball | 50.91 | 65.97 | +| food | 47.33 | 52.52 | +| step | 9.37 | 14.55 | +| tank | 39.37 | 43.41 | +| trade name | 18.09 | 19.49 | +| microwave | 85.78 | 94.54 | +| pot | 54.05 | 61.72 | +| animal | 56.28 | 58.93 | +| bicycle | 57.21 | 73.97 | +| lake | 57.05 | 62.43 | +| dishwasher | 54.75 | 67.26 | +| screen | 60.46 | 72.55 | +| blanket | 13.55 | 16.35 | +| sculpture | 48.25 | 73.22 | +| hood | 60.78 | 64.46 | +| sconce | 43.24 | 53.07 | +| vase | 42.11 | 56.16 | +| traffic light | 39.38 | 56.78 | +| tray | 5.34 | 7.71 | +| ashcan | 40.14 | 52.49 | +| fan | 56.0 | 62.22 | +| pier | 16.18 | 43.75 | +| crt screen | 16.3 | 37.45 | +| plate | 54.26 | 71.49 | +| monitor | 13.88 | 16.4 | +| bulletin board | 40.41 | 54.82 | +| shower | 3.69 | 6.1 | +| radiator | 59.45 | 66.93 | +| glass | 20.07 | 22.2 | +| clock | 25.71 | 31.48 | +| flag | 25.1 | 29.63 | ++---------------------+-------+-------+ +2024/01/08 11:43:04 - mmengine - INFO - Iter(val) [209/209] coco/bbox_mAP: 0.4970 coco/bbox_mAP_50: 0.6770 coco/bbox_mAP_75: 0.5430 coco/bbox_mAP_s: 0.3430 coco/bbox_mAP_m: 0.5490 coco/bbox_mAP_l: 0.6380 coco/segm_mAP: 0.3330 coco/segm_mAP_50: 0.5960 coco/segm_mAP_75: 0.3260 coco/segm_mAP_s: 0.1870 coco/segm_mAP_m: 0.3840 coco/segm_mAP_l: 0.5070 Bleu_1: 0.7494 Bleu_2: 0.5826 Bleu_3: 0.4404 Bleu_4: 0.3299 METEOR: 0.2690 ROUGE_L: 0.5522 CIDEr: 1.0774 SPICE: 0.1997 aAcc: 82.9700 mIoU: 49.2100 mAcc: 61.4000 visual-grounding/miou: 0.8078 visual-grounding/acc: 0.8742 data_time: 0.0042 time: 1.3570 +2024/01/08 11:55:19 - mmengine - INFO - Iter(train) [380500/640000] base_lr: 7.2030e-05 lr: 8.3663e-06 eta: 4 days, 10:55:29 time: 1.4976 data_time: 0.0234 memory: 25719 grad_norm: 2.9408 loss: 1.2209 detection_loss_cls: 0.0309 detection_loss_reg: 0.3377 caption_loss_cls: 2.1464 grounding_loss_reg: 2.4562 semantic_segmentation_loss_cls: 0.0076 instance_segmentation_loss_cls: 0.0294 instance_segmentation_loss_reg: 0.3339 instance_segmentation_loss_poly: 0.8824 +2024/01/08 12:07:30 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240107_135549 +2024/01/08 12:07:30 - mmengine - INFO - Iter(train) [381000/640000] base_lr: 7.1798e-05 lr: 8.3452e-06 eta: 4 days, 10:42:13 time: 1.4897 data_time: 0.0232 memory: 25719 grad_norm: 2.9524 loss: 1.2212 detection_loss_cls: 0.0307 detection_loss_reg: 0.3362 caption_loss_cls: 2.1478 grounding_loss_reg: 2.4547 semantic_segmentation_loss_cls: 0.0076 instance_segmentation_loss_cls: 0.0294 instance_segmentation_loss_reg: 0.3334 instance_segmentation_loss_poly: 0.8815 +2024/01/08 12:19:26 - mmengine - INFO - Iter(train) [381500/640000] base_lr: 7.1566e-05 lr: 8.3241e-06 eta: 4 days, 10:27:43 time: 1.4917 data_time: 0.0232 memory: 25719 grad_norm: 2.9616 loss: 1.2228 detection_loss_cls: 0.0307 detection_loss_reg: 0.3358 caption_loss_cls: 2.1509 grounding_loss_reg: 2.4585 semantic_segmentation_loss_cls: 0.0076 instance_segmentation_loss_cls: 0.0294 instance_segmentation_loss_reg: 0.3343 instance_segmentation_loss_poly: 0.8830 +2024/01/08 12:31:36 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240107_135549 +2024/01/08 12:31:36 - mmengine - INFO - Iter(train) [382000/640000] base_lr: 7.1334e-05 lr: 8.3031e-06 eta: 4 days, 10:14:24 time: 1.4937 data_time: 0.0232 memory: 25719 grad_norm: 2.9711 loss: 1.2249 detection_loss_cls: 0.0307 detection_loss_reg: 0.3365 caption_loss_cls: 2.1498 grounding_loss_reg: 2.4566 semantic_segmentation_loss_cls: 0.0076 instance_segmentation_loss_cls: 0.0294 instance_segmentation_loss_reg: 0.3345 instance_segmentation_loss_poly: 0.8836 +2024/01/08 12:31:36 - mmengine - INFO - Saving checkpoint at 382000 iterations +2024/01/08 12:44:28 - mmengine - INFO - Iter(train) [382500/640000] base_lr: 7.1102e-05 lr: 8.2820e-06 eta: 4 days, 10:04:29 time: 1.4983 data_time: 0.0231 memory: 25719 grad_norm: 2.9802 loss: 1.2216 detection_loss_cls: 0.0308 detection_loss_reg: 0.3357 caption_loss_cls: 2.1506 grounding_loss_reg: 2.4548 semantic_segmentation_loss_cls: 0.0076 instance_segmentation_loss_cls: 0.0294 instance_segmentation_loss_reg: 0.3345 instance_segmentation_loss_poly: 0.8831 +2024/01/08 12:56:56 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240107_135549 +2024/01/08 12:56:56 - mmengine - INFO - Iter(train) [383000/640000] base_lr: 7.0870e-05 lr: 8.2609e-06 eta: 4 days, 9:52:36 time: 1.4794 data_time: 0.0229 memory: 25719 grad_norm: 3.0042 loss: 1.2185 detection_loss_cls: 0.0309 detection_loss_reg: 0.3373 caption_loss_cls: 2.1508 grounding_loss_reg: 2.4520 semantic_segmentation_loss_cls: 0.0076 instance_segmentation_loss_cls: 0.0292 instance_segmentation_loss_reg: 0.3333 instance_segmentation_loss_poly: 0.8806 +2024/01/08 13:08:53 - mmengine - INFO - Iter(train) [383500/640000] base_lr: 7.0639e-05 lr: 8.2399e-06 eta: 4 days, 9:38:19 time: 1.4712 data_time: 0.0227 memory: 25719 grad_norm: 3.0016 loss: 1.2130 detection_loss_cls: 0.0308 detection_loss_reg: 0.3364 caption_loss_cls: 2.1515 grounding_loss_reg: 2.4468 semantic_segmentation_loss_cls: 0.0076 instance_segmentation_loss_cls: 0.0294 instance_segmentation_loss_reg: 0.3352 instance_segmentation_loss_poly: 0.8850 +2024/01/08 13:21:20 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240107_135549 +2024/01/08 13:21:20 - mmengine - INFO - Iter(train) [384000/640000] base_lr: 7.0408e-05 lr: 8.2189e-06 eta: 4 days, 9:26:23 time: 1.4738 data_time: 0.0227 memory: 25719 grad_norm: 2.9970 loss: 1.2168 detection_loss_cls: 0.0307 detection_loss_reg: 0.3361 caption_loss_cls: 2.1455 grounding_loss_reg: 2.4458 semantic_segmentation_loss_cls: 0.0076 instance_segmentation_loss_cls: 0.0293 instance_segmentation_loss_reg: 0.3341 instance_segmentation_loss_poly: 0.8831 +2024/01/08 13:21:20 - mmengine - INFO - Saving checkpoint at 384000 iterations +2024/01/08 13:33:37 - mmengine - INFO - Iter(train) [384500/640000] base_lr: 7.0177e-05 lr: 8.1979e-06 eta: 4 days, 9:13:38 time: 1.4738 data_time: 0.0268 memory: 25719 grad_norm: 3.0855 loss: 1.2261 detection_loss_cls: 0.0306 detection_loss_reg: 0.3353 caption_loss_cls: 2.1435 grounding_loss_reg: 2.4447 semantic_segmentation_loss_cls: 0.0076 instance_segmentation_loss_cls: 0.0292 instance_segmentation_loss_reg: 0.3335 instance_segmentation_loss_poly: 0.8811 +2024/01/08 13:46:22 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240107_135549 +2024/01/08 13:46:22 - mmengine - INFO - Iter(train) [385000/640000] base_lr: 6.9946e-05 lr: 8.1769e-06 eta: 4 days, 9:03:07 time: 1.4824 data_time: 0.0269 memory: 25719 grad_norm: 3.0985 loss: 1.2284 detection_loss_cls: 0.0306 detection_loss_reg: 0.3351 caption_loss_cls: 2.1461 grounding_loss_reg: 2.4415 semantic_segmentation_loss_cls: 0.0076 instance_segmentation_loss_cls: 0.0291 instance_segmentation_loss_reg: 0.3326 instance_segmentation_loss_poly: 0.8801 +2024/01/08 14:47:02 - mmengine - INFO - Iter(train) [385500/640000] base_lr: 6.9715e-05 lr: 8.1559e-06 eta: 4 days, 16:01:23 time: 1.5223 data_time: 0.0216 memory: 25723 grad_norm: 3.0996 loss: 1.2206 detection_loss_cls: 0.0307 detection_loss_reg: 0.3368 caption_loss_cls: 2.1418 grounding_loss_reg: 2.4389 semantic_segmentation_loss_cls: 0.0076 instance_segmentation_loss_cls: 0.0294 instance_segmentation_loss_reg: 0.3342 instance_segmentation_loss_poly: 0.8845 +2024/01/08 15:00:05 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240108_140404 +2024/01/08 15:00:05 - mmengine - INFO - Iter(train) [386000/640000] base_lr: 6.9485e-05 lr: 8.1350e-06 eta: 4 days, 15:26:56 time: 1.5354 data_time: 0.0213 memory: 25723 grad_norm: 3.1529 loss: 1.2175 detection_loss_cls: 0.0306 detection_loss_reg: 0.3370 caption_loss_cls: 2.1365 grounding_loss_reg: 2.4369 semantic_segmentation_loss_cls: 0.0076 instance_segmentation_loss_cls: 0.0293 instance_segmentation_loss_reg: 0.3345 instance_segmentation_loss_poly: 0.8845 +2024/01/08 15:00:05 - mmengine - INFO - Saving checkpoint at 386000 iterations +2024/01/08 15:13:41 - mmengine - INFO - Iter(train) [386500/640000] base_lr: 6.9255e-05 lr: 8.1141e-06 eta: 4 days, 15:57:20 time: 1.5466 data_time: 0.0209 memory: 25723 grad_norm: 3.1787 loss: 1.2243 detection_loss_cls: 0.0305 detection_loss_reg: 0.3358 caption_loss_cls: 2.1357 grounding_loss_reg: 2.4338 semantic_segmentation_loss_cls: 0.0076 instance_segmentation_loss_cls: 0.0293 instance_segmentation_loss_reg: 0.3340 instance_segmentation_loss_poly: 0.8840 +2024/01/08 15:26:46 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240108_140404 +2024/01/08 15:26:46 - mmengine - INFO - Iter(train) [387000/640000] base_lr: 6.9025e-05 lr: 8.0931e-06 eta: 4 days, 15:29:37 time: 1.5559 data_time: 0.0206 memory: 25723 grad_norm: 3.1720 loss: 1.2218 detection_loss_cls: 0.0306 detection_loss_reg: 0.3361 caption_loss_cls: 2.1327 grounding_loss_reg: 2.4312 semantic_segmentation_loss_cls: 0.0076 instance_segmentation_loss_cls: 0.0293 instance_segmentation_loss_reg: 0.3344 instance_segmentation_loss_poly: 0.8846 +2024/01/08 15:39:42 - mmengine - INFO - Iter(train) [387500/640000] base_lr: 6.8795e-05 lr: 8.0722e-06 eta: 4 days, 14:55:41 time: 1.5705 data_time: 0.0203 memory: 25723 grad_norm: 3.2241 loss: 1.2265 detection_loss_cls: 0.0304 detection_loss_reg: 0.3354 caption_loss_cls: 2.1301 grounding_loss_reg: 2.4282 semantic_segmentation_loss_cls: 0.0076 instance_segmentation_loss_cls: 0.0291 instance_segmentation_loss_reg: 0.3329 instance_segmentation_loss_poly: 0.8814 +2024/01/08 15:53:06 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240108_140404 +2024/01/08 15:53:06 - mmengine - INFO - Iter(train) [388000/640000] base_lr: 6.8565e-05 lr: 8.0514e-06 eta: 4 days, 14:55:49 time: 1.5847 data_time: 0.0202 memory: 25723 grad_norm: 3.2337 loss: 1.2186 detection_loss_cls: 0.0304 detection_loss_reg: 0.3351 caption_loss_cls: 2.1269 grounding_loss_reg: 2.4285 semantic_segmentation_loss_cls: 0.0076 instance_segmentation_loss_cls: 0.0291 instance_segmentation_loss_reg: 0.3329 instance_segmentation_loss_poly: 0.8807 +2024/01/08 15:53:06 - mmengine - INFO - Saving checkpoint at 388000 iterations +2024/01/08 16:05:44 - mmengine - INFO - Iter(train) [388500/640000] base_lr: 6.8336e-05 lr: 8.0305e-06 eta: 4 days, 14:10:43 time: 1.5749 data_time: 0.0245 memory: 25723 grad_norm: 3.3269 loss: 1.2276 detection_loss_cls: 0.0305 detection_loss_reg: 0.3355 caption_loss_cls: 2.1220 grounding_loss_reg: 2.4281 semantic_segmentation_loss_cls: 0.0076 instance_segmentation_loss_cls: 0.0291 instance_segmentation_loss_reg: 0.3335 instance_segmentation_loss_poly: 0.8822 +2024/01/08 16:19:18 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240108_140404 +2024/01/08 16:19:18 - mmengine - INFO - Iter(train) [389000/640000] base_lr: 6.8106e-05 lr: 8.0097e-06 eta: 4 days, 14:18:42 time: 1.5781 data_time: 0.0247 memory: 25723 grad_norm: 3.2787 loss: 1.2183 detection_loss_cls: 0.0305 detection_loss_reg: 0.3365 caption_loss_cls: 2.1238 grounding_loss_reg: 2.4263 semantic_segmentation_loss_cls: 0.0076 instance_segmentation_loss_cls: 0.0292 instance_segmentation_loss_reg: 0.3344 instance_segmentation_loss_poly: 0.8844 +2024/01/08 16:32:25 - mmengine - INFO - Iter(train) [389500/640000] base_lr: 6.7877e-05 lr: 7.9888e-06 eta: 4 days, 14:01:51 time: 1.5800 data_time: 0.0248 memory: 25723 grad_norm: 3.2959 loss: 1.2252 detection_loss_cls: 0.0304 detection_loss_reg: 0.3370 caption_loss_cls: 2.1237 grounding_loss_reg: 2.4260 semantic_segmentation_loss_cls: 0.0076 instance_segmentation_loss_cls: 0.0291 instance_segmentation_loss_reg: 0.3344 instance_segmentation_loss_poly: 0.8841 +2024/01/08 16:45:27 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240108_140404 +2024/01/08 16:45:27 - mmengine - INFO - Iter(train) [390000/640000] base_lr: 6.7648e-05 lr: 7.9680e-06 eta: 4 days, 13:42:24 time: 1.5799 data_time: 0.0250 memory: 25723 grad_norm: 3.2873 loss: 1.2306 detection_loss_cls: 0.0305 detection_loss_reg: 0.3367 caption_loss_cls: 2.1186 grounding_loss_reg: 2.4253 semantic_segmentation_loss_cls: 0.0076 instance_segmentation_loss_cls: 0.0292 instance_segmentation_loss_reg: 0.3346 instance_segmentation_loss_poly: 0.8848 +2024/01/08 16:45:27 - mmengine - INFO - Saving checkpoint at 390000 iterations +2024/01/08 16:58:20 - mmengine - INFO - Iter(train) [390500/640000] base_lr: 6.7420e-05 lr: 7.9472e-06 eta: 4 days, 13:18:01 time: 1.5691 data_time: 0.0248 memory: 25723 grad_norm: 3.3043 loss: 1.2314 detection_loss_cls: 0.0305 detection_loss_reg: 0.3372 caption_loss_cls: 2.1226 grounding_loss_reg: 2.4250 semantic_segmentation_loss_cls: 0.0076 instance_segmentation_loss_cls: 0.0292 instance_segmentation_loss_reg: 0.3347 instance_segmentation_loss_poly: 0.8845 +2024/01/08 17:11:17 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240108_140404 +2024/01/08 17:11:17 - mmengine - INFO - Iter(train) [391000/640000] base_lr: 6.7191e-05 lr: 7.9265e-06 eta: 4 days, 12:58:16 time: 1.5672 data_time: 0.0248 memory: 25723 grad_norm: 3.3164 loss: 1.2235 detection_loss_cls: 0.0305 detection_loss_reg: 0.3361 caption_loss_cls: 2.1191 grounding_loss_reg: 2.4208 semantic_segmentation_loss_cls: 0.0076 instance_segmentation_loss_cls: 0.0291 instance_segmentation_loss_reg: 0.3337 instance_segmentation_loss_poly: 0.8832 +2024/01/08 17:24:35 - mmengine - INFO - Iter(train) [391500/640000] base_lr: 6.6963e-05 lr: 7.9057e-06 eta: 4 days, 12:50:14 time: 1.5725 data_time: 0.0250 memory: 25723 grad_norm: 3.2845 loss: 1.2256 detection_loss_cls: 0.0304 detection_loss_reg: 0.3364 caption_loss_cls: 2.1120 grounding_loss_reg: 2.4210 semantic_segmentation_loss_cls: 0.0075 instance_segmentation_loss_cls: 0.0291 instance_segmentation_loss_reg: 0.3342 instance_segmentation_loss_poly: 0.8848 +2024/01/08 17:37:41 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240108_140404 +2024/01/08 17:37:41 - mmengine - INFO - Iter(train) [392000/640000] base_lr: 6.6735e-05 lr: 7.8850e-06 eta: 4 days, 12:35:54 time: 1.5681 data_time: 0.0251 memory: 25723 grad_norm: 3.3059 loss: 1.2349 detection_loss_cls: 0.0303 detection_loss_reg: 0.3351 caption_loss_cls: 2.1111 grounding_loss_reg: 2.4155 semantic_segmentation_loss_cls: 0.0075 instance_segmentation_loss_cls: 0.0290 instance_segmentation_loss_reg: 0.3326 instance_segmentation_loss_poly: 0.8811 +2024/01/08 17:37:41 - mmengine - INFO - Saving checkpoint at 392000 iterations +2024/01/08 17:50:49 - mmengine - INFO - Iter(train) [392500/640000] base_lr: 6.6507e-05 lr: 7.8643e-06 eta: 4 days, 12:22:30 time: 1.5755 data_time: 0.0251 memory: 25723 grad_norm: 3.1810 loss: 1.2253 detection_loss_cls: 0.0304 detection_loss_reg: 0.3358 caption_loss_cls: 2.1131 grounding_loss_reg: 2.4137 semantic_segmentation_loss_cls: 0.0075 instance_segmentation_loss_cls: 0.0290 instance_segmentation_loss_reg: 0.3326 instance_segmentation_loss_poly: 0.8821 +2024/01/08 18:03:46 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240108_140404 +2024/01/08 18:03:46 - mmengine - INFO - Iter(train) [393000/640000] base_lr: 6.6279e-05 lr: 7.8436e-06 eta: 4 days, 12:04:07 time: 1.5663 data_time: 0.0249 memory: 25723 grad_norm: 3.2190 loss: 1.2224 detection_loss_cls: 0.0303 detection_loss_reg: 0.3350 caption_loss_cls: 2.1092 grounding_loss_reg: 2.4117 semantic_segmentation_loss_cls: 0.0075 instance_segmentation_loss_cls: 0.0289 instance_segmentation_loss_reg: 0.3323 instance_segmentation_loss_poly: 0.8806 +2024/01/08 18:17:42 - mmengine - INFO - Iter(train) [393500/640000] base_lr: 6.6052e-05 lr: 7.8229e-06 eta: 4 days, 12:11:51 time: 1.5786 data_time: 0.0251 memory: 25723 grad_norm: 3.1486 loss: 1.2100 detection_loss_cls: 0.0302 detection_loss_reg: 0.3347 caption_loss_cls: 2.1061 grounding_loss_reg: 2.4115 semantic_segmentation_loss_cls: 0.0075 instance_segmentation_loss_cls: 0.0289 instance_segmentation_loss_reg: 0.3324 instance_segmentation_loss_poly: 0.8803 +2024/01/08 18:30:42 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240108_140404 +2024/01/08 18:30:42 - mmengine - INFO - Iter(train) [394000/640000] base_lr: 6.5825e-05 lr: 7.8022e-06 eta: 4 days, 11:54:17 time: 1.5781 data_time: 0.0251 memory: 25723 grad_norm: 3.1297 loss: 1.2051 detection_loss_cls: 0.0301 detection_loss_reg: 0.3350 caption_loss_cls: 2.1076 grounding_loss_reg: 2.4071 semantic_segmentation_loss_cls: 0.0075 instance_segmentation_loss_cls: 0.0288 instance_segmentation_loss_reg: 0.3319 instance_segmentation_loss_poly: 0.8793 +2024/01/08 18:30:42 - mmengine - INFO - Saving checkpoint at 394000 iterations +2024/01/08 18:44:37 - mmengine - INFO - Iter(train) [394500/640000] base_lr: 6.5598e-05 lr: 7.7816e-06 eta: 4 days, 11:58:41 time: 1.5936 data_time: 0.0251 memory: 25723 grad_norm: 3.0783 loss: 1.1844 detection_loss_cls: 0.0301 detection_loss_reg: 0.3344 caption_loss_cls: 2.1047 grounding_loss_reg: 2.4060 semantic_segmentation_loss_cls: 0.0075 instance_segmentation_loss_cls: 0.0288 instance_segmentation_loss_reg: 0.3313 instance_segmentation_loss_poly: 0.8792 +2024/01/08 18:58:12 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240108_140404 +2024/01/08 18:58:12 - mmengine - INFO - Iter(train) [395000/640000] base_lr: 6.5371e-05 lr: 7.7610e-06 eta: 4 days, 11:54:00 time: 1.6029 data_time: 0.0252 memory: 25723 grad_norm: 3.1102 loss: 1.1799 detection_loss_cls: 0.0302 detection_loss_reg: 0.3355 caption_loss_cls: 2.1035 grounding_loss_reg: 2.4003 semantic_segmentation_loss_cls: 0.0075 instance_segmentation_loss_cls: 0.0288 instance_segmentation_loss_reg: 0.3310 instance_segmentation_loss_poly: 0.8779 +2024/01/08 19:11:17 - mmengine - INFO - Iter(train) [395500/640000] base_lr: 6.5144e-05 lr: 7.7404e-06 eta: 4 days, 11:37:59 time: 1.5999 data_time: 0.0252 memory: 25723 grad_norm: 3.1445 loss: 1.1780 detection_loss_cls: 0.0302 detection_loss_reg: 0.3354 caption_loss_cls: 2.0983 grounding_loss_reg: 2.3971 semantic_segmentation_loss_cls: 0.0075 instance_segmentation_loss_cls: 0.0290 instance_segmentation_loss_reg: 0.3336 instance_segmentation_loss_poly: 0.8831 +2024/01/08 19:23:28 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240108_140404 +2024/01/08 19:23:28 - mmengine - INFO - Iter(train) [396000/640000] base_lr: 6.4918e-05 lr: 7.7198e-06 eta: 4 days, 11:03:37 time: 1.5859 data_time: 0.0251 memory: 25723 grad_norm: 3.1646 loss: 1.1853 detection_loss_cls: 0.0303 detection_loss_reg: 0.3363 caption_loss_cls: 2.0963 grounding_loss_reg: 2.3939 semantic_segmentation_loss_cls: 0.0075 instance_segmentation_loss_cls: 0.0289 instance_segmentation_loss_reg: 0.3335 instance_segmentation_loss_poly: 0.8835 +2024/01/08 19:23:28 - mmengine - INFO - Saving checkpoint at 396000 iterations +2024/01/08 19:37:06 - mmengine - INFO - Iter(train) [396500/640000] base_lr: 6.4692e-05 lr: 7.6992e-06 eta: 4 days, 10:59:29 time: 1.5934 data_time: 0.0252 memory: 25723 grad_norm: 3.1887 loss: 1.1845 detection_loss_cls: 0.0303 detection_loss_reg: 0.3359 caption_loss_cls: 2.0944 grounding_loss_reg: 2.3924 semantic_segmentation_loss_cls: 0.0075 instance_segmentation_loss_cls: 0.0289 instance_segmentation_loss_reg: 0.3334 instance_segmentation_loss_poly: 0.8837 +2024/01/08 19:49:33 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240108_140404 +2024/01/08 19:49:33 - mmengine - INFO - Iter(train) [397000/640000] base_lr: 6.4466e-05 lr: 7.6787e-06 eta: 4 days, 10:32:39 time: 1.5860 data_time: 0.0250 memory: 25723 grad_norm: 3.2309 loss: 1.1870 detection_loss_cls: 0.0303 detection_loss_reg: 0.3354 caption_loss_cls: 2.0931 grounding_loss_reg: 2.3903 semantic_segmentation_loss_cls: 0.0076 instance_segmentation_loss_cls: 0.0288 instance_segmentation_loss_reg: 0.3329 instance_segmentation_loss_poly: 0.8827 +2024/01/08 20:02:30 - mmengine - INFO - Iter(train) [397500/640000] base_lr: 6.4240e-05 lr: 7.6582e-06 eta: 4 days, 10:15:37 time: 1.5711 data_time: 0.0249 memory: 25723 grad_norm: 3.2674 loss: 1.2032 detection_loss_cls: 0.0303 detection_loss_reg: 0.3348 caption_loss_cls: 2.0976 grounding_loss_reg: 2.3890 semantic_segmentation_loss_cls: 0.0076 instance_segmentation_loss_cls: 0.0288 instance_segmentation_loss_reg: 0.3325 instance_segmentation_loss_poly: 0.8820 +2024/01/08 20:15:50 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240108_140404 +2024/01/08 20:15:50 - mmengine - INFO - Iter(train) [398000/640000] base_lr: 6.4015e-05 lr: 7.6377e-06 eta: 4 days, 10:05:47 time: 1.5763 data_time: 0.0250 memory: 25723 grad_norm: 3.2330 loss: 1.2046 detection_loss_cls: 0.0301 detection_loss_reg: 0.3335 caption_loss_cls: 2.0991 grounding_loss_reg: 2.3873 semantic_segmentation_loss_cls: 0.0076 instance_segmentation_loss_cls: 0.0286 instance_segmentation_loss_reg: 0.3304 instance_segmentation_loss_poly: 0.8780 +2024/01/08 20:15:50 - mmengine - INFO - Saving checkpoint at 398000 iterations +2024/01/08 20:28:54 - mmengine - INFO - Iter(train) [398500/640000] base_lr: 6.3789e-05 lr: 7.6172e-06 eta: 4 days, 9:51:05 time: 1.5635 data_time: 0.0250 memory: 25723 grad_norm: 3.2685 loss: 1.2254 detection_loss_cls: 0.0302 detection_loss_reg: 0.3336 caption_loss_cls: 2.0963 grounding_loss_reg: 2.3863 semantic_segmentation_loss_cls: 0.0076 instance_segmentation_loss_cls: 0.0287 instance_segmentation_loss_reg: 0.3307 instance_segmentation_loss_poly: 0.8787 +2024/01/08 20:41:45 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240108_140404 +2024/01/08 20:41:45 - mmengine - INFO - Iter(train) [399000/640000] base_lr: 6.3564e-05 lr: 7.5967e-06 eta: 4 days, 9:33:01 time: 1.5525 data_time: 0.0249 memory: 25723 grad_norm: 3.2236 loss: 1.2358 detection_loss_cls: 0.0301 detection_loss_reg: 0.3329 caption_loss_cls: 2.0965 grounding_loss_reg: 2.3876 semantic_segmentation_loss_cls: 0.0076 instance_segmentation_loss_cls: 0.0287 instance_segmentation_loss_reg: 0.3298 instance_segmentation_loss_poly: 0.8755 +2024/01/08 20:54:51 - mmengine - INFO - Iter(train) [399500/640000] base_lr: 6.3339e-05 lr: 7.5763e-06 eta: 4 days, 9:19:09 time: 1.5527 data_time: 0.0249 memory: 25723 grad_norm: 3.1976 loss: 1.2370 detection_loss_cls: 0.0300 detection_loss_reg: 0.3332 caption_loss_cls: 2.0957 grounding_loss_reg: 2.3870 semantic_segmentation_loss_cls: 0.0076 instance_segmentation_loss_cls: 0.0287 instance_segmentation_loss_reg: 0.3300 instance_segmentation_loss_poly: 0.8748 +2024/01/08 21:08:01 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240108_140404 +2024/01/08 21:08:01 - mmengine - INFO - Iter(train) [400000/640000] base_lr: 6.3115e-05 lr: 7.5559e-06 eta: 4 days, 9:06:16 time: 1.5675 data_time: 0.0249 memory: 25723 grad_norm: 3.1369 loss: 1.2287 detection_loss_cls: 0.0300 detection_loss_reg: 0.3329 caption_loss_cls: 2.0976 grounding_loss_reg: 2.3846 semantic_segmentation_loss_cls: 0.0076 instance_segmentation_loss_cls: 0.0288 instance_segmentation_loss_reg: 0.3293 instance_segmentation_loss_poly: 0.8733 +2024/01/08 21:08:01 - mmengine - INFO - Saving checkpoint at 400000 iterations +2024/01/08 21:20:18 - mmengine - INFO - Evaluating bbox... +2024/01/08 21:21:14 - mmengine - INFO - bbox_mAP_copypaste: 0.499 0.678 0.545 0.338 0.549 0.638 +2024/01/08 21:21:14 - mmengine - INFO - Evaluating segm... +2024/01/08 21:22:28 - mmengine - INFO - segm_mAP_copypaste: 0.333 0.595 0.328 0.186 0.382 0.506 +2024/01/08 21:29:33 - mmengine - INFO - per class results: +2024/01/08 21:29:33 - mmengine - INFO - ++---------------------+-------+-------+ +| Class | IoU | Acc | ++---------------------+-------+-------+ +| wall | 78.33 | 88.06 | +| building | 83.46 | 92.36 | +| sky | 93.69 | 98.07 | +| floor | 82.59 | 91.09 | +| tree | 73.6 | 87.38 | +| ceiling | 84.19 | 94.73 | +| road | 83.45 | 90.49 | +| bed | 90.2 | 95.56 | +| windowpane | 63.53 | 80.37 | +| grass | 64.97 | 83.84 | +| cabinet | 60.83 | 74.94 | +| sidewalk | 66.64 | 80.02 | +| person | 81.69 | 91.69 | +| earth | 37.69 | 47.9 | +| door | 53.84 | 72.36 | +| table | 64.73 | 76.88 | +| mountain | 62.35 | 78.67 | +| plant | 50.49 | 58.76 | +| curtain | 73.6 | 86.21 | +| chair | 60.29 | 72.49 | +| car | 84.95 | 92.06 | +| water | 51.32 | 67.83 | +| painting | 70.84 | 88.22 | +| sofa | 70.09 | 85.23 | +| shelf | 46.03 | 63.89 | +| house | 42.75 | 58.37 | +| sea | 47.14 | 68.78 | +| mirror | 67.33 | 76.5 | +| rug | 65.59 | 74.34 | +| field | 25.43 | 39.35 | +| armchair | 47.42 | 65.96 | +| seat | 63.14 | 82.16 | +| fence | 49.45 | 63.58 | +| desk | 52.64 | 71.35 | +| rock | 48.04 | 74.52 | +| wardrobe | 45.49 | 59.49 | +| lamp | 62.83 | 75.27 | +| bathtub | 81.08 | 84.76 | +| railing | 36.83 | 54.22 | +| cushion | 57.36 | 65.8 | +| base | 25.6 | 32.69 | +| box | 29.17 | 42.47 | +| column | 48.81 | 64.52 | +| signboard | 38.54 | 52.3 | +| chest of drawers | 36.51 | 57.22 | +| counter | 38.14 | 52.59 | +| sand | 42.14 | 70.79 | +| sink | 73.52 | 81.49 | +| skyscraper | 65.13 | 82.84 | +| fireplace | 73.35 | 90.58 | +| refrigerator | 72.85 | 80.03 | +| grandstand | 43.52 | 75.79 | +| path | 23.82 | 36.34 | +| stairs | 30.17 | 40.99 | +| runway | 72.85 | 89.83 | +| case | 50.19 | 69.84 | +| pool table | 87.63 | 97.4 | +| pillow | 58.44 | 71.44 | +| screen door | 72.41 | 74.41 | +| stairway | 36.21 | 51.21 | +| river | 16.72 | 23.61 | +| bridge | 70.32 | 89.01 | +| bookcase | 39.1 | 62.52 | +| blind | 42.02 | 49.04 | +| coffee table | 62.55 | 83.79 | +| toilet | 87.78 | 91.52 | +| flower | 39.17 | 56.39 | +| book | 47.61 | 68.39 | +| hill | 15.64 | 24.3 | +| bench | 57.52 | 70.58 | +| countertop | 57.19 | 70.52 | +| stove | 77.94 | 85.33 | +| palm | 43.11 | 58.08 | +| kitchen island | 46.6 | 84.93 | +| computer | 70.42 | 80.2 | +| swivel chair | 36.53 | 48.48 | +| boat | 78.23 | 84.28 | +| bar | 29.7 | 40.65 | +| arcade machine | 51.11 | 54.19 | +| hovel | 15.94 | 16.69 | +| bus | 91.64 | 93.8 | +| towel | 62.67 | 74.7 | +| light | 51.0 | 59.28 | +| truck | 43.0 | 59.19 | +| tower | 26.57 | 37.89 | +| chandelier | 63.75 | 74.77 | +| awning | 30.53 | 38.5 | +| streetlight | 33.02 | 48.82 | +| booth | 33.76 | 38.34 | +| television receiver | 69.72 | 82.36 | +| airplane | 60.91 | 65.25 | +| dirt track | 17.33 | 24.7 | +| apparel | 31.48 | 42.08 | +| pole | 27.61 | 41.55 | +| land | 2.83 | 4.79 | +| bannister | 16.39 | 21.21 | +| escalator | 25.26 | 27.83 | +| ottoman | 53.21 | 66.52 | +| bottle | 21.39 | 25.21 | +| buffet | 43.73 | 56.24 | +| poster | 32.97 | 43.35 | +| stage | 12.16 | 19.19 | +| van | 45.41 | 58.42 | +| ship | 10.42 | 11.42 | +| fountain | 14.47 | 15.07 | +| conveyer belt | 78.88 | 91.66 | +| canopy | 24.6 | 26.74 | +| washer | 70.72 | 72.05 | +| plaything | 22.83 | 25.6 | +| swimming pool | 62.71 | 74.9 | +| stool | 50.69 | 59.23 | +| barrel | 29.94 | 54.02 | +| basket | 32.14 | 49.08 | +| waterfall | 51.94 | 69.97 | +| tent | 89.24 | 97.09 | +| bag | 19.56 | 25.57 | +| minibike | 73.58 | 84.5 | +| cradle | 76.67 | 95.69 | +| oven | 59.47 | 71.62 | +| ball | 45.02 | 55.2 | +| food | 49.2 | 53.95 | +| step | 16.15 | 25.74 | +| tank | 35.69 | 39.62 | +| trade name | 26.26 | 31.51 | +| microwave | 86.02 | 93.79 | +| pot | 47.61 | 54.56 | +| animal | 59.19 | 61.49 | +| bicycle | 57.16 | 73.49 | +| lake | 56.64 | 63.9 | +| dishwasher | 58.25 | 71.9 | +| screen | 55.37 | 71.68 | +| blanket | 15.62 | 19.54 | +| sculpture | 54.69 | 68.87 | +| hood | 56.95 | 68.56 | +| sconce | 46.67 | 60.04 | +| vase | 43.2 | 59.91 | +| traffic light | 40.56 | 64.99 | +| tray | 7.32 | 13.79 | +| ashcan | 45.49 | 65.42 | +| fan | 60.16 | 71.49 | +| pier | 22.96 | 41.27 | +| crt screen | 12.2 | 19.71 | +| plate | 56.34 | 75.6 | +| monitor | 26.69 | 35.8 | +| bulletin board | 29.88 | 32.47 | +| shower | 1.13 | 1.46 | +| radiator | 58.21 | 66.25 | +| glass | 19.38 | 21.29 | +| clock | 28.58 | 35.52 | +| flag | 35.37 | 42.75 | ++---------------------+-------+-------+ +2024/01/08 21:29:51 - mmengine - INFO - Iter(val) [209/209] coco/bbox_mAP: 0.4990 coco/bbox_mAP_50: 0.6780 coco/bbox_mAP_75: 0.5450 coco/bbox_mAP_s: 0.3380 coco/bbox_mAP_m: 0.5490 coco/bbox_mAP_l: 0.6380 coco/segm_mAP: 0.3330 coco/segm_mAP_50: 0.5950 coco/segm_mAP_75: 0.3280 coco/segm_mAP_s: 0.1860 coco/segm_mAP_m: 0.3820 coco/segm_mAP_l: 0.5060 Bleu_1: 0.7573 Bleu_2: 0.5918 Bleu_3: 0.4497 Bleu_4: 0.3380 METEOR: 0.2679 ROUGE_L: 0.5553 CIDEr: 1.0829 SPICE: 0.2001 aAcc: 83.5500 mIoU: 49.6600 mAcc: 61.3400 visual-grounding/miou: 0.8123 visual-grounding/acc: 0.8778 data_time: 0.0107 time: 1.3587 +2024/01/08 21:42:36 - mmengine - INFO - Iter(train) [400500/640000] base_lr: 6.2890e-05 lr: 7.5355e-06 eta: 4 days, 8:48:02 time: 1.5549 data_time: 0.0212 memory: 25726 grad_norm: 3.1157 loss: 1.2287 detection_loss_cls: 0.0300 detection_loss_reg: 0.3322 caption_loss_cls: 2.1008 grounding_loss_reg: 2.3846 semantic_segmentation_loss_cls: 0.0076 instance_segmentation_loss_cls: 0.0288 instance_segmentation_loss_reg: 0.3301 instance_segmentation_loss_poly: 0.8751 +2024/01/08 21:56:25 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240108_140404 +2024/01/08 21:56:25 - mmengine - INFO - Iter(train) [401000/640000] base_lr: 6.2666e-05 lr: 7.5151e-06 eta: 4 days, 8:44:36 time: 1.5754 data_time: 0.0220 memory: 25726 grad_norm: 3.0436 loss: 1.2230 detection_loss_cls: 0.0302 detection_loss_reg: 0.3326 caption_loss_cls: 2.0978 grounding_loss_reg: 2.3846 semantic_segmentation_loss_cls: 0.0075 instance_segmentation_loss_cls: 0.0288 instance_segmentation_loss_reg: 0.3297 instance_segmentation_loss_poly: 0.8749 +2024/01/08 22:09:31 - mmengine - INFO - Iter(train) [401500/640000] base_lr: 6.2442e-05 lr: 7.4948e-06 eta: 4 days, 8:30:36 time: 1.5776 data_time: 0.0221 memory: 25726 grad_norm: 3.0366 loss: 1.2210 detection_loss_cls: 0.0301 detection_loss_reg: 0.3322 caption_loss_cls: 2.0938 grounding_loss_reg: 2.3807 semantic_segmentation_loss_cls: 0.0075 instance_segmentation_loss_cls: 0.0288 instance_segmentation_loss_reg: 0.3291 instance_segmentation_loss_poly: 0.8741 +2024/01/08 22:22:04 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240108_140404 +2024/01/08 22:22:04 - mmengine - INFO - Iter(train) [402000/640000] base_lr: 6.2219e-05 lr: 7.4744e-06 eta: 4 days, 8:09:28 time: 1.5657 data_time: 0.0222 memory: 25726 grad_norm: 3.0612 loss: 1.2197 detection_loss_cls: 0.0300 detection_loss_reg: 0.3308 caption_loss_cls: 2.0938 grounding_loss_reg: 2.3789 semantic_segmentation_loss_cls: 0.0075 instance_segmentation_loss_cls: 0.0287 instance_segmentation_loss_reg: 0.3282 instance_segmentation_loss_poly: 0.8720 +2024/01/08 22:22:04 - mmengine - INFO - Saving checkpoint at 402000 iterations +2024/01/08 22:34:58 - mmengine - INFO - Iter(train) [402500/640000] base_lr: 6.1995e-05 lr: 7.4541e-06 eta: 4 days, 7:53:17 time: 1.5632 data_time: 0.0231 memory: 25726 grad_norm: 3.1023 loss: 1.2165 detection_loss_cls: 0.0300 detection_loss_reg: 0.3309 caption_loss_cls: 2.0897 grounding_loss_reg: 2.3772 semantic_segmentation_loss_cls: 0.0075 instance_segmentation_loss_cls: 0.0286 instance_segmentation_loss_reg: 0.3276 instance_segmentation_loss_poly: 0.8713 +2024/01/08 22:48:33 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240108_140404 +2024/01/08 22:48:33 - mmengine - INFO - Iter(train) [403000/640000] base_lr: 6.1772e-05 lr: 7.4338e-06 eta: 4 days, 7:45:51 time: 1.5742 data_time: 0.0235 memory: 25726 grad_norm: 3.0968 loss: 1.2100 detection_loss_cls: 0.0300 detection_loss_reg: 0.3309 caption_loss_cls: 2.0906 grounding_loss_reg: 2.3745 semantic_segmentation_loss_cls: 0.0075 instance_segmentation_loss_cls: 0.0286 instance_segmentation_loss_reg: 0.3283 instance_segmentation_loss_poly: 0.8733 +2024/01/08 23:02:34 - mmengine - INFO - Iter(train) [403500/640000] base_lr: 6.1549e-05 lr: 7.4135e-06 eta: 4 days, 7:43:27 time: 1.5881 data_time: 0.0239 memory: 25726 grad_norm: 3.0481 loss: 1.2004 detection_loss_cls: 0.0298 detection_loss_reg: 0.3299 caption_loss_cls: 2.0888 grounding_loss_reg: 2.3752 semantic_segmentation_loss_cls: 0.0075 instance_segmentation_loss_cls: 0.0285 instance_segmentation_loss_reg: 0.3282 instance_segmentation_loss_poly: 0.8726 +2024/01/08 23:15:38 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240108_140404 +2024/01/08 23:15:38 - mmengine - INFO - Iter(train) [404000/640000] base_lr: 6.1326e-05 lr: 7.3933e-06 eta: 4 days, 7:29:04 time: 1.5866 data_time: 0.0243 memory: 25726 grad_norm: 3.0665 loss: 1.2042 detection_loss_cls: 0.0299 detection_loss_reg: 0.3306 caption_loss_cls: 2.0882 grounding_loss_reg: 2.3731 semantic_segmentation_loss_cls: 0.0075 instance_segmentation_loss_cls: 0.0284 instance_segmentation_loss_reg: 0.3267 instance_segmentation_loss_poly: 0.8684 +2024/01/08 23:15:38 - mmengine - INFO - Saving checkpoint at 404000 iterations +2024/01/08 23:29:20 - mmengine - INFO - Iter(train) [404500/640000] base_lr: 6.1104e-05 lr: 7.3731e-06 eta: 4 days, 7:22:03 time: 1.6002 data_time: 0.0285 memory: 25726 grad_norm: 3.0540 loss: 1.2003 detection_loss_cls: 0.0299 detection_loss_reg: 0.3302 caption_loss_cls: 2.0841 grounding_loss_reg: 2.3726 semantic_segmentation_loss_cls: 0.0075 instance_segmentation_loss_cls: 0.0284 instance_segmentation_loss_reg: 0.3272 instance_segmentation_loss_poly: 0.8689 +2024/01/08 23:42:06 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240108_140404 +2024/01/08 23:42:06 - mmengine - INFO - Iter(train) [405000/640000] base_lr: 6.0882e-05 lr: 7.3529e-06 eta: 4 days, 7:04:21 time: 1.5843 data_time: 0.0281 memory: 25726 grad_norm: 3.0810 loss: 1.2060 detection_loss_cls: 0.0300 detection_loss_reg: 0.3311 caption_loss_cls: 2.0893 grounding_loss_reg: 2.3705 semantic_segmentation_loss_cls: 0.0075 instance_segmentation_loss_cls: 0.0284 instance_segmentation_loss_reg: 0.3267 instance_segmentation_loss_poly: 0.8683 +2024/01/08 23:55:23 - mmengine - INFO - Iter(train) [405500/640000] base_lr: 6.0660e-05 lr: 7.3327e-06 eta: 4 days, 6:52:30 time: 1.5872 data_time: 0.0283 memory: 25726 grad_norm: 3.0835 loss: 1.2074 detection_loss_cls: 0.0299 detection_loss_reg: 0.3303 caption_loss_cls: 2.0906 grounding_loss_reg: 2.3674 semantic_segmentation_loss_cls: 0.0075 instance_segmentation_loss_cls: 0.0284 instance_segmentation_loss_reg: 0.3268 instance_segmentation_loss_poly: 0.8677 +2024/01/09 00:09:05 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240108_140404 +2024/01/09 00:09:05 - mmengine - INFO - Iter(train) [406000/640000] base_lr: 6.0438e-05 lr: 7.3125e-06 eta: 4 days, 6:44:58 time: 1.6045 data_time: 0.0284 memory: 25726 grad_norm: 3.0348 loss: 1.1909 detection_loss_cls: 0.0300 detection_loss_reg: 0.3293 caption_loss_cls: 2.0879 grounding_loss_reg: 2.3675 semantic_segmentation_loss_cls: 0.0075 instance_segmentation_loss_cls: 0.0282 instance_segmentation_loss_reg: 0.3249 instance_segmentation_loss_poly: 0.8639 +2024/01/09 00:09:05 - mmengine - INFO - Saving checkpoint at 406000 iterations +2024/01/09 00:22:32 - mmengine - INFO - Iter(train) [406500/640000] base_lr: 6.0216e-05 lr: 7.2924e-06 eta: 4 days, 6:34:38 time: 1.6128 data_time: 0.0282 memory: 25726 grad_norm: 3.0048 loss: 1.1935 detection_loss_cls: 0.0301 detection_loss_reg: 0.3306 caption_loss_cls: 2.0867 grounding_loss_reg: 2.3693 semantic_segmentation_loss_cls: 0.0075 instance_segmentation_loss_cls: 0.0284 instance_segmentation_loss_reg: 0.3265 instance_segmentation_loss_poly: 0.8671 +2024/01/09 00:35:12 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240108_140404 +2024/01/09 00:35:12 - mmengine - INFO - Iter(train) [407000/640000] base_lr: 5.9995e-05 lr: 7.2723e-06 eta: 4 days, 6:16:16 time: 1.5991 data_time: 0.0279 memory: 25726 grad_norm: 2.9831 loss: 1.1982 detection_loss_cls: 0.0301 detection_loss_reg: 0.3305 caption_loss_cls: 2.0872 grounding_loss_reg: 2.3713 semantic_segmentation_loss_cls: 0.0075 instance_segmentation_loss_cls: 0.0283 instance_segmentation_loss_reg: 0.3254 instance_segmentation_loss_poly: 0.8641 +2024/01/09 00:47:56 - mmengine - INFO - Iter(train) [407500/640000] base_lr: 5.9774e-05 lr: 7.2522e-06 eta: 4 days, 5:58:43 time: 1.5797 data_time: 0.0276 memory: 25726 grad_norm: 3.0296 loss: 1.2081 detection_loss_cls: 0.0301 detection_loss_reg: 0.3304 caption_loss_cls: 2.0893 grounding_loss_reg: 2.3723 semantic_segmentation_loss_cls: 0.0075 instance_segmentation_loss_cls: 0.0284 instance_segmentation_loss_reg: 0.3262 instance_segmentation_loss_poly: 0.8652 +2024/01/09 01:00:20 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240108_140404 +2024/01/09 01:00:20 - mmengine - INFO - Iter(train) [408000/640000] base_lr: 5.9553e-05 lr: 7.2321e-06 eta: 4 days, 5:38:07 time: 1.5697 data_time: 0.0272 memory: 25726 grad_norm: 3.0419 loss: 1.2059 detection_loss_cls: 0.0302 detection_loss_reg: 0.3307 caption_loss_cls: 2.0916 grounding_loss_reg: 2.3727 semantic_segmentation_loss_cls: 0.0075 instance_segmentation_loss_cls: 0.0284 instance_segmentation_loss_reg: 0.3256 instance_segmentation_loss_poly: 0.8638 +2024/01/09 01:00:20 - mmengine - INFO - Saving checkpoint at 408000 iterations +2024/01/09 01:13:33 - mmengine - INFO - Iter(train) [408500/640000] base_lr: 5.9333e-05 lr: 7.2121e-06 eta: 4 days, 5:25:36 time: 1.5625 data_time: 0.0273 memory: 25726 grad_norm: 3.0810 loss: 1.2121 detection_loss_cls: 0.0301 detection_loss_reg: 0.3301 caption_loss_cls: 2.0876 grounding_loss_reg: 2.3724 semantic_segmentation_loss_cls: 0.0075 instance_segmentation_loss_cls: 0.0284 instance_segmentation_loss_reg: 0.3258 instance_segmentation_loss_poly: 0.8642 +2024/01/09 01:27:03 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240108_140404 +2024/01/09 01:27:03 - mmengine - INFO - Iter(train) [409000/640000] base_lr: 5.9112e-05 lr: 7.1920e-06 eta: 4 days, 5:15:42 time: 1.5735 data_time: 0.0275 memory: 25726 grad_norm: 3.0569 loss: 1.2033 detection_loss_cls: 0.0299 detection_loss_reg: 0.3282 caption_loss_cls: 2.0873 grounding_loss_reg: 2.3717 semantic_segmentation_loss_cls: 0.0075 instance_segmentation_loss_cls: 0.0284 instance_segmentation_loss_reg: 0.3244 instance_segmentation_loss_poly: 0.8613 +2024/01/09 01:40:32 - mmengine - INFO - Iter(train) [409500/640000] base_lr: 5.8892e-05 lr: 7.1720e-06 eta: 4 days, 5:05:36 time: 1.5766 data_time: 0.0275 memory: 25726 grad_norm: 3.0380 loss: 1.1884 detection_loss_cls: 0.0298 detection_loss_reg: 0.3279 caption_loss_cls: 2.0847 grounding_loss_reg: 2.3698 semantic_segmentation_loss_cls: 0.0075 instance_segmentation_loss_cls: 0.0283 instance_segmentation_loss_reg: 0.3235 instance_segmentation_loss_poly: 0.8586 +2024/01/09 01:54:02 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240108_140404 +2024/01/09 01:54:02 - mmengine - INFO - Iter(train) [410000/640000] base_lr: 5.8672e-05 lr: 7.1520e-06 eta: 4 days, 4:55:23 time: 1.5736 data_time: 0.0277 memory: 25726 grad_norm: 3.0837 loss: 1.2019 detection_loss_cls: 0.0299 detection_loss_reg: 0.3285 caption_loss_cls: 2.0804 grounding_loss_reg: 2.3685 semantic_segmentation_loss_cls: 0.0075 instance_segmentation_loss_cls: 0.0282 instance_segmentation_loss_reg: 0.3237 instance_segmentation_loss_poly: 0.8585 +2024/01/09 01:54:02 - mmengine - INFO - Saving checkpoint at 410000 iterations +2024/01/09 02:07:49 - mmengine - INFO - Iter(train) [410500/640000] base_lr: 5.8453e-05 lr: 7.1321e-06 eta: 4 days, 4:47:33 time: 1.5786 data_time: 0.0279 memory: 25726 grad_norm: 3.0593 loss: 1.1877 detection_loss_cls: 0.0297 detection_loss_reg: 0.3279 caption_loss_cls: 2.0796 grounding_loss_reg: 2.3667 semantic_segmentation_loss_cls: 0.0075 instance_segmentation_loss_cls: 0.0282 instance_segmentation_loss_reg: 0.3237 instance_segmentation_loss_poly: 0.8583 +2024/01/09 02:21:26 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240108_140404 +2024/01/09 02:21:26 - mmengine - INFO - Iter(train) [411000/640000] base_lr: 5.8234e-05 lr: 7.1122e-06 eta: 4 days, 4:38:00 time: 1.5927 data_time: 0.0283 memory: 25726 grad_norm: 3.0766 loss: 1.1861 detection_loss_cls: 0.0299 detection_loss_reg: 0.3298 caption_loss_cls: 2.0819 grounding_loss_reg: 2.3669 semantic_segmentation_loss_cls: 0.0075 instance_segmentation_loss_cls: 0.0283 instance_segmentation_loss_reg: 0.3248 instance_segmentation_loss_poly: 0.8598 +2024/01/09 02:35:38 - mmengine - INFO - Iter(train) [411500/640000] base_lr: 5.8015e-05 lr: 7.0922e-06 eta: 4 days, 4:33:15 time: 1.6148 data_time: 0.0287 memory: 25726 grad_norm: 3.0524 loss: 1.1690 detection_loss_cls: 0.0297 detection_loss_reg: 0.3283 caption_loss_cls: 2.0844 grounding_loss_reg: 2.3649 semantic_segmentation_loss_cls: 0.0075 instance_segmentation_loss_cls: 0.0282 instance_segmentation_loss_reg: 0.3236 instance_segmentation_loss_poly: 0.8569 +2024/01/09 02:48:21 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240108_140404 +2024/01/09 02:48:21 - mmengine - INFO - Iter(train) [412000/640000] base_lr: 5.7796e-05 lr: 7.0724e-06 eta: 4 days, 4:15:58 time: 1.6194 data_time: 0.0289 memory: 25726 grad_norm: 3.0208 loss: 1.1659 detection_loss_cls: 0.0297 detection_loss_reg: 0.3281 caption_loss_cls: 2.0832 grounding_loss_reg: 2.3637 semantic_segmentation_loss_cls: 0.0074 instance_segmentation_loss_cls: 0.0281 instance_segmentation_loss_reg: 0.3228 instance_segmentation_loss_poly: 0.8558 +2024/01/09 02:48:21 - mmengine - INFO - Saving checkpoint at 412000 iterations +2024/01/09 03:01:39 - mmengine - INFO - Iter(train) [412500/640000] base_lr: 5.7577e-05 lr: 7.0525e-06 eta: 4 days, 4:03:36 time: 1.6208 data_time: 0.0289 memory: 25726 grad_norm: 3.0014 loss: 1.1674 detection_loss_cls: 0.0297 detection_loss_reg: 0.3279 caption_loss_cls: 2.0783 grounding_loss_reg: 2.3666 semantic_segmentation_loss_cls: 0.0075 instance_segmentation_loss_cls: 0.0282 instance_segmentation_loss_reg: 0.3241 instance_segmentation_loss_poly: 0.8581 +2024/01/09 03:14:59 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240108_140404 +2024/01/09 03:14:59 - mmengine - INFO - Iter(train) [413000/640000] base_lr: 5.7359e-05 lr: 7.0327e-06 eta: 4 days, 3:51:26 time: 1.6182 data_time: 0.0288 memory: 25726 grad_norm: 3.0301 loss: 1.1701 detection_loss_cls: 0.0296 detection_loss_reg: 0.3285 caption_loss_cls: 2.0809 grounding_loss_reg: 2.3646 semantic_segmentation_loss_cls: 0.0075 instance_segmentation_loss_cls: 0.0282 instance_segmentation_loss_reg: 0.3238 instance_segmentation_loss_poly: 0.8572 +2024/01/09 03:27:54 - mmengine - INFO - Iter(train) [413500/640000] base_lr: 5.7141e-05 lr: 7.0128e-06 eta: 4 days, 3:36:04 time: 1.6096 data_time: 0.0286 memory: 25726 grad_norm: 3.0821 loss: 1.1821 detection_loss_cls: 0.0298 detection_loss_reg: 0.3294 caption_loss_cls: 2.0804 grounding_loss_reg: 2.3609 semantic_segmentation_loss_cls: 0.0074 instance_segmentation_loss_cls: 0.0280 instance_segmentation_loss_reg: 0.3227 instance_segmentation_loss_poly: 0.8553 +2024/01/09 03:40:40 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240108_140404 +2024/01/09 03:40:40 - mmengine - INFO - Iter(train) [414000/640000] base_lr: 5.6924e-05 lr: 6.9930e-06 eta: 4 days, 3:19:37 time: 1.5987 data_time: 0.0285 memory: 25726 grad_norm: 3.0890 loss: 1.1862 detection_loss_cls: 0.0297 detection_loss_reg: 0.3280 caption_loss_cls: 2.0805 grounding_loss_reg: 2.3615 semantic_segmentation_loss_cls: 0.0074 instance_segmentation_loss_cls: 0.0281 instance_segmentation_loss_reg: 0.3229 instance_segmentation_loss_poly: 0.8564 +2024/01/09 03:40:40 - mmengine - INFO - Saving checkpoint at 414000 iterations +2024/01/09 03:54:26 - mmengine - INFO - Iter(train) [414500/640000] base_lr: 5.6706e-05 lr: 6.9733e-06 eta: 4 days, 3:10:40 time: 1.5984 data_time: 0.0283 memory: 25726 grad_norm: 3.0914 loss: 1.1920 detection_loss_cls: 0.0297 detection_loss_reg: 0.3281 caption_loss_cls: 2.0787 grounding_loss_reg: 2.3626 semantic_segmentation_loss_cls: 0.0074 instance_segmentation_loss_cls: 0.0280 instance_segmentation_loss_reg: 0.3229 instance_segmentation_loss_poly: 0.8561 +2024/01/09 04:06:50 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240108_140404 +2024/01/09 04:06:50 - mmengine - INFO - Iter(train) [415000/640000] base_lr: 5.6489e-05 lr: 6.9535e-06 eta: 4 days, 2:51:39 time: 1.5802 data_time: 0.0279 memory: 25726 grad_norm: 3.1101 loss: 1.1972 detection_loss_cls: 0.0296 detection_loss_reg: 0.3288 caption_loss_cls: 2.0808 grounding_loss_reg: 2.3607 semantic_segmentation_loss_cls: 0.0074 instance_segmentation_loss_cls: 0.0281 instance_segmentation_loss_reg: 0.3242 instance_segmentation_loss_poly: 0.8585 +2024/01/09 04:19:40 - mmengine - INFO - Iter(train) [415500/640000] base_lr: 5.6272e-05 lr: 6.9338e-06 eta: 4 days, 2:35:59 time: 1.5597 data_time: 0.0275 memory: 25726 grad_norm: 3.1217 loss: 1.2111 detection_loss_cls: 0.0294 detection_loss_reg: 0.3263 caption_loss_cls: 2.0793 grounding_loss_reg: 2.3624 semantic_segmentation_loss_cls: 0.0074 instance_segmentation_loss_cls: 0.0279 instance_segmentation_loss_reg: 0.3223 instance_segmentation_loss_poly: 0.8550 +2024/01/09 04:32:10 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240108_140404 +2024/01/09 04:32:10 - mmengine - INFO - Iter(train) [416000/640000] base_lr: 5.6055e-05 lr: 6.9141e-06 eta: 4 days, 2:18:05 time: 1.5567 data_time: 0.0274 memory: 25726 grad_norm: 3.1811 loss: 1.2127 detection_loss_cls: 0.0293 detection_loss_reg: 0.3251 caption_loss_cls: 2.0808 grounding_loss_reg: 2.3649 semantic_segmentation_loss_cls: 0.0074 instance_segmentation_loss_cls: 0.0279 instance_segmentation_loss_reg: 0.3207 instance_segmentation_loss_poly: 0.8514 +2024/01/09 04:32:10 - mmengine - INFO - Saving checkpoint at 416000 iterations +2024/01/09 04:44:56 - mmengine - INFO - Iter(train) [416500/640000] base_lr: 5.5839e-05 lr: 6.8945e-06 eta: 4 days, 2:02:04 time: 1.5485 data_time: 0.0271 memory: 25726 grad_norm: 3.2172 loss: 1.2042 detection_loss_cls: 0.0292 detection_loss_reg: 0.3250 caption_loss_cls: 2.0757 grounding_loss_reg: 2.3664 semantic_segmentation_loss_cls: 0.0074 instance_segmentation_loss_cls: 0.0277 instance_segmentation_loss_reg: 0.3201 instance_segmentation_loss_poly: 0.8502 +2024/01/09 04:57:41 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240108_140404 +2024/01/09 04:57:41 - mmengine - INFO - Iter(train) [417000/640000] base_lr: 5.5623e-05 lr: 6.8748e-06 eta: 4 days, 1:46:06 time: 1.5398 data_time: 0.0270 memory: 25726 grad_norm: 3.2258 loss: 1.2093 detection_loss_cls: 0.0292 detection_loss_reg: 0.3258 caption_loss_cls: 2.0764 grounding_loss_reg: 2.3618 semantic_segmentation_loss_cls: 0.0074 instance_segmentation_loss_cls: 0.0277 instance_segmentation_loss_reg: 0.3204 instance_segmentation_loss_poly: 0.8510 +2024/01/09 05:10:32 - mmengine - INFO - Iter(train) [417500/640000] base_lr: 5.5407e-05 lr: 6.8552e-06 eta: 4 days, 1:30:57 time: 1.5388 data_time: 0.0270 memory: 25726 grad_norm: 3.2144 loss: 1.2101 detection_loss_cls: 0.0292 detection_loss_reg: 0.3257 caption_loss_cls: 2.0767 grounding_loss_reg: 2.3605 semantic_segmentation_loss_cls: 0.0074 instance_segmentation_loss_cls: 0.0277 instance_segmentation_loss_reg: 0.3204 instance_segmentation_loss_poly: 0.8507 +2024/01/09 05:23:40 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240108_140404 +2024/01/09 05:23:40 - mmengine - INFO - Iter(train) [418000/640000] base_lr: 5.5192e-05 lr: 6.8356e-06 eta: 4 days, 1:17:40 time: 1.5444 data_time: 0.0269 memory: 25726 grad_norm: 3.1905 loss: 1.1995 detection_loss_cls: 0.0292 detection_loss_reg: 0.3270 caption_loss_cls: 2.0751 grounding_loss_reg: 2.3585 semantic_segmentation_loss_cls: 0.0074 instance_segmentation_loss_cls: 0.0279 instance_segmentation_loss_reg: 0.3213 instance_segmentation_loss_poly: 0.8521 +2024/01/09 05:23:40 - mmengine - INFO - Saving checkpoint at 418000 iterations +2024/01/09 05:36:59 - mmengine - INFO - Iter(train) [418500/640000] base_lr: 5.4976e-05 lr: 6.8160e-06 eta: 4 days, 1:05:29 time: 1.5375 data_time: 0.0268 memory: 25726 grad_norm: 3.1690 loss: 1.2037 detection_loss_cls: 0.0292 detection_loss_reg: 0.3272 caption_loss_cls: 2.0754 grounding_loss_reg: 2.3553 semantic_segmentation_loss_cls: 0.0074 instance_segmentation_loss_cls: 0.0278 instance_segmentation_loss_reg: 0.3218 instance_segmentation_loss_poly: 0.8524 +2024/01/09 05:50:16 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240108_140404 +2024/01/09 05:50:16 - mmengine - INFO - Iter(train) [419000/640000] base_lr: 5.4761e-05 lr: 6.7965e-06 eta: 4 days, 0:53:09 time: 1.5508 data_time: 0.0270 memory: 25726 grad_norm: 3.1557 loss: 1.2009 detection_loss_cls: 0.0292 detection_loss_reg: 0.3280 caption_loss_cls: 2.0778 grounding_loss_reg: 2.3526 semantic_segmentation_loss_cls: 0.0074 instance_segmentation_loss_cls: 0.0277 instance_segmentation_loss_reg: 0.3218 instance_segmentation_loss_poly: 0.8534 +2024/01/09 06:04:31 - mmengine - INFO - Iter(train) [419500/640000] base_lr: 5.4547e-05 lr: 6.7770e-06 eta: 4 days, 0:46:45 time: 1.5719 data_time: 0.0275 memory: 25726 grad_norm: 3.1103 loss: 1.1975 detection_loss_cls: 0.0292 detection_loss_reg: 0.3288 caption_loss_cls: 2.0751 grounding_loss_reg: 2.3523 semantic_segmentation_loss_cls: 0.0073 instance_segmentation_loss_cls: 0.0277 instance_segmentation_loss_reg: 0.3224 instance_segmentation_loss_poly: 0.8557 +2024/01/09 06:18:11 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240108_140404 +2024/01/09 06:18:11 - mmengine - INFO - Iter(train) [420000/640000] base_lr: 5.4332e-05 lr: 6.7575e-06 eta: 4 days, 0:36:35 time: 1.5892 data_time: 0.0279 memory: 25726 grad_norm: 3.0347 loss: 1.1920 detection_loss_cls: 0.0292 detection_loss_reg: 0.3282 caption_loss_cls: 2.0760 grounding_loss_reg: 2.3527 semantic_segmentation_loss_cls: 0.0073 instance_segmentation_loss_cls: 0.0277 instance_segmentation_loss_reg: 0.3235 instance_segmentation_loss_poly: 0.8570 +2024/01/09 06:18:11 - mmengine - INFO - Saving checkpoint at 420000 iterations +2024/01/09 06:30:50 - mmengine - INFO - Evaluating bbox... +2024/01/09 06:31:48 - mmengine - INFO - bbox_mAP_copypaste: 0.504 0.684 0.550 0.342 0.553 0.643 +2024/01/09 06:31:48 - mmengine - INFO - Evaluating segm... +2024/01/09 06:33:01 - mmengine - INFO - segm_mAP_copypaste: 0.340 0.602 0.336 0.192 0.388 0.515 +2024/01/09 06:40:16 - mmengine - INFO - per class results: +2024/01/09 06:40:16 - mmengine - INFO - ++---------------------+-------+-------+ +| Class | IoU | Acc | ++---------------------+-------+-------+ +| wall | 78.25 | 90.18 | +| building | 82.69 | 90.84 | +| sky | 93.35 | 97.59 | +| floor | 82.97 | 90.08 | +| tree | 73.29 | 86.37 | +| ceiling | 85.47 | 94.18 | +| road | 83.98 | 89.99 | +| bed | 89.15 | 95.45 | +| windowpane | 63.95 | 78.76 | +| grass | 66.1 | 84.12 | +| cabinet | 64.17 | 76.8 | +| sidewalk | 69.01 | 82.61 | +| person | 81.57 | 90.41 | +| earth | 39.34 | 50.19 | +| door | 53.12 | 67.29 | +| table | 64.7 | 77.71 | +| mountain | 59.19 | 71.24 | +| plant | 50.36 | 60.35 | +| curtain | 75.45 | 86.96 | +| chair | 60.66 | 74.55 | +| car | 84.02 | 91.96 | +| water | 54.23 | 69.26 | +| painting | 71.0 | 85.95 | +| sofa | 71.01 | 85.15 | +| shelf | 46.57 | 65.36 | +| house | 49.76 | 72.2 | +| sea | 49.91 | 73.53 | +| mirror | 68.28 | 75.5 | +| rug | 71.28 | 82.22 | +| field | 28.68 | 47.29 | +| armchair | 48.54 | 61.77 | +| seat | 62.33 | 81.14 | +| fence | 45.67 | 60.84 | +| desk | 50.64 | 69.86 | +| rock | 49.81 | 77.07 | +| wardrobe | 48.8 | 54.71 | +| lamp | 63.28 | 74.59 | +| bathtub | 83.43 | 88.35 | +| railing | 37.48 | 57.19 | +| cushion | 61.24 | 74.52 | +| base | 22.75 | 29.58 | +| box | 30.46 | 41.84 | +| column | 50.57 | 64.73 | +| signboard | 38.47 | 50.18 | +| chest of drawers | 35.49 | 63.82 | +| counter | 30.74 | 52.06 | +| sand | 38.93 | 69.32 | +| sink | 74.82 | 82.29 | +| skyscraper | 61.25 | 77.39 | +| fireplace | 79.73 | 87.51 | +| refrigerator | 69.94 | 77.24 | +| grandstand | 42.24 | 73.99 | +| path | 21.11 | 30.72 | +| stairs | 33.92 | 44.8 | +| runway | 71.32 | 86.97 | +| case | 47.7 | 63.83 | +| pool table | 86.28 | 96.98 | +| pillow | 59.4 | 72.42 | +| screen door | 72.87 | 84.59 | +| stairway | 39.18 | 48.31 | +| river | 17.69 | 29.62 | +| bridge | 62.69 | 68.58 | +| bookcase | 35.33 | 49.13 | +| blind | 39.54 | 44.31 | +| coffee table | 69.92 | 83.69 | +| toilet | 84.41 | 91.44 | +| flower | 38.51 | 59.62 | +| book | 51.08 | 75.71 | +| hill | 13.03 | 21.32 | +| bench | 53.59 | 68.54 | +| countertop | 57.9 | 74.28 | +| stove | 77.09 | 83.89 | +| palm | 45.82 | 62.81 | +| kitchen island | 47.19 | 93.04 | +| computer | 70.37 | 79.46 | +| swivel chair | 42.0 | 57.87 | +| boat | 77.44 | 86.85 | +| bar | 37.83 | 51.94 | +| arcade machine | 22.49 | 23.52 | +| hovel | 16.6 | 17.89 | +| bus | 92.6 | 96.06 | +| towel | 63.99 | 79.96 | +| light | 52.53 | 63.3 | +| truck | 40.34 | 59.48 | +| tower | 20.6 | 35.05 | +| chandelier | 65.86 | 78.79 | +| awning | 34.54 | 43.03 | +| streetlight | 30.67 | 40.07 | +| booth | 33.94 | 44.77 | +| television receiver | 66.53 | 78.97 | +| airplane | 60.26 | 67.89 | +| dirt track | 7.14 | 9.45 | +| apparel | 29.72 | 46.95 | +| pole | 23.81 | 31.15 | +| land | 2.52 | 4.55 | +| bannister | 14.54 | 20.61 | +| escalator | 26.32 | 29.63 | +| ottoman | 52.63 | 68.74 | +| bottle | 23.3 | 30.72 | +| buffet | 46.08 | 50.36 | +| poster | 35.6 | 43.11 | +| stage | 9.9 | 17.84 | +| van | 44.67 | 55.62 | +| ship | 66.22 | 74.23 | +| fountain | 22.03 | 23.09 | +| conveyer belt | 81.15 | 90.72 | +| canopy | 31.04 | 38.84 | +| washer | 71.49 | 74.29 | +| plaything | 32.97 | 40.55 | +| swimming pool | 55.32 | 72.46 | +| stool | 52.51 | 65.86 | +| barrel | 46.56 | 61.1 | +| basket | 30.79 | 49.92 | +| waterfall | 40.7 | 55.06 | +| tent | 81.81 | 96.8 | +| bag | 22.05 | 28.89 | +| minibike | 73.02 | 82.01 | +| cradle | 71.96 | 96.18 | +| oven | 54.54 | 80.26 | +| ball | 55.78 | 74.97 | +| food | 53.7 | 60.06 | +| step | 19.25 | 25.47 | +| tank | 36.4 | 43.29 | +| trade name | 22.79 | 24.39 | +| microwave | 83.5 | 89.26 | +| pot | 47.42 | 54.92 | +| animal | 57.08 | 59.14 | +| bicycle | 58.73 | 72.65 | +| lake | 55.37 | 63.28 | +| dishwasher | 61.02 | 76.06 | +| screen | 52.62 | 68.74 | +| blanket | 20.99 | 24.66 | +| sculpture | 58.11 | 68.05 | +| hood | 58.48 | 68.62 | +| sconce | 39.81 | 46.43 | +| vase | 44.29 | 62.29 | +| traffic light | 39.73 | 60.72 | +| tray | 7.88 | 14.22 | +| ashcan | 47.19 | 62.04 | +| fan | 60.89 | 77.87 | +| pier | 54.5 | 65.56 | +| crt screen | 15.22 | 38.82 | +| plate | 55.2 | 74.0 | +| monitor | 2.93 | 4.02 | +| bulletin board | 42.75 | 49.4 | +| shower | 3.15 | 3.3 | +| radiator | 53.92 | 59.07 | +| glass | 18.62 | 19.92 | +| clock | 27.0 | 33.95 | +| flag | 23.78 | 26.62 | ++---------------------+-------+-------+ +2024/01/09 06:40:32 - mmengine - INFO - Iter(val) [209/209] coco/bbox_mAP: 0.5040 coco/bbox_mAP_50: 0.6840 coco/bbox_mAP_75: 0.5500 coco/bbox_mAP_s: 0.3420 coco/bbox_mAP_m: 0.5530 coco/bbox_mAP_l: 0.6430 coco/segm_mAP: 0.3400 coco/segm_mAP_50: 0.6020 coco/segm_mAP_75: 0.3360 coco/segm_mAP_s: 0.1920 coco/segm_mAP_m: 0.3880 coco/segm_mAP_l: 0.5150 Bleu_1: 0.7565 Bleu_2: 0.5952 Bleu_3: 0.4550 Bleu_4: 0.3439 METEOR: 0.2695 ROUGE_L: 0.5576 CIDEr: 1.0962 SPICE: 0.2006 aAcc: 83.6800 mIoU: 50.1400 mAcc: 62.0300 visual-grounding/miou: 0.8142 visual-grounding/acc: 0.8804 data_time: 0.0042 time: 1.3525 +2024/01/09 06:53:05 - mmengine - INFO - Iter(train) [420500/640000] base_lr: 5.4118e-05 lr: 6.7380e-06 eta: 4 days, 0:19:48 time: 1.5866 data_time: 0.0238 memory: 25726 grad_norm: 3.0322 loss: 1.1954 detection_loss_cls: 0.0291 detection_loss_reg: 0.3283 caption_loss_cls: 2.0719 grounding_loss_reg: 2.3491 semantic_segmentation_loss_cls: 0.0073 instance_segmentation_loss_cls: 0.0276 instance_segmentation_loss_reg: 0.3226 instance_segmentation_loss_poly: 0.8546 +2024/01/09 07:05:56 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240108_140404 +2024/01/09 07:05:56 - mmengine - INFO - Iter(train) [421000/640000] base_lr: 5.3904e-05 lr: 6.7186e-06 eta: 4 days, 0:04:40 time: 1.5879 data_time: 0.0238 memory: 25726 grad_norm: 3.0472 loss: 1.1961 detection_loss_cls: 0.0290 detection_loss_reg: 0.3286 caption_loss_cls: 2.0742 grounding_loss_reg: 2.3462 semantic_segmentation_loss_cls: 0.0073 instance_segmentation_loss_cls: 0.0276 instance_segmentation_loss_reg: 0.3221 instance_segmentation_loss_poly: 0.8533 +2024/01/09 07:19:22 - mmengine - INFO - Iter(train) [421500/640000] base_lr: 5.3691e-05 lr: 6.6991e-06 eta: 3 days, 23:53:05 time: 1.5966 data_time: 0.0240 memory: 25726 grad_norm: 3.0161 loss: 1.1906 detection_loss_cls: 0.0290 detection_loss_reg: 0.3280 caption_loss_cls: 2.0705 grounding_loss_reg: 2.3434 semantic_segmentation_loss_cls: 0.0073 instance_segmentation_loss_cls: 0.0276 instance_segmentation_loss_reg: 0.3227 instance_segmentation_loss_poly: 0.8541 +2024/01/09 07:32:18 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240108_140404 +2024/01/09 07:32:18 - mmengine - INFO - Iter(train) [422000/640000] base_lr: 5.3477e-05 lr: 6.6797e-06 eta: 3 days, 23:38:32 time: 1.5936 data_time: 0.0240 memory: 25726 grad_norm: 3.0355 loss: 1.1991 detection_loss_cls: 0.0290 detection_loss_reg: 0.3284 caption_loss_cls: 2.0699 grounding_loss_reg: 2.3421 semantic_segmentation_loss_cls: 0.0073 instance_segmentation_loss_cls: 0.0276 instance_segmentation_loss_reg: 0.3223 instance_segmentation_loss_poly: 0.8535 +2024/01/09 07:32:18 - mmengine - INFO - Saving checkpoint at 422000 iterations +2024/01/09 07:46:18 - mmengine - INFO - Iter(train) [422500/640000] base_lr: 5.3264e-05 lr: 6.6604e-06 eta: 3 days, 23:30:05 time: 1.6040 data_time: 0.0241 memory: 25726 grad_norm: 3.0391 loss: 1.1856 detection_loss_cls: 0.0288 detection_loss_reg: 0.3270 caption_loss_cls: 2.0710 grounding_loss_reg: 2.3422 semantic_segmentation_loss_cls: 0.0073 instance_segmentation_loss_cls: 0.0275 instance_segmentation_loss_reg: 0.3216 instance_segmentation_loss_poly: 0.8513 +2024/01/09 07:59:25 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240108_140404 +2024/01/09 07:59:25 - mmengine - INFO - Iter(train) [423000/640000] base_lr: 5.3052e-05 lr: 6.6410e-06 eta: 3 days, 23:16:33 time: 1.6014 data_time: 0.0241 memory: 25726 grad_norm: 3.0409 loss: 1.1870 detection_loss_cls: 0.0286 detection_loss_reg: 0.3257 caption_loss_cls: 2.0728 grounding_loss_reg: 2.3446 semantic_segmentation_loss_cls: 0.0073 instance_segmentation_loss_cls: 0.0274 instance_segmentation_loss_reg: 0.3211 instance_segmentation_loss_poly: 0.8490 +2024/01/09 08:12:37 - mmengine - INFO - Iter(train) [423500/640000] base_lr: 5.2839e-05 lr: 6.6217e-06 eta: 3 days, 23:03:32 time: 1.5859 data_time: 0.0236 memory: 25726 grad_norm: 3.0843 loss: 1.1818 detection_loss_cls: 0.0286 detection_loss_reg: 0.3251 caption_loss_cls: 2.0715 grounding_loss_reg: 2.3480 semantic_segmentation_loss_cls: 0.0073 instance_segmentation_loss_cls: 0.0274 instance_segmentation_loss_reg: 0.3204 instance_segmentation_loss_poly: 0.8476 +2024/01/09 08:26:05 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240108_140404 +2024/01/09 08:26:05 - mmengine - INFO - Iter(train) [424000/640000] base_lr: 5.2627e-05 lr: 6.6024e-06 eta: 3 days, 22:51:57 time: 1.5830 data_time: 0.0235 memory: 25726 grad_norm: 3.0635 loss: 1.1762 detection_loss_cls: 0.0285 detection_loss_reg: 0.3257 caption_loss_cls: 2.0726 grounding_loss_reg: 2.3467 semantic_segmentation_loss_cls: 0.0073 instance_segmentation_loss_cls: 0.0273 instance_segmentation_loss_reg: 0.3200 instance_segmentation_loss_poly: 0.8466 +2024/01/09 08:26:05 - mmengine - INFO - Saving checkpoint at 424000 iterations +2024/01/09 08:39:55 - mmengine - INFO - Iter(train) [424500/640000] base_lr: 5.2415e-05 lr: 6.5832e-06 eta: 3 days, 22:42:11 time: 1.6016 data_time: 0.0282 memory: 25726 grad_norm: 3.0242 loss: 1.1730 detection_loss_cls: 0.0285 detection_loss_reg: 0.3257 caption_loss_cls: 2.0684 grounding_loss_reg: 2.3456 semantic_segmentation_loss_cls: 0.0073 instance_segmentation_loss_cls: 0.0273 instance_segmentation_loss_reg: 0.3203 instance_segmentation_loss_poly: 0.8472 +2024/01/09 08:53:24 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240108_140404 +2024/01/09 08:53:24 - mmengine - INFO - Iter(train) [425000/640000] base_lr: 5.2204e-05 lr: 6.5640e-06 eta: 3 days, 22:30:34 time: 1.6114 data_time: 0.0283 memory: 25726 grad_norm: 2.9626 loss: 1.1590 detection_loss_cls: 0.0285 detection_loss_reg: 0.3255 caption_loss_cls: 2.0663 grounding_loss_reg: 2.3432 semantic_segmentation_loss_cls: 0.0073 instance_segmentation_loss_cls: 0.0273 instance_segmentation_loss_reg: 0.3208 instance_segmentation_loss_poly: 0.8470 +2024/01/09 09:06:31 - mmengine - INFO - Iter(train) [425500/640000] base_lr: 5.1992e-05 lr: 6.5447e-06 eta: 3 days, 22:17:00 time: 1.6066 data_time: 0.0283 memory: 25726 grad_norm: 2.9947 loss: 1.1695 detection_loss_cls: 0.0284 detection_loss_reg: 0.3242 caption_loss_cls: 2.0690 grounding_loss_reg: 2.3438 semantic_segmentation_loss_cls: 0.0073 instance_segmentation_loss_cls: 0.0272 instance_segmentation_loss_reg: 0.3200 instance_segmentation_loss_poly: 0.8452 +2024/01/09 09:19:42 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240108_140404 +2024/01/09 09:19:42 - mmengine - INFO - Iter(train) [426000/640000] base_lr: 5.1781e-05 lr: 6.5256e-06 eta: 3 days, 22:03:45 time: 1.6103 data_time: 0.0284 memory: 25726 grad_norm: 2.9825 loss: 1.1613 detection_loss_cls: 0.0284 detection_loss_reg: 0.3244 caption_loss_cls: 2.0687 grounding_loss_reg: 2.3448 semantic_segmentation_loss_cls: 0.0073 instance_segmentation_loss_cls: 0.0273 instance_segmentation_loss_reg: 0.3210 instance_segmentation_loss_poly: 0.8473 +2024/01/09 09:19:42 - mmengine - INFO - Saving checkpoint at 426000 iterations +2024/01/09 09:33:23 - mmengine - INFO - Iter(train) [426500/640000] base_lr: 5.1571e-05 lr: 6.5064e-06 eta: 3 days, 21:52:59 time: 1.6054 data_time: 0.0283 memory: 25726 grad_norm: 3.0093 loss: 1.1670 detection_loss_cls: 0.0284 detection_loss_reg: 0.3242 caption_loss_cls: 2.0699 grounding_loss_reg: 2.3433 semantic_segmentation_loss_cls: 0.0072 instance_segmentation_loss_cls: 0.0271 instance_segmentation_loss_reg: 0.3198 instance_segmentation_loss_poly: 0.8447 +2024/01/09 09:46:26 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240108_140404 +2024/01/09 09:46:26 - mmengine - INFO - Iter(train) [427000/640000] base_lr: 5.1360e-05 lr: 6.4873e-06 eta: 3 days, 21:39:03 time: 1.6045 data_time: 0.0284 memory: 25726 grad_norm: 3.0134 loss: 1.1653 detection_loss_cls: 0.0282 detection_loss_reg: 0.3242 caption_loss_cls: 2.0638 grounding_loss_reg: 2.3409 semantic_segmentation_loss_cls: 0.0072 instance_segmentation_loss_cls: 0.0271 instance_segmentation_loss_reg: 0.3201 instance_segmentation_loss_poly: 0.8462 +2024/01/09 09:59:52 - mmengine - INFO - Iter(train) [427500/640000] base_lr: 5.1150e-05 lr: 6.4682e-06 eta: 3 days, 21:27:01 time: 1.6079 data_time: 0.0286 memory: 25726 grad_norm: 3.0509 loss: 1.1704 detection_loss_cls: 0.0282 detection_loss_reg: 0.3243 caption_loss_cls: 2.0645 grounding_loss_reg: 2.3372 semantic_segmentation_loss_cls: 0.0072 instance_segmentation_loss_cls: 0.0270 instance_segmentation_loss_reg: 0.3202 instance_segmentation_loss_poly: 0.8461 +2024/01/09 10:12:31 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240108_140404 +2024/01/09 10:12:31 - mmengine - INFO - Iter(train) [428000/640000] base_lr: 5.0940e-05 lr: 6.4491e-06 eta: 3 days, 21:11:11 time: 1.5955 data_time: 0.0285 memory: 25726 grad_norm: 3.1462 loss: 1.1912 detection_loss_cls: 0.0282 detection_loss_reg: 0.3252 caption_loss_cls: 2.0645 grounding_loss_reg: 2.3343 semantic_segmentation_loss_cls: 0.0072 instance_segmentation_loss_cls: 0.0270 instance_segmentation_loss_reg: 0.3203 instance_segmentation_loss_poly: 0.8462 +2024/01/09 10:12:31 - mmengine - INFO - Saving checkpoint at 428000 iterations +2024/01/09 10:27:01 - mmengine - INFO - Iter(train) [428500/640000] base_lr: 5.0731e-05 lr: 6.4301e-06 eta: 3 days, 21:04:15 time: 1.6059 data_time: 0.0286 memory: 25726 grad_norm: 3.1374 loss: 1.1848 detection_loss_cls: 0.0282 detection_loss_reg: 0.3254 caption_loss_cls: 2.0655 grounding_loss_reg: 2.3341 semantic_segmentation_loss_cls: 0.0072 instance_segmentation_loss_cls: 0.0270 instance_segmentation_loss_reg: 0.3203 instance_segmentation_loss_poly: 0.8463 +2024/01/09 10:40:46 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240108_140404 +2024/01/09 10:40:46 - mmengine - INFO - Iter(train) [429000/640000] base_lr: 5.0522e-05 lr: 6.4111e-06 eta: 3 days, 20:53:33 time: 1.6096 data_time: 0.0287 memory: 25726 grad_norm: 3.1626 loss: 1.1966 detection_loss_cls: 0.0282 detection_loss_reg: 0.3251 caption_loss_cls: 2.0675 grounding_loss_reg: 2.3329 semantic_segmentation_loss_cls: 0.0072 instance_segmentation_loss_cls: 0.0270 instance_segmentation_loss_reg: 0.3208 instance_segmentation_loss_poly: 0.8474 +2024/01/09 10:53:47 - mmengine - INFO - Iter(train) [429500/640000] base_lr: 5.0313e-05 lr: 6.3921e-06 eta: 3 days, 20:39:26 time: 1.6081 data_time: 0.0287 memory: 25726 grad_norm: 3.1718 loss: 1.1923 detection_loss_cls: 0.0282 detection_loss_reg: 0.3255 caption_loss_cls: 2.0686 grounding_loss_reg: 2.3313 semantic_segmentation_loss_cls: 0.0072 instance_segmentation_loss_cls: 0.0271 instance_segmentation_loss_reg: 0.3217 instance_segmentation_loss_poly: 0.8493 +2024/01/09 11:07:08 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240108_140404 +2024/01/09 11:07:08 - mmengine - INFO - Iter(train) [430000/640000] base_lr: 5.0104e-05 lr: 6.3731e-06 eta: 3 days, 20:26:50 time: 1.6105 data_time: 0.0288 memory: 25726 grad_norm: 3.1871 loss: 1.2005 detection_loss_cls: 0.0282 detection_loss_reg: 0.3254 caption_loss_cls: 2.0710 grounding_loss_reg: 2.3333 semantic_segmentation_loss_cls: 0.0072 instance_segmentation_loss_cls: 0.0272 instance_segmentation_loss_reg: 0.3221 instance_segmentation_loss_poly: 0.8512 +2024/01/09 11:07:08 - mmengine - INFO - Saving checkpoint at 430000 iterations +2024/01/09 11:20:18 - mmengine - INFO - Iter(train) [430500/640000] base_lr: 4.9896e-05 lr: 6.3542e-06 eta: 3 days, 20:13:27 time: 1.6030 data_time: 0.0287 memory: 25726 grad_norm: 3.2165 loss: 1.2058 detection_loss_cls: 0.0282 detection_loss_reg: 0.3251 caption_loss_cls: 2.0701 grounding_loss_reg: 2.3318 semantic_segmentation_loss_cls: 0.0072 instance_segmentation_loss_cls: 0.0272 instance_segmentation_loss_reg: 0.3214 instance_segmentation_loss_poly: 0.8500 +2024/01/09 11:33:48 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240108_140404 +2024/01/09 11:33:48 - mmengine - INFO - Iter(train) [431000/640000] base_lr: 4.9688e-05 lr: 6.3353e-06 eta: 3 days, 20:01:30 time: 1.6097 data_time: 0.0287 memory: 25726 grad_norm: 3.1935 loss: 1.2008 detection_loss_cls: 0.0283 detection_loss_reg: 0.3246 caption_loss_cls: 2.0739 grounding_loss_reg: 2.3314 semantic_segmentation_loss_cls: 0.0072 instance_segmentation_loss_cls: 0.0272 instance_segmentation_loss_reg: 0.3220 instance_segmentation_loss_poly: 0.8506 +2024/01/09 11:46:28 - mmengine - INFO - Iter(train) [431500/640000] base_lr: 4.9480e-05 lr: 6.3164e-06 eta: 3 days, 19:45:55 time: 1.5984 data_time: 0.0284 memory: 25726 grad_norm: 3.1962 loss: 1.2038 detection_loss_cls: 0.0282 detection_loss_reg: 0.3236 caption_loss_cls: 2.0718 grounding_loss_reg: 2.3315 semantic_segmentation_loss_cls: 0.0072 instance_segmentation_loss_cls: 0.0273 instance_segmentation_loss_reg: 0.3231 instance_segmentation_loss_poly: 0.8527 +2024/01/09 11:59:20 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240108_140404 +2024/01/09 11:59:20 - mmengine - INFO - Iter(train) [432000/640000] base_lr: 4.9273e-05 lr: 6.2976e-06 eta: 3 days, 19:31:13 time: 1.6015 data_time: 0.0284 memory: 25726 grad_norm: 3.1714 loss: 1.1890 detection_loss_cls: 0.0282 detection_loss_reg: 0.3243 caption_loss_cls: 2.0746 grounding_loss_reg: 2.3304 semantic_segmentation_loss_cls: 0.0072 instance_segmentation_loss_cls: 0.0272 instance_segmentation_loss_reg: 0.3222 instance_segmentation_loss_poly: 0.8505 +2024/01/09 11:59:20 - mmengine - INFO - Saving checkpoint at 432000 iterations +2024/01/09 12:12:43 - mmengine - INFO - Iter(train) [432500/640000] base_lr: 4.9066e-05 lr: 6.2787e-06 eta: 3 days, 19:18:48 time: 1.5847 data_time: 0.0281 memory: 25726 grad_norm: 3.1745 loss: 1.1951 detection_loss_cls: 0.0283 detection_loss_reg: 0.3254 caption_loss_cls: 2.0677 grounding_loss_reg: 2.3283 semantic_segmentation_loss_cls: 0.0072 instance_segmentation_loss_cls: 0.0272 instance_segmentation_loss_reg: 0.3220 instance_segmentation_loss_poly: 0.8509 +2024/01/09 12:26:21 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240108_140404 +2024/01/09 12:26:21 - mmengine - INFO - Iter(train) [433000/640000] base_lr: 4.8859e-05 lr: 6.2599e-06 eta: 3 days, 19:07:22 time: 1.5830 data_time: 0.0281 memory: 25726 grad_norm: 3.1926 loss: 1.1956 detection_loss_cls: 0.0283 detection_loss_reg: 0.3256 caption_loss_cls: 2.0686 grounding_loss_reg: 2.3270 semantic_segmentation_loss_cls: 0.0072 instance_segmentation_loss_cls: 0.0272 instance_segmentation_loss_reg: 0.3233 instance_segmentation_loss_poly: 0.8547 +2024/01/09 12:39:44 - mmengine - INFO - Iter(train) [433500/640000] base_lr: 4.8653e-05 lr: 6.2412e-06 eta: 3 days, 18:54:52 time: 1.5885 data_time: 0.0281 memory: 25726 grad_norm: 3.1715 loss: 1.1881 detection_loss_cls: 0.0284 detection_loss_reg: 0.3261 caption_loss_cls: 2.0667 grounding_loss_reg: 2.3272 semantic_segmentation_loss_cls: 0.0072 instance_segmentation_loss_cls: 0.0272 instance_segmentation_loss_reg: 0.3236 instance_segmentation_loss_poly: 0.8544 +2024/01/09 12:52:53 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240108_140404 +2024/01/09 12:52:53 - mmengine - INFO - Iter(train) [434000/640000] base_lr: 4.8447e-05 lr: 6.2224e-06 eta: 3 days, 18:41:22 time: 1.5855 data_time: 0.0279 memory: 25726 grad_norm: 3.1737 loss: 1.1816 detection_loss_cls: 0.0284 detection_loss_reg: 0.3261 caption_loss_cls: 2.0650 grounding_loss_reg: 2.3239 semantic_segmentation_loss_cls: 0.0072 instance_segmentation_loss_cls: 0.0272 instance_segmentation_loss_reg: 0.3237 instance_segmentation_loss_poly: 0.8545 +2024/01/09 12:52:53 - mmengine - INFO - Saving checkpoint at 434000 iterations +2024/01/09 13:07:14 - mmengine - INFO - Iter(train) [434500/640000] base_lr: 4.8241e-05 lr: 6.2037e-06 eta: 3 days, 18:32:50 time: 1.6033 data_time: 0.0280 memory: 25726 grad_norm: 3.1472 loss: 1.1719 detection_loss_cls: 0.0284 detection_loss_reg: 0.3270 caption_loss_cls: 2.0649 grounding_loss_reg: 2.3254 semantic_segmentation_loss_cls: 0.0072 instance_segmentation_loss_cls: 0.0271 instance_segmentation_loss_reg: 0.3219 instance_segmentation_loss_poly: 0.8512 +2024/01/09 13:20:22 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240108_140404 +2024/01/09 13:20:22 - mmengine - INFO - Iter(train) [435000/640000] base_lr: 4.8036e-05 lr: 6.1851e-06 eta: 3 days, 18:19:11 time: 1.5977 data_time: 0.0279 memory: 25726 grad_norm: 3.1804 loss: 1.1729 detection_loss_cls: 0.0283 detection_loss_reg: 0.3259 caption_loss_cls: 2.0661 grounding_loss_reg: 2.3227 semantic_segmentation_loss_cls: 0.0072 instance_segmentation_loss_cls: 0.0271 instance_segmentation_loss_reg: 0.3221 instance_segmentation_loss_poly: 0.8513 +2024/01/09 13:33:11 - mmengine - INFO - Iter(train) [435500/640000] base_lr: 4.7831e-05 lr: 6.1664e-06 eta: 3 days, 18:04:22 time: 1.5998 data_time: 0.0279 memory: 25726 grad_norm: 3.1921 loss: 1.1724 detection_loss_cls: 0.0284 detection_loss_reg: 0.3267 caption_loss_cls: 2.0664 grounding_loss_reg: 2.3256 semantic_segmentation_loss_cls: 0.0072 instance_segmentation_loss_cls: 0.0271 instance_segmentation_loss_reg: 0.3225 instance_segmentation_loss_poly: 0.8515 +2024/01/09 13:46:12 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240108_140404 +2024/01/09 13:46:12 - mmengine - INFO - Iter(train) [436000/640000] base_lr: 4.7626e-05 lr: 6.1478e-06 eta: 3 days, 17:50:21 time: 1.6021 data_time: 0.0280 memory: 25726 grad_norm: 3.1859 loss: 1.1772 detection_loss_cls: 0.0285 detection_loss_reg: 0.3286 caption_loss_cls: 2.0701 grounding_loss_reg: 2.3208 semantic_segmentation_loss_cls: 0.0072 instance_segmentation_loss_cls: 0.0272 instance_segmentation_loss_reg: 0.3238 instance_segmentation_loss_poly: 0.8545 +2024/01/09 13:46:12 - mmengine - INFO - Saving checkpoint at 436000 iterations +2024/01/09 13:59:53 - mmengine - INFO - Iter(train) [436500/640000] base_lr: 4.7421e-05 lr: 6.1292e-06 eta: 3 days, 17:38:59 time: 1.6067 data_time: 0.0280 memory: 25726 grad_norm: 3.2625 loss: 1.1785 detection_loss_cls: 0.0285 detection_loss_reg: 0.3287 caption_loss_cls: 2.0728 grounding_loss_reg: 2.3169 semantic_segmentation_loss_cls: 0.0072 instance_segmentation_loss_cls: 0.0273 instance_segmentation_loss_reg: 0.3239 instance_segmentation_loss_poly: 0.8551 +2024/01/09 15:06:52 - mmengine - INFO - Iter(train) [437000/640000] base_lr: 4.7217e-05 lr: 6.1106e-06 eta: 3 days, 16:57:50 time: 1.5914 data_time: 0.0224 memory: 25718 grad_norm: 3.2483 loss: 1.1688 detection_loss_cls: 0.0284 detection_loss_reg: 0.3288 caption_loss_cls: 2.0659 grounding_loss_reg: 2.3151 semantic_segmentation_loss_cls: 0.0072 instance_segmentation_loss_cls: 0.0271 instance_segmentation_loss_reg: 0.3235 instance_segmentation_loss_poly: 0.8539 +2024/01/09 15:19:51 - mmengine - INFO - Iter(train) [437500/640000] base_lr: 4.7013e-05 lr: 6.0921e-06 eta: 3 days, 16:20:21 time: 1.5853 data_time: 0.0218 memory: 25718 grad_norm: 3.3164 loss: 1.1623 detection_loss_cls: 0.0285 detection_loss_reg: 0.3283 caption_loss_cls: 2.0650 grounding_loss_reg: 2.3133 semantic_segmentation_loss_cls: 0.0072 instance_segmentation_loss_cls: 0.0271 instance_segmentation_loss_reg: 0.3236 instance_segmentation_loss_poly: 0.8549 +2024/01/09 15:32:53 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240109_143717 +2024/01/09 15:32:53 - mmengine - INFO - Iter(train) [438000/640000] base_lr: 4.6810e-05 lr: 6.0736e-06 eta: 3 days, 16:00:32 time: 1.5835 data_time: 0.0214 memory: 25718 grad_norm: 3.3391 loss: 1.1616 detection_loss_cls: 0.0284 detection_loss_reg: 0.3276 caption_loss_cls: 2.0610 grounding_loss_reg: 2.3105 semantic_segmentation_loss_cls: 0.0072 instance_segmentation_loss_cls: 0.0269 instance_segmentation_loss_reg: 0.3227 instance_segmentation_loss_poly: 0.8533 +2024/01/09 15:32:53 - mmengine - INFO - Saving checkpoint at 438000 iterations +2024/01/09 15:46:29 - mmengine - INFO - Iter(train) [438500/640000] base_lr: 4.6607e-05 lr: 6.0551e-06 eta: 3 days, 16:30:03 time: 1.5722 data_time: 0.0210 memory: 25718 grad_norm: 3.3773 loss: 1.1713 detection_loss_cls: 0.0284 detection_loss_reg: 0.3270 caption_loss_cls: 2.0575 grounding_loss_reg: 2.3146 semantic_segmentation_loss_cls: 0.0072 instance_segmentation_loss_cls: 0.0269 instance_segmentation_loss_reg: 0.3224 instance_segmentation_loss_poly: 0.8524 +2024/01/09 15:59:31 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240109_143717 +2024/01/09 15:59:31 - mmengine - INFO - Iter(train) [439000/640000] base_lr: 4.6404e-05 lr: 6.0367e-06 eta: 3 days, 16:07:18 time: 1.5710 data_time: 0.0206 memory: 25718 grad_norm: 3.3868 loss: 1.1712 detection_loss_cls: 0.0283 detection_loss_reg: 0.3265 caption_loss_cls: 2.0512 grounding_loss_reg: 2.3135 semantic_segmentation_loss_cls: 0.0072 instance_segmentation_loss_cls: 0.0269 instance_segmentation_loss_reg: 0.3221 instance_segmentation_loss_poly: 0.8524 +2024/01/09 16:12:26 - mmengine - INFO - Iter(train) [439500/640000] base_lr: 4.6201e-05 lr: 6.0183e-06 eta: 3 days, 15:39:41 time: 1.5723 data_time: 0.0204 memory: 25718 grad_norm: 3.3964 loss: 1.1705 detection_loss_cls: 0.0282 detection_loss_reg: 0.3255 caption_loss_cls: 2.0477 grounding_loss_reg: 2.3117 semantic_segmentation_loss_cls: 0.0072 instance_segmentation_loss_cls: 0.0269 instance_segmentation_loss_reg: 0.3216 instance_segmentation_loss_poly: 0.8516 +2024/01/09 16:25:45 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240109_143717 +2024/01/09 16:25:45 - mmengine - INFO - Iter(train) [440000/640000] base_lr: 4.5999e-05 lr: 5.9999e-06 eta: 3 days, 15:36:37 time: 1.5770 data_time: 0.0201 memory: 25718 grad_norm: 3.3625 loss: 1.1612 detection_loss_cls: 0.0283 detection_loss_reg: 0.3255 caption_loss_cls: 2.0473 grounding_loss_reg: 2.3091 semantic_segmentation_loss_cls: 0.0072 instance_segmentation_loss_cls: 0.0268 instance_segmentation_loss_reg: 0.3216 instance_segmentation_loss_poly: 0.8516 +2024/01/09 16:25:45 - mmengine - INFO - Saving checkpoint at 440000 iterations +2024/01/09 16:38:05 - mmengine - INFO - Evaluating bbox... +2024/01/09 16:39:03 - mmengine - INFO - bbox_mAP_copypaste: 0.506 0.684 0.556 0.350 0.554 0.635 +2024/01/09 16:39:03 - mmengine - INFO - Evaluating segm... +2024/01/09 16:40:17 - mmengine - INFO - segm_mAP_copypaste: 0.341 0.604 0.337 0.198 0.386 0.513 +2024/01/09 16:48:12 - mmengine - INFO - per class results: +2024/01/09 16:48:12 - mmengine - INFO - ++---------------------+-------+-------+ +| Class | IoU | Acc | ++---------------------+-------+-------+ +| wall | 78.76 | 88.55 | +| building | 82.99 | 92.68 | +| sky | 93.59 | 97.94 | +| floor | 82.82 | 89.56 | +| tree | 74.17 | 86.62 | +| ceiling | 84.58 | 92.89 | +| road | 83.39 | 88.16 | +| bed | 90.39 | 96.22 | +| windowpane | 63.0 | 79.51 | +| grass | 65.44 | 80.47 | +| cabinet | 62.53 | 74.29 | +| sidewalk | 65.67 | 80.52 | +| person | 81.81 | 91.46 | +| earth | 40.22 | 55.96 | +| door | 55.97 | 70.15 | +| table | 64.14 | 79.7 | +| mountain | 60.24 | 77.53 | +| plant | 53.97 | 66.55 | +| curtain | 73.68 | 86.95 | +| chair | 61.31 | 76.01 | +| car | 84.91 | 92.02 | +| water | 55.63 | 69.73 | +| painting | 68.94 | 87.52 | +| sofa | 70.63 | 86.17 | +| shelf | 45.72 | 65.82 | +| house | 46.91 | 64.6 | +| sea | 52.89 | 71.8 | +| mirror | 69.36 | 77.19 | +| rug | 70.56 | 81.22 | +| field | 29.6 | 47.54 | +| armchair | 47.52 | 60.76 | +| seat | 65.06 | 83.3 | +| fence | 45.52 | 66.55 | +| desk | 50.1 | 66.72 | +| rock | 36.12 | 54.55 | +| wardrobe | 47.08 | 61.25 | +| lamp | 63.59 | 76.5 | +| bathtub | 80.59 | 83.8 | +| railing | 35.91 | 51.97 | +| cushion | 60.33 | 71.93 | +| base | 24.94 | 36.14 | +| box | 28.11 | 41.11 | +| column | 52.2 | 71.15 | +| signboard | 37.37 | 49.9 | +| chest of drawers | 39.98 | 61.16 | +| counter | 26.52 | 35.86 | +| sand | 39.86 | 56.61 | +| sink | 75.95 | 83.63 | +| skyscraper | 54.19 | 68.01 | +| fireplace | 79.13 | 86.45 | +| refrigerator | 72.63 | 78.97 | +| grandstand | 41.72 | 77.05 | +| path | 22.29 | 33.99 | +| stairs | 26.77 | 34.83 | +| runway | 77.09 | 86.48 | +| case | 53.38 | 75.34 | +| pool table | 91.43 | 95.51 | +| pillow | 59.31 | 72.17 | +| screen door | 81.24 | 87.39 | +| stairway | 29.85 | 45.35 | +| river | 18.56 | 40.01 | +| bridge | 52.84 | 77.14 | +| bookcase | 39.06 | 61.59 | +| blind | 37.73 | 42.1 | +| coffee table | 67.42 | 85.86 | +| toilet | 87.54 | 91.83 | +| flower | 40.8 | 58.42 | +| book | 50.93 | 68.24 | +| hill | 13.84 | 25.23 | +| bench | 56.01 | 63.71 | +| countertop | 57.67 | 66.19 | +| stove | 77.56 | 87.22 | +| palm | 48.96 | 70.62 | +| kitchen island | 43.07 | 83.24 | +| computer | 71.77 | 81.13 | +| swivel chair | 41.3 | 54.64 | +| boat | 58.36 | 65.0 | +| bar | 39.91 | 56.3 | +| arcade machine | 52.12 | 56.73 | +| hovel | 15.96 | 17.07 | +| bus | 92.67 | 95.86 | +| towel | 66.62 | 77.74 | +| light | 53.8 | 66.69 | +| truck | 43.39 | 57.88 | +| tower | 22.52 | 36.66 | +| chandelier | 65.8 | 83.08 | +| awning | 34.94 | 39.72 | +| streetlight | 33.5 | 47.55 | +| booth | 35.31 | 41.26 | +| television receiver | 70.97 | 78.95 | +| airplane | 62.51 | 70.15 | +| dirt track | 10.51 | 19.75 | +| apparel | 39.44 | 58.82 | +| pole | 29.18 | 41.89 | +| land | 3.28 | 5.66 | +| bannister | 15.63 | 20.1 | +| escalator | 21.46 | 22.6 | +| ottoman | 52.6 | 73.66 | +| bottle | 24.63 | 34.22 | +| buffet | 46.86 | 62.33 | +| poster | 35.06 | 45.42 | +| stage | 10.84 | 19.27 | +| van | 48.36 | 64.03 | +| ship | 16.08 | 21.6 | +| fountain | 22.19 | 22.4 | +| conveyer belt | 81.04 | 89.77 | +| canopy | 19.61 | 24.33 | +| washer | 68.14 | 72.47 | +| plaything | 25.39 | 32.56 | +| swimming pool | 51.7 | 74.79 | +| stool | 52.44 | 66.23 | +| barrel | 64.14 | 78.26 | +| basket | 31.96 | 51.72 | +| waterfall | 56.52 | 75.03 | +| tent | 72.13 | 94.65 | +| bag | 21.5 | 32.4 | +| minibike | 73.34 | 86.05 | +| cradle | 70.32 | 96.13 | +| oven | 47.19 | 60.67 | +| ball | 54.37 | 71.75 | +| food | 52.55 | 58.1 | +| step | 16.68 | 27.61 | +| tank | 36.14 | 44.98 | +| trade name | 32.73 | 45.75 | +| microwave | 79.73 | 85.36 | +| pot | 52.45 | 62.11 | +| animal | 59.36 | 62.23 | +| bicycle | 57.04 | 72.74 | +| lake | 60.93 | 63.27 | +| dishwasher | 63.06 | 77.36 | +| screen | 56.91 | 81.97 | +| blanket | 20.15 | 24.07 | +| sculpture | 57.27 | 68.8 | +| hood | 59.84 | 68.54 | +| sconce | 43.81 | 51.95 | +| vase | 44.59 | 60.96 | +| traffic light | 40.47 | 56.12 | +| tray | 7.59 | 12.25 | +| ashcan | 45.57 | 65.97 | +| fan | 60.6 | 72.14 | +| pier | 31.05 | 48.81 | +| crt screen | 14.49 | 20.3 | +| plate | 54.91 | 75.41 | +| monitor | 8.11 | 10.53 | +| bulletin board | 43.85 | 51.09 | +| shower | 6.12 | 8.77 | +| radiator | 57.3 | 62.25 | +| glass | 20.63 | 22.95 | +| clock | 27.61 | 34.3 | +| flag | 45.29 | 54.08 | ++---------------------+-------+-------+ +2024/01/09 16:48:30 - mmengine - INFO - Iter(val) [209/209] coco/bbox_mAP: 0.5060 coco/bbox_mAP_50: 0.6840 coco/bbox_mAP_75: 0.5560 coco/bbox_mAP_s: 0.3500 coco/bbox_mAP_m: 0.5540 coco/bbox_mAP_l: 0.6350 coco/segm_mAP: 0.3410 coco/segm_mAP_50: 0.6040 coco/segm_mAP_75: 0.3370 coco/segm_mAP_s: 0.1980 coco/segm_mAP_m: 0.3860 coco/segm_mAP_l: 0.5130 Bleu_1: 0.7590 Bleu_2: 0.5945 Bleu_3: 0.4531 Bleu_4: 0.3428 METEOR: 0.2727 ROUGE_L: 0.5593 CIDEr: 1.1071 SPICE: 0.2037 aAcc: 83.6200 mIoU: 50.2400 mAcc: 62.4500 visual-grounding/miou: 0.8161 visual-grounding/acc: 0.8798 data_time: 0.0103 time: 1.3561 +2024/01/09 17:00:44 - mmengine - INFO - Iter(train) [440500/640000] base_lr: 4.5797e-05 lr: 5.9816e-06 eta: 3 days, 14:44:20 time: 1.5656 data_time: 0.0209 memory: 25718 grad_norm: 3.4130 loss: 1.1741 detection_loss_cls: 0.0284 detection_loss_reg: 0.3268 caption_loss_cls: 2.0454 grounding_loss_reg: 2.3062 semantic_segmentation_loss_cls: 0.0072 instance_segmentation_loss_cls: 0.0269 instance_segmentation_loss_reg: 0.3225 instance_segmentation_loss_poly: 0.8537 +2024/01/09 17:14:13 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240109_143717 +2024/01/09 17:14:13 - mmengine - INFO - Iter(train) [441000/640000] base_lr: 4.5596e-05 lr: 5.9632e-06 eta: 3 days, 14:48:54 time: 1.5687 data_time: 0.0211 memory: 25718 grad_norm: 3.3613 loss: 1.1612 detection_loss_cls: 0.0282 detection_loss_reg: 0.3249 caption_loss_cls: 2.0435 grounding_loss_reg: 2.3034 semantic_segmentation_loss_cls: 0.0072 instance_segmentation_loss_cls: 0.0268 instance_segmentation_loss_reg: 0.3218 instance_segmentation_loss_poly: 0.8513 +2024/01/09 17:27:14 - mmengine - INFO - Iter(train) [441500/640000] base_lr: 4.5394e-05 lr: 5.9449e-06 eta: 3 days, 14:32:52 time: 1.5693 data_time: 0.0214 memory: 25718 grad_norm: 3.3088 loss: 1.1636 detection_loss_cls: 0.0282 detection_loss_reg: 0.3240 caption_loss_cls: 2.0406 grounding_loss_reg: 2.3024 semantic_segmentation_loss_cls: 0.0072 instance_segmentation_loss_cls: 0.0267 instance_segmentation_loss_reg: 0.3199 instance_segmentation_loss_poly: 0.8482 +2024/01/09 17:40:11 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240109_143717 +2024/01/09 17:40:11 - mmengine - INFO - Iter(train) [442000/640000] base_lr: 4.5193e-05 lr: 5.9267e-06 eta: 3 days, 14:15:35 time: 1.5683 data_time: 0.0216 memory: 25718 grad_norm: 3.3420 loss: 1.1669 detection_loss_cls: 0.0281 detection_loss_reg: 0.3234 caption_loss_cls: 2.0434 grounding_loss_reg: 2.2995 semantic_segmentation_loss_cls: 0.0072 instance_segmentation_loss_cls: 0.0267 instance_segmentation_loss_reg: 0.3195 instance_segmentation_loss_poly: 0.8476 +2024/01/09 17:40:11 - mmengine - INFO - Saving checkpoint at 442000 iterations +2024/01/09 17:52:58 - mmengine - INFO - Iter(train) [442500/640000] base_lr: 4.4993e-05 lr: 5.9085e-06 eta: 3 days, 13:53:30 time: 1.5559 data_time: 0.0221 memory: 25718 grad_norm: 3.3387 loss: 1.1617 detection_loss_cls: 0.0282 detection_loss_reg: 0.3239 caption_loss_cls: 2.0400 grounding_loss_reg: 2.2998 semantic_segmentation_loss_cls: 0.0073 instance_segmentation_loss_cls: 0.0267 instance_segmentation_loss_reg: 0.3194 instance_segmentation_loss_poly: 0.8479 +2024/01/09 18:05:48 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240109_143717 +2024/01/09 18:05:48 - mmengine - INFO - Iter(train) [443000/640000] base_lr: 4.4793e-05 lr: 5.8903e-06 eta: 3 days, 13:34:22 time: 1.5529 data_time: 0.0222 memory: 25718 grad_norm: 3.3764 loss: 1.1591 detection_loss_cls: 0.0282 detection_loss_reg: 0.3244 caption_loss_cls: 2.0370 grounding_loss_reg: 2.2982 semantic_segmentation_loss_cls: 0.0073 instance_segmentation_loss_cls: 0.0267 instance_segmentation_loss_reg: 0.3195 instance_segmentation_loss_poly: 0.8486 +2024/01/09 18:18:56 - mmengine - INFO - Iter(train) [443500/640000] base_lr: 4.4593e-05 lr: 5.8721e-06 eta: 3 days, 13:23:30 time: 1.5561 data_time: 0.0226 memory: 25718 grad_norm: 3.3650 loss: 1.1663 detection_loss_cls: 0.0283 detection_loss_reg: 0.3266 caption_loss_cls: 2.0387 grounding_loss_reg: 2.2973 semantic_segmentation_loss_cls: 0.0073 instance_segmentation_loss_cls: 0.0268 instance_segmentation_loss_reg: 0.3206 instance_segmentation_loss_poly: 0.8506 +2024/01/09 18:31:57 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240109_143717 +2024/01/09 18:31:57 - mmengine - INFO - Iter(train) [444000/640000] base_lr: 4.4393e-05 lr: 5.8539e-06 eta: 3 days, 13:10:03 time: 1.5516 data_time: 0.0229 memory: 25718 grad_norm: 3.4542 loss: 1.1778 detection_loss_cls: 0.0284 detection_loss_reg: 0.3272 caption_loss_cls: 2.0355 grounding_loss_reg: 2.2947 semantic_segmentation_loss_cls: 0.0073 instance_segmentation_loss_cls: 0.0268 instance_segmentation_loss_reg: 0.3213 instance_segmentation_loss_poly: 0.8525 +2024/01/09 18:31:57 - mmengine - INFO - Saving checkpoint at 444000 iterations +2024/01/09 18:45:08 - mmengine - INFO - Iter(train) [444500/640000] base_lr: 4.4194e-05 lr: 5.8358e-06 eta: 3 days, 13:00:08 time: 1.5653 data_time: 0.0271 memory: 25718 grad_norm: 3.4091 loss: 1.1654 detection_loss_cls: 0.0285 detection_loss_reg: 0.3264 caption_loss_cls: 2.0355 grounding_loss_reg: 2.2922 semantic_segmentation_loss_cls: 0.0073 instance_segmentation_loss_cls: 0.0267 instance_segmentation_loss_reg: 0.3208 instance_segmentation_loss_poly: 0.8520 +2024/01/09 18:58:01 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240109_143717 +2024/01/09 18:58:01 - mmengine - INFO - Iter(train) [445000/640000] base_lr: 4.3995e-05 lr: 5.8178e-06 eta: 3 days, 12:43:34 time: 1.5562 data_time: 0.0269 memory: 25718 grad_norm: 3.5053 loss: 1.1742 detection_loss_cls: 0.0283 detection_loss_reg: 0.3260 caption_loss_cls: 2.0359 grounding_loss_reg: 2.2895 semantic_segmentation_loss_cls: 0.0073 instance_segmentation_loss_cls: 0.0267 instance_segmentation_loss_reg: 0.3204 instance_segmentation_loss_poly: 0.8523 +2024/01/09 19:11:54 - mmengine - INFO - Iter(train) [445500/640000] base_lr: 4.3797e-05 lr: 5.7997e-06 eta: 3 days, 12:47:33 time: 1.5691 data_time: 0.0272 memory: 25718 grad_norm: 3.4482 loss: 1.1661 detection_loss_cls: 0.0283 detection_loss_reg: 0.3255 caption_loss_cls: 2.0340 grounding_loss_reg: 2.2869 semantic_segmentation_loss_cls: 0.0073 instance_segmentation_loss_cls: 0.0267 instance_segmentation_loss_reg: 0.3199 instance_segmentation_loss_poly: 0.8519 +2024/01/09 19:24:49 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240109_143717 +2024/01/09 19:24:49 - mmengine - INFO - Iter(train) [446000/640000] base_lr: 4.3599e-05 lr: 5.7817e-06 eta: 3 days, 12:31:21 time: 1.5686 data_time: 0.0273 memory: 25718 grad_norm: 3.4256 loss: 1.1689 detection_loss_cls: 0.0282 detection_loss_reg: 0.3257 caption_loss_cls: 2.0345 grounding_loss_reg: 2.2865 semantic_segmentation_loss_cls: 0.0073 instance_segmentation_loss_cls: 0.0266 instance_segmentation_loss_reg: 0.3193 instance_segmentation_loss_poly: 0.8509 +2024/01/09 19:24:49 - mmengine - INFO - Saving checkpoint at 446000 iterations +2024/01/09 19:38:39 - mmengine - INFO - Iter(train) [446500/640000] base_lr: 4.3401e-05 lr: 5.7637e-06 eta: 3 days, 12:32:14 time: 1.5844 data_time: 0.0271 memory: 25718 grad_norm: 3.3872 loss: 1.1523 detection_loss_cls: 0.0282 detection_loss_reg: 0.3246 caption_loss_cls: 2.0355 grounding_loss_reg: 2.2847 semantic_segmentation_loss_cls: 0.0072 instance_segmentation_loss_cls: 0.0266 instance_segmentation_loss_reg: 0.3194 instance_segmentation_loss_poly: 0.8509 +2024/01/09 19:52:05 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240109_143717 +2024/01/09 19:52:05 - mmengine - INFO - Iter(train) [447000/640000] base_lr: 4.3204e-05 lr: 5.7458e-06 eta: 3 days, 12:24:50 time: 1.5934 data_time: 0.0274 memory: 25718 grad_norm: 3.3117 loss: 1.1476 detection_loss_cls: 0.0282 detection_loss_reg: 0.3256 caption_loss_cls: 2.0335 grounding_loss_reg: 2.2824 semantic_segmentation_loss_cls: 0.0072 instance_segmentation_loss_cls: 0.0266 instance_segmentation_loss_reg: 0.3193 instance_segmentation_loss_poly: 0.8513 +2024/01/09 20:05:04 - mmengine - INFO - Iter(train) [447500/640000] base_lr: 4.3006e-05 lr: 5.7279e-06 eta: 3 days, 12:09:16 time: 1.5914 data_time: 0.0272 memory: 25718 grad_norm: 3.2931 loss: 1.1386 detection_loss_cls: 0.0282 detection_loss_reg: 0.3247 caption_loss_cls: 2.0328 grounding_loss_reg: 2.2808 semantic_segmentation_loss_cls: 0.0073 instance_segmentation_loss_cls: 0.0266 instance_segmentation_loss_reg: 0.3190 instance_segmentation_loss_poly: 0.8506 +2024/01/09 20:17:11 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240109_143717 +2024/01/09 20:17:11 - mmengine - INFO - Iter(train) [448000/640000] base_lr: 4.2810e-05 lr: 5.7100e-06 eta: 3 days, 11:39:55 time: 1.5776 data_time: 0.0269 memory: 25718 grad_norm: 3.2515 loss: 1.1323 detection_loss_cls: 0.0282 detection_loss_reg: 0.3237 caption_loss_cls: 2.0263 grounding_loss_reg: 2.2802 semantic_segmentation_loss_cls: 0.0073 instance_segmentation_loss_cls: 0.0266 instance_segmentation_loss_reg: 0.3192 instance_segmentation_loss_poly: 0.8516 +2024/01/09 20:17:11 - mmengine - INFO - Saving checkpoint at 448000 iterations +2024/01/09 20:30:39 - mmengine - INFO - Iter(train) [448500/640000] base_lr: 4.2613e-05 lr: 5.6921e-06 eta: 3 days, 11:32:56 time: 1.5821 data_time: 0.0271 memory: 25718 grad_norm: 3.2459 loss: 1.1330 detection_loss_cls: 0.0281 detection_loss_reg: 0.3228 caption_loss_cls: 2.0209 grounding_loss_reg: 2.2776 semantic_segmentation_loss_cls: 0.0073 instance_segmentation_loss_cls: 0.0265 instance_segmentation_loss_reg: 0.3184 instance_segmentation_loss_poly: 0.8504 +2024/01/09 20:43:03 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240109_143717 +2024/01/09 20:43:03 - mmengine - INFO - Iter(train) [449000/640000] base_lr: 4.2417e-05 lr: 5.6743e-06 eta: 3 days, 11:09:25 time: 1.5745 data_time: 0.0270 memory: 25718 grad_norm: 3.1978 loss: 1.1363 detection_loss_cls: 0.0281 detection_loss_reg: 0.3232 caption_loss_cls: 2.0218 grounding_loss_reg: 2.2719 semantic_segmentation_loss_cls: 0.0073 instance_segmentation_loss_cls: 0.0264 instance_segmentation_loss_reg: 0.3181 instance_segmentation_loss_poly: 0.8501 +2024/01/09 20:55:57 - mmengine - INFO - Iter(train) [449500/640000] base_lr: 4.2222e-05 lr: 5.6565e-06 eta: 3 days, 10:54:09 time: 1.5601 data_time: 0.0269 memory: 25718 grad_norm: 3.2831 loss: 1.1525 detection_loss_cls: 0.0280 detection_loss_reg: 0.3227 caption_loss_cls: 2.0223 grounding_loss_reg: 2.2721 semantic_segmentation_loss_cls: 0.0072 instance_segmentation_loss_cls: 0.0264 instance_segmentation_loss_reg: 0.3176 instance_segmentation_loss_poly: 0.8493 +2024/01/09 21:09:14 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240109_143717 +2024/01/09 21:09:14 - mmengine - INFO - Iter(train) [450000/640000] base_lr: 4.2026e-05 lr: 5.6387e-06 eta: 3 days, 10:43:58 time: 1.5653 data_time: 0.0270 memory: 25718 grad_norm: 3.2893 loss: 1.1450 detection_loss_cls: 0.0280 detection_loss_reg: 0.3219 caption_loss_cls: 2.0199 grounding_loss_reg: 2.2682 semantic_segmentation_loss_cls: 0.0072 instance_segmentation_loss_cls: 0.0261 instance_segmentation_loss_reg: 0.3152 instance_segmentation_loss_poly: 0.8443 +2024/01/09 21:09:14 - mmengine - INFO - Saving checkpoint at 450000 iterations +2024/01/09 21:22:15 - mmengine - INFO - Iter(train) [450500/640000] base_lr: 4.1831e-05 lr: 5.6210e-06 eta: 3 days, 10:30:15 time: 1.5531 data_time: 0.0269 memory: 25718 grad_norm: 3.3412 loss: 1.1643 detection_loss_cls: 0.0279 detection_loss_reg: 0.3222 caption_loss_cls: 2.0138 grounding_loss_reg: 2.2669 semantic_segmentation_loss_cls: 0.0072 instance_segmentation_loss_cls: 0.0261 instance_segmentation_loss_reg: 0.3143 instance_segmentation_loss_poly: 0.8414 +2024/01/09 21:35:05 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240109_143717 +2024/01/09 21:35:05 - mmengine - INFO - Iter(train) [451000/640000] base_lr: 4.1637e-05 lr: 5.6033e-06 eta: 3 days, 10:14:12 time: 1.5440 data_time: 0.0268 memory: 25718 grad_norm: 3.3646 loss: 1.1677 detection_loss_cls: 0.0278 detection_loss_reg: 0.3217 caption_loss_cls: 2.0115 grounding_loss_reg: 2.2659 semantic_segmentation_loss_cls: 0.0072 instance_segmentation_loss_cls: 0.0261 instance_segmentation_loss_reg: 0.3144 instance_segmentation_loss_poly: 0.8401 +2024/01/09 21:48:10 - mmengine - INFO - Iter(train) [451500/640000] base_lr: 4.1442e-05 lr: 5.5857e-06 eta: 3 days, 10:01:30 time: 1.5456 data_time: 0.0269 memory: 25718 grad_norm: 3.4020 loss: 1.1698 detection_loss_cls: 0.0277 detection_loss_reg: 0.3221 caption_loss_cls: 2.0133 grounding_loss_reg: 2.2634 semantic_segmentation_loss_cls: 0.0072 instance_segmentation_loss_cls: 0.0260 instance_segmentation_loss_reg: 0.3142 instance_segmentation_loss_poly: 0.8394 +2024/01/09 22:01:11 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240109_143717 +2024/01/09 22:01:11 - mmengine - INFO - Iter(train) [452000/640000] base_lr: 4.1248e-05 lr: 5.5680e-06 eta: 3 days, 9:47:59 time: 1.5593 data_time: 0.0270 memory: 25718 grad_norm: 3.3764 loss: 1.1678 detection_loss_cls: 0.0277 detection_loss_reg: 0.3225 caption_loss_cls: 2.0158 grounding_loss_reg: 2.2591 semantic_segmentation_loss_cls: 0.0072 instance_segmentation_loss_cls: 0.0259 instance_segmentation_loss_reg: 0.3135 instance_segmentation_loss_poly: 0.8386 +2024/01/09 22:01:11 - mmengine - INFO - Saving checkpoint at 452000 iterations +2024/01/09 22:14:14 - mmengine - INFO - Iter(train) [452500/640000] base_lr: 4.1055e-05 lr: 5.5504e-06 eta: 3 days, 9:34:46 time: 1.5529 data_time: 0.0268 memory: 25718 grad_norm: 3.3585 loss: 1.1674 detection_loss_cls: 0.0276 detection_loss_reg: 0.3217 caption_loss_cls: 2.0154 grounding_loss_reg: 2.2586 semantic_segmentation_loss_cls: 0.0072 instance_segmentation_loss_cls: 0.0260 instance_segmentation_loss_reg: 0.3143 instance_segmentation_loss_poly: 0.8408 +2024/01/09 22:28:05 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240109_143717 +2024/01/09 22:28:05 - mmengine - INFO - Iter(train) [453000/640000] base_lr: 4.0862e-05 lr: 5.5329e-06 eta: 3 days, 9:30:28 time: 1.5749 data_time: 0.0272 memory: 25718 grad_norm: 3.3070 loss: 1.1553 detection_loss_cls: 0.0275 detection_loss_reg: 0.3204 caption_loss_cls: 2.0190 grounding_loss_reg: 2.2550 semantic_segmentation_loss_cls: 0.0072 instance_segmentation_loss_cls: 0.0258 instance_segmentation_loss_reg: 0.3131 instance_segmentation_loss_poly: 0.8371 +2024/01/09 22:41:12 - mmengine - INFO - Iter(train) [453500/640000] base_lr: 4.0669e-05 lr: 5.5153e-06 eta: 3 days, 9:17:39 time: 1.5778 data_time: 0.0272 memory: 25718 grad_norm: 3.2888 loss: 1.1550 detection_loss_cls: 0.0274 detection_loss_reg: 0.3201 caption_loss_cls: 2.0221 grounding_loss_reg: 2.2515 semantic_segmentation_loss_cls: 0.0072 instance_segmentation_loss_cls: 0.0258 instance_segmentation_loss_reg: 0.3126 instance_segmentation_loss_poly: 0.8351 +2024/01/09 22:53:48 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240109_143717 +2024/01/09 22:53:48 - mmengine - INFO - Iter(train) [454000/640000] base_lr: 4.0476e-05 lr: 5.4978e-06 eta: 3 days, 8:59:34 time: 1.5677 data_time: 0.0271 memory: 25718 grad_norm: 3.2657 loss: 1.1610 detection_loss_cls: 0.0274 detection_loss_reg: 0.3190 caption_loss_cls: 2.0178 grounding_loss_reg: 2.2504 semantic_segmentation_loss_cls: 0.0072 instance_segmentation_loss_cls: 0.0259 instance_segmentation_loss_reg: 0.3129 instance_segmentation_loss_poly: 0.8352 +2024/01/09 22:53:48 - mmengine - INFO - Saving checkpoint at 454000 iterations +2024/01/09 23:06:37 - mmengine - INFO - Iter(train) [454500/640000] base_lr: 4.0284e-05 lr: 5.4804e-06 eta: 3 days, 8:43:55 time: 1.5646 data_time: 0.0272 memory: 25718 grad_norm: 3.2726 loss: 1.1659 detection_loss_cls: 0.0274 detection_loss_reg: 0.3199 caption_loss_cls: 2.0182 grounding_loss_reg: 2.2490 semantic_segmentation_loss_cls: 0.0072 instance_segmentation_loss_cls: 0.0258 instance_segmentation_loss_reg: 0.3124 instance_segmentation_loss_poly: 0.8337 +2024/01/09 23:20:14 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240109_143717 +2024/01/09 23:20:14 - mmengine - INFO - Iter(train) [455000/640000] base_lr: 4.0092e-05 lr: 5.4630e-06 eta: 3 days, 8:36:23 time: 1.5766 data_time: 0.0274 memory: 25718 grad_norm: 3.2730 loss: 1.1678 detection_loss_cls: 0.0274 detection_loss_reg: 0.3197 caption_loss_cls: 2.0168 grounding_loss_reg: 2.2483 semantic_segmentation_loss_cls: 0.0072 instance_segmentation_loss_cls: 0.0259 instance_segmentation_loss_reg: 0.3137 instance_segmentation_loss_poly: 0.8368 +2024/01/09 23:34:14 - mmengine - INFO - Iter(train) [455500/640000] base_lr: 3.9901e-05 lr: 5.4456e-06 eta: 3 days, 8:31:58 time: 1.5901 data_time: 0.0277 memory: 25718 grad_norm: 3.1986 loss: 1.1643 detection_loss_cls: 0.0275 detection_loss_reg: 0.3201 caption_loss_cls: 2.0184 grounding_loss_reg: 2.2456 semantic_segmentation_loss_cls: 0.0071 instance_segmentation_loss_cls: 0.0259 instance_segmentation_loss_reg: 0.3144 instance_segmentation_loss_poly: 0.8378 +2024/01/09 23:47:20 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240109_143717 +2024/01/09 23:47:20 - mmengine - INFO - Iter(train) [456000/640000] base_lr: 3.9710e-05 lr: 5.4282e-06 eta: 3 days, 8:18:55 time: 1.5914 data_time: 0.0276 memory: 25718 grad_norm: 3.2160 loss: 1.1645 detection_loss_cls: 0.0273 detection_loss_reg: 0.3188 caption_loss_cls: 2.0210 grounding_loss_reg: 2.2452 semantic_segmentation_loss_cls: 0.0071 instance_segmentation_loss_cls: 0.0257 instance_segmentation_loss_reg: 0.3128 instance_segmentation_loss_poly: 0.8344 +2024/01/09 23:47:20 - mmengine - INFO - Saving checkpoint at 456000 iterations +2024/01/10 00:01:07 - mmengine - INFO - Iter(train) [456500/640000] base_lr: 3.9519e-05 lr: 5.4109e-06 eta: 3 days, 8:11:53 time: 1.6024 data_time: 0.0277 memory: 25718 grad_norm: 3.2001 loss: 1.1645 detection_loss_cls: 0.0274 detection_loss_reg: 0.3192 caption_loss_cls: 2.0198 grounding_loss_reg: 2.2441 semantic_segmentation_loss_cls: 0.0071 instance_segmentation_loss_cls: 0.0259 instance_segmentation_loss_reg: 0.3134 instance_segmentation_loss_poly: 0.8349 +2024/01/10 00:13:56 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240109_143717 +2024/01/10 00:13:56 - mmengine - INFO - Iter(train) [457000/640000] base_lr: 3.9329e-05 lr: 5.3936e-06 eta: 3 days, 7:56:08 time: 1.5868 data_time: 0.0272 memory: 25718 grad_norm: 3.2422 loss: 1.1728 detection_loss_cls: 0.0274 detection_loss_reg: 0.3192 caption_loss_cls: 2.0148 grounding_loss_reg: 2.2444 semantic_segmentation_loss_cls: 0.0071 instance_segmentation_loss_cls: 0.0258 instance_segmentation_loss_reg: 0.3130 instance_segmentation_loss_poly: 0.8330 +2024/01/10 00:27:14 - mmengine - INFO - Iter(train) [457500/640000] base_lr: 3.9139e-05 lr: 5.3763e-06 eta: 3 days, 7:44:39 time: 1.5898 data_time: 0.0272 memory: 25718 grad_norm: 3.2170 loss: 1.1676 detection_loss_cls: 0.0275 detection_loss_reg: 0.3200 caption_loss_cls: 2.0125 grounding_loss_reg: 2.2453 semantic_segmentation_loss_cls: 0.0071 instance_segmentation_loss_cls: 0.0258 instance_segmentation_loss_reg: 0.3132 instance_segmentation_loss_poly: 0.8338 +2024/01/10 00:40:55 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240109_143717 +2024/01/10 00:40:55 - mmengine - INFO - Iter(train) [458000/640000] base_lr: 3.8950e-05 lr: 5.3591e-06 eta: 3 days, 7:36:15 time: 1.6060 data_time: 0.0272 memory: 25718 grad_norm: 3.1919 loss: 1.1567 detection_loss_cls: 0.0275 detection_loss_reg: 0.3200 caption_loss_cls: 2.0141 grounding_loss_reg: 2.2479 semantic_segmentation_loss_cls: 0.0071 instance_segmentation_loss_cls: 0.0259 instance_segmentation_loss_reg: 0.3128 instance_segmentation_loss_poly: 0.8322 +2024/01/10 00:40:55 - mmengine - INFO - Saving checkpoint at 458000 iterations +2024/01/10 00:54:18 - mmengine - INFO - Iter(train) [458500/640000] base_lr: 3.8761e-05 lr: 5.3419e-06 eta: 3 days, 7:25:12 time: 1.6146 data_time: 0.0265 memory: 25718 grad_norm: 3.2389 loss: 1.1511 detection_loss_cls: 0.0275 detection_loss_reg: 0.3202 caption_loss_cls: 2.0164 grounding_loss_reg: 2.2452 semantic_segmentation_loss_cls: 0.0071 instance_segmentation_loss_cls: 0.0260 instance_segmentation_loss_reg: 0.3139 instance_segmentation_loss_poly: 0.8334 +2024/01/10 01:07:01 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240109_143717 +2024/01/10 01:07:01 - mmengine - INFO - Iter(train) [459000/640000] base_lr: 3.8572e-05 lr: 5.3247e-06 eta: 3 days, 7:08:45 time: 1.6009 data_time: 0.0261 memory: 25718 grad_norm: 3.2238 loss: 1.1484 detection_loss_cls: 0.0274 detection_loss_reg: 0.3189 caption_loss_cls: 2.0170 grounding_loss_reg: 2.2453 semantic_segmentation_loss_cls: 0.0071 instance_segmentation_loss_cls: 0.0260 instance_segmentation_loss_reg: 0.3137 instance_segmentation_loss_poly: 0.8329 +2024/01/10 01:19:43 - mmengine - INFO - Iter(train) [459500/640000] base_lr: 3.8383e-05 lr: 5.3076e-06 eta: 3 days, 6:52:25 time: 1.5816 data_time: 0.0255 memory: 25718 grad_norm: 3.2737 loss: 1.1476 detection_loss_cls: 0.0275 detection_loss_reg: 0.3192 caption_loss_cls: 2.0163 grounding_loss_reg: 2.2455 semantic_segmentation_loss_cls: 0.0071 instance_segmentation_loss_cls: 0.0259 instance_segmentation_loss_reg: 0.3135 instance_segmentation_loss_poly: 0.8317 +2024/01/10 01:32:04 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240109_143717 +2024/01/10 01:32:04 - mmengine - INFO - Iter(train) [460000/640000] base_lr: 3.8195e-05 lr: 5.2905e-06 eta: 3 days, 6:33:32 time: 1.5702 data_time: 0.0252 memory: 25718 grad_norm: 3.2838 loss: 1.1503 detection_loss_cls: 0.0274 detection_loss_reg: 0.3193 caption_loss_cls: 2.0209 grounding_loss_reg: 2.2445 semantic_segmentation_loss_cls: 0.0071 instance_segmentation_loss_cls: 0.0258 instance_segmentation_loss_reg: 0.3124 instance_segmentation_loss_poly: 0.8289 +2024/01/10 01:32:04 - mmengine - INFO - Saving checkpoint at 460000 iterations +2024/01/10 01:44:23 - mmengine - INFO - Evaluating bbox... +2024/01/10 01:45:19 - mmengine - INFO - bbox_mAP_copypaste: 0.508 0.688 0.556 0.352 0.558 0.650 +2024/01/10 01:45:19 - mmengine - INFO - Evaluating segm... +2024/01/10 01:46:31 - mmengine - INFO - segm_mAP_copypaste: 0.347 0.612 0.345 0.201 0.395 0.522 +2024/01/10 01:53:40 - mmengine - INFO - per class results: +2024/01/10 01:53:40 - mmengine - INFO - ++---------------------+-------+-------+ +| Class | IoU | Acc | ++---------------------+-------+-------+ +| wall | 78.76 | 90.17 | +| building | 83.61 | 92.14 | +| sky | 93.11 | 97.73 | +| floor | 82.39 | 91.19 | +| tree | 73.94 | 86.73 | +| ceiling | 85.55 | 94.13 | +| road | 83.59 | 90.15 | +| bed | 90.57 | 95.88 | +| windowpane | 63.98 | 77.74 | +| grass | 64.72 | 83.85 | +| cabinet | 63.48 | 76.11 | +| sidewalk | 66.84 | 80.78 | +| person | 80.55 | 91.3 | +| earth | 39.65 | 50.55 | +| door | 55.39 | 68.18 | +| table | 64.68 | 78.37 | +| mountain | 63.58 | 75.84 | +| plant | 50.58 | 59.06 | +| curtain | 75.06 | 86.18 | +| chair | 61.08 | 74.14 | +| car | 84.88 | 92.0 | +| water | 57.33 | 73.69 | +| painting | 70.11 | 87.7 | +| sofa | 71.61 | 86.07 | +| shelf | 44.05 | 60.71 | +| house | 50.55 | 66.54 | +| sea | 55.12 | 72.67 | +| mirror | 68.62 | 76.33 | +| rug | 65.83 | 75.87 | +| field | 30.35 | 48.48 | +| armchair | 50.61 | 67.07 | +| seat | 62.12 | 79.15 | +| fence | 43.86 | 59.66 | +| desk | 47.4 | 75.01 | +| rock | 52.1 | 82.35 | +| wardrobe | 46.2 | 59.48 | +| lamp | 62.7 | 74.47 | +| bathtub | 79.69 | 82.64 | +| railing | 37.12 | 52.47 | +| cushion | 60.11 | 72.74 | +| base | 27.74 | 36.46 | +| box | 27.18 | 34.92 | +| column | 52.4 | 63.62 | +| signboard | 37.83 | 49.53 | +| chest of drawers | 41.57 | 61.3 | +| counter | 27.27 | 36.47 | +| sand | 47.78 | 68.18 | +| sink | 74.85 | 83.07 | +| skyscraper | 66.19 | 82.78 | +| fireplace | 74.51 | 90.3 | +| refrigerator | 73.56 | 78.8 | +| grandstand | 38.87 | 77.28 | +| path | 24.01 | 38.54 | +| stairs | 27.09 | 32.12 | +| runway | 75.62 | 91.61 | +| case | 51.79 | 71.17 | +| pool table | 90.98 | 95.67 | +| pillow | 57.7 | 67.87 | +| screen door | 78.33 | 79.8 | +| stairway | 32.31 | 45.46 | +| river | 13.12 | 25.11 | +| bridge | 56.36 | 81.1 | +| bookcase | 38.63 | 59.83 | +| blind | 40.4 | 45.76 | +| coffee table | 68.2 | 80.54 | +| toilet | 86.85 | 91.22 | +| flower | 40.04 | 58.1 | +| book | 51.08 | 68.55 | +| hill | 14.1 | 19.02 | +| bench | 56.88 | 62.86 | +| countertop | 57.84 | 73.86 | +| stove | 75.71 | 83.35 | +| palm | 47.16 | 73.57 | +| kitchen island | 38.42 | 75.93 | +| computer | 71.24 | 80.77 | +| swivel chair | 38.82 | 51.69 | +| boat | 68.77 | 72.99 | +| bar | 33.37 | 44.23 | +| arcade machine | 54.46 | 59.81 | +| hovel | 28.52 | 36.07 | +| bus | 92.45 | 94.95 | +| towel | 66.06 | 79.77 | +| light | 52.41 | 62.45 | +| truck | 48.13 | 56.67 | +| tower | 28.76 | 49.29 | +| chandelier | 66.7 | 81.6 | +| awning | 35.32 | 43.12 | +| streetlight | 32.06 | 43.8 | +| booth | 34.22 | 38.33 | +| television receiver | 71.39 | 85.23 | +| airplane | 61.58 | 68.69 | +| dirt track | 11.92 | 17.6 | +| apparel | 31.29 | 38.88 | +| pole | 26.52 | 37.65 | +| land | 2.94 | 5.78 | +| bannister | 19.29 | 26.5 | +| escalator | 12.62 | 13.64 | +| ottoman | 55.64 | 71.24 | +| bottle | 23.59 | 30.88 | +| buffet | 42.24 | 51.55 | +| poster | 33.42 | 41.01 | +| stage | 10.1 | 16.45 | +| van | 44.3 | 58.5 | +| ship | 8.07 | 9.6 | +| fountain | 13.36 | 14.57 | +| conveyer belt | 72.91 | 90.99 | +| canopy | 20.85 | 23.99 | +| washer | 72.22 | 73.32 | +| plaything | 28.7 | 33.62 | +| swimming pool | 66.94 | 74.4 | +| stool | 49.33 | 60.76 | +| barrel | 28.49 | 32.24 | +| basket | 33.21 | 49.42 | +| waterfall | 54.79 | 81.55 | +| tent | 79.94 | 96.67 | +| bag | 18.28 | 24.96 | +| minibike | 70.84 | 84.31 | +| cradle | 74.95 | 95.04 | +| oven | 54.23 | 71.71 | +| ball | 51.29 | 70.46 | +| food | 46.92 | 51.31 | +| step | 7.63 | 9.3 | +| tank | 38.56 | 43.58 | +| trade name | 28.94 | 34.85 | +| microwave | 86.15 | 91.23 | +| pot | 52.5 | 64.01 | +| animal | 57.29 | 59.96 | +| bicycle | 58.33 | 75.71 | +| lake | 54.12 | 64.59 | +| dishwasher | 60.52 | 76.86 | +| screen | 51.05 | 71.34 | +| blanket | 13.97 | 16.24 | +| sculpture | 51.35 | 66.65 | +| hood | 62.57 | 67.92 | +| sconce | 45.43 | 56.41 | +| vase | 45.28 | 57.61 | +| traffic light | 39.53 | 60.43 | +| tray | 6.76 | 12.33 | +| ashcan | 47.03 | 58.82 | +| fan | 62.19 | 73.54 | +| pier | 29.25 | 37.44 | +| crt screen | 12.14 | 21.06 | +| plate | 57.43 | 72.46 | +| monitor | 51.25 | 71.28 | +| bulletin board | 33.96 | 47.81 | +| shower | 2.73 | 7.08 | +| radiator | 56.54 | 60.3 | +| glass | 18.65 | 20.33 | +| clock | 26.09 | 32.77 | +| flag | 25.42 | 29.47 | ++---------------------+-------+-------+ +2024/01/10 01:53:56 - mmengine - INFO - Iter(val) [209/209] coco/bbox_mAP: 0.5080 coco/bbox_mAP_50: 0.6880 coco/bbox_mAP_75: 0.5560 coco/bbox_mAP_s: 0.3520 coco/bbox_mAP_m: 0.5580 coco/bbox_mAP_l: 0.6500 coco/segm_mAP: 0.3470 coco/segm_mAP_50: 0.6120 coco/segm_mAP_75: 0.3450 coco/segm_mAP_s: 0.2010 coco/segm_mAP_m: 0.3950 coco/segm_mAP_l: 0.5220 Bleu_1: 0.7558 Bleu_2: 0.5932 Bleu_3: 0.4517 Bleu_4: 0.3407 METEOR: 0.2753 ROUGE_L: 0.5605 CIDEr: 1.1135 SPICE: 0.2023 aAcc: 83.9000 mIoU: 50.0000 mAcc: 61.5200 visual-grounding/miou: 0.8191 visual-grounding/acc: 0.8818 data_time: 0.0043 time: 1.3497 +2024/01/10 02:06:48 - mmengine - INFO - Iter(train) [460500/640000] base_lr: 3.8008e-05 lr: 5.2734e-06 eta: 3 days, 6:19:00 time: 1.5570 data_time: 0.0211 memory: 25718 grad_norm: 3.3446 loss: 1.1625 detection_loss_cls: 0.0273 detection_loss_reg: 0.3185 caption_loss_cls: 2.0211 grounding_loss_reg: 2.2442 semantic_segmentation_loss_cls: 0.0071 instance_segmentation_loss_cls: 0.0258 instance_segmentation_loss_reg: 0.3130 instance_segmentation_loss_poly: 0.8301 +2024/01/10 02:20:17 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240109_143717 +2024/01/10 02:20:17 - mmengine - INFO - Iter(train) [461000/640000] base_lr: 3.7821e-05 lr: 5.2564e-06 eta: 3 days, 6:08:37 time: 1.5669 data_time: 0.0212 memory: 25718 grad_norm: 3.3123 loss: 1.1570 detection_loss_cls: 0.0274 detection_loss_reg: 0.3191 caption_loss_cls: 2.0225 grounding_loss_reg: 2.2457 semantic_segmentation_loss_cls: 0.0071 instance_segmentation_loss_cls: 0.0257 instance_segmentation_loss_reg: 0.3120 instance_segmentation_loss_poly: 0.8276 +2024/01/10 02:33:47 - mmengine - INFO - Iter(train) [461500/640000] base_lr: 3.7634e-05 lr: 5.2394e-06 eta: 3 days, 5:58:22 time: 1.5700 data_time: 0.0211 memory: 25718 grad_norm: 3.2842 loss: 1.1451 detection_loss_cls: 0.0273 detection_loss_reg: 0.3186 caption_loss_cls: 2.0184 grounding_loss_reg: 2.2448 semantic_segmentation_loss_cls: 0.0071 instance_segmentation_loss_cls: 0.0257 instance_segmentation_loss_reg: 0.3119 instance_segmentation_loss_poly: 0.8275 +2024/01/10 02:47:16 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240109_143717 +2024/01/10 02:47:16 - mmengine - INFO - Iter(train) [462000/640000] base_lr: 3.7447e-05 lr: 5.2225e-06 eta: 3 days, 5:47:42 time: 1.5668 data_time: 0.0211 memory: 25718 grad_norm: 3.2980 loss: 1.1505 detection_loss_cls: 0.0272 detection_loss_reg: 0.3187 caption_loss_cls: 2.0193 grounding_loss_reg: 2.2446 semantic_segmentation_loss_cls: 0.0071 instance_segmentation_loss_cls: 0.0258 instance_segmentation_loss_reg: 0.3129 instance_segmentation_loss_poly: 0.8288 +2024/01/10 02:47:16 - mmengine - INFO - Saving checkpoint at 462000 iterations +2024/01/10 03:01:04 - mmengine - INFO - Iter(train) [462500/640000] base_lr: 3.7261e-05 lr: 5.2055e-06 eta: 3 days, 5:39:12 time: 1.5731 data_time: 0.0213 memory: 25718 grad_norm: 3.1806 loss: 1.1430 detection_loss_cls: 0.0274 detection_loss_reg: 0.3200 caption_loss_cls: 2.0214 grounding_loss_reg: 2.2437 semantic_segmentation_loss_cls: 0.0070 instance_segmentation_loss_cls: 0.0258 instance_segmentation_loss_reg: 0.3132 instance_segmentation_loss_poly: 0.8290 +2024/01/10 03:14:40 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240109_143717 +2024/01/10 03:14:40 - mmengine - INFO - Iter(train) [463000/640000] base_lr: 3.7075e-05 lr: 5.1887e-06 eta: 3 days, 5:29:11 time: 1.5865 data_time: 0.0216 memory: 25718 grad_norm: 3.1640 loss: 1.1421 detection_loss_cls: 0.0275 detection_loss_reg: 0.3211 caption_loss_cls: 2.0207 grounding_loss_reg: 2.2416 semantic_segmentation_loss_cls: 0.0070 instance_segmentation_loss_cls: 0.0259 instance_segmentation_loss_reg: 0.3147 instance_segmentation_loss_poly: 0.8314 +2024/01/10 03:28:54 - mmengine - INFO - Iter(train) [463500/640000] base_lr: 3.6890e-05 lr: 5.1718e-06 eta: 3 days, 5:23:02 time: 1.6093 data_time: 0.0220 memory: 25718 grad_norm: 3.1295 loss: 1.1342 detection_loss_cls: 0.0274 detection_loss_reg: 0.3198 caption_loss_cls: 2.0177 grounding_loss_reg: 2.2403 semantic_segmentation_loss_cls: 0.0070 instance_segmentation_loss_cls: 0.0259 instance_segmentation_loss_reg: 0.3133 instance_segmentation_loss_poly: 0.8302 +2024/01/10 03:41:40 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240109_143717 +2024/01/10 03:41:40 - mmengine - INFO - Iter(train) [464000/640000] base_lr: 3.6705e-05 lr: 5.1550e-06 eta: 3 days, 5:07:26 time: 1.6157 data_time: 0.0223 memory: 25718 grad_norm: 3.1153 loss: 1.1393 detection_loss_cls: 0.0274 detection_loss_reg: 0.3197 caption_loss_cls: 2.0202 grounding_loss_reg: 2.2408 semantic_segmentation_loss_cls: 0.0070 instance_segmentation_loss_cls: 0.0260 instance_segmentation_loss_reg: 0.3136 instance_segmentation_loss_poly: 0.8305 +2024/01/10 03:41:40 - mmengine - INFO - Saving checkpoint at 464000 iterations +2024/01/10 03:54:54 - mmengine - INFO - Iter(train) [464500/640000] base_lr: 3.6520e-05 lr: 5.1382e-06 eta: 3 days, 4:54:49 time: 1.6207 data_time: 0.0260 memory: 25718 grad_norm: 3.1169 loss: 1.1365 detection_loss_cls: 0.0273 detection_loss_reg: 0.3203 caption_loss_cls: 2.0221 grounding_loss_reg: 2.2409 semantic_segmentation_loss_cls: 0.0070 instance_segmentation_loss_cls: 0.0260 instance_segmentation_loss_reg: 0.3144 instance_segmentation_loss_poly: 0.8306 +2024/01/10 04:08:12 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240109_143717 +2024/01/10 04:08:12 - mmengine - INFO - Iter(train) [465000/640000] base_lr: 3.6336e-05 lr: 5.1215e-06 eta: 3 days, 4:42:32 time: 1.6181 data_time: 0.0261 memory: 25718 grad_norm: 3.1309 loss: 1.1416 detection_loss_cls: 0.0273 detection_loss_reg: 0.3205 caption_loss_cls: 2.0195 grounding_loss_reg: 2.2443 semantic_segmentation_loss_cls: 0.0070 instance_segmentation_loss_cls: 0.0260 instance_segmentation_loss_reg: 0.3148 instance_segmentation_loss_poly: 0.8300 +2024/01/10 04:21:01 - mmengine - INFO - Iter(train) [465500/640000] base_lr: 3.6152e-05 lr: 5.1048e-06 eta: 3 days, 4:27:22 time: 1.6076 data_time: 0.0260 memory: 25718 grad_norm: 3.1810 loss: 1.1603 detection_loss_cls: 0.0273 detection_loss_reg: 0.3206 caption_loss_cls: 2.0198 grounding_loss_reg: 2.2426 semantic_segmentation_loss_cls: 0.0070 instance_segmentation_loss_cls: 0.0260 instance_segmentation_loss_reg: 0.3148 instance_segmentation_loss_poly: 0.8307 +2024/01/10 04:33:46 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240109_143717 +2024/01/10 04:33:46 - mmengine - INFO - Iter(train) [466000/640000] base_lr: 3.5969e-05 lr: 5.0881e-06 eta: 3 days, 4:11:55 time: 1.5969 data_time: 0.0259 memory: 25718 grad_norm: 3.2006 loss: 1.1640 detection_loss_cls: 0.0274 detection_loss_reg: 0.3218 caption_loss_cls: 2.0224 grounding_loss_reg: 2.2422 semantic_segmentation_loss_cls: 0.0070 instance_segmentation_loss_cls: 0.0260 instance_segmentation_loss_reg: 0.3149 instance_segmentation_loss_poly: 0.8304 +2024/01/10 04:33:46 - mmengine - INFO - Saving checkpoint at 466000 iterations +2024/01/10 04:47:35 - mmengine - INFO - Iter(train) [466500/640000] base_lr: 3.5786e-05 lr: 5.0715e-06 eta: 3 days, 4:02:33 time: 1.5969 data_time: 0.0260 memory: 25718 grad_norm: 3.3581 loss: 1.1695 detection_loss_cls: 0.0273 detection_loss_reg: 0.3222 caption_loss_cls: 2.0213 grounding_loss_reg: 2.2407 semantic_segmentation_loss_cls: 0.0070 instance_segmentation_loss_cls: 0.0261 instance_segmentation_loss_reg: 0.3158 instance_segmentation_loss_poly: 0.8328 +2024/01/10 05:00:01 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240109_143717 +2024/01/10 05:00:01 - mmengine - INFO - Iter(train) [467000/640000] base_lr: 3.5603e-05 lr: 5.0549e-06 eta: 3 days, 3:45:26 time: 1.5795 data_time: 0.0257 memory: 25718 grad_norm: 3.4155 loss: 1.1784 detection_loss_cls: 0.0272 detection_loss_reg: 0.3217 caption_loss_cls: 2.0201 grounding_loss_reg: 2.2399 semantic_segmentation_loss_cls: 0.0070 instance_segmentation_loss_cls: 0.0261 instance_segmentation_loss_reg: 0.3157 instance_segmentation_loss_poly: 0.8329 +2024/01/10 05:12:53 - mmengine - INFO - Iter(train) [467500/640000] base_lr: 3.5421e-05 lr: 5.0383e-06 eta: 3 days, 3:30:44 time: 1.5590 data_time: 0.0253 memory: 25718 grad_norm: 3.4477 loss: 1.1873 detection_loss_cls: 0.0272 detection_loss_reg: 0.3219 caption_loss_cls: 2.0250 grounding_loss_reg: 2.2396 semantic_segmentation_loss_cls: 0.0070 instance_segmentation_loss_cls: 0.0260 instance_segmentation_loss_reg: 0.3153 instance_segmentation_loss_poly: 0.8325 +2024/01/10 05:25:22 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240109_143717 +2024/01/10 05:25:22 - mmengine - INFO - Iter(train) [468000/640000] base_lr: 3.5239e-05 lr: 5.0218e-06 eta: 3 days, 3:14:06 time: 1.5548 data_time: 0.0253 memory: 25718 grad_norm: 3.4654 loss: 1.1843 detection_loss_cls: 0.0272 detection_loss_reg: 0.3216 caption_loss_cls: 2.0260 grounding_loss_reg: 2.2410 semantic_segmentation_loss_cls: 0.0070 instance_segmentation_loss_cls: 0.0260 instance_segmentation_loss_reg: 0.3157 instance_segmentation_loss_poly: 0.8325 +2024/01/10 05:25:22 - mmengine - INFO - Saving checkpoint at 468000 iterations +2024/01/10 05:38:06 - mmengine - INFO - Iter(train) [468500/640000] base_lr: 3.5058e-05 lr: 5.0053e-06 eta: 3 days, 2:58:51 time: 1.5470 data_time: 0.0249 memory: 25718 grad_norm: 3.4786 loss: 1.1729 detection_loss_cls: 0.0272 detection_loss_reg: 0.3218 caption_loss_cls: 2.0255 grounding_loss_reg: 2.2377 semantic_segmentation_loss_cls: 0.0070 instance_segmentation_loss_cls: 0.0261 instance_segmentation_loss_reg: 0.3156 instance_segmentation_loss_poly: 0.8323 +2024/01/10 05:50:53 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240109_143717 +2024/01/10 05:50:53 - mmengine - INFO - Iter(train) [469000/640000] base_lr: 3.4877e-05 lr: 4.9888e-06 eta: 3 days, 2:43:57 time: 1.5393 data_time: 0.0247 memory: 25718 grad_norm: 3.5150 loss: 1.1759 detection_loss_cls: 0.0272 detection_loss_reg: 0.3209 caption_loss_cls: 2.0256 grounding_loss_reg: 2.2387 semantic_segmentation_loss_cls: 0.0070 instance_segmentation_loss_cls: 0.0261 instance_segmentation_loss_reg: 0.3152 instance_segmentation_loss_poly: 0.8313 +2024/01/10 06:03:43 - mmengine - INFO - Iter(train) [469500/640000] base_lr: 3.4696e-05 lr: 4.9724e-06 eta: 3 days, 2:29:24 time: 1.5395 data_time: 0.0247 memory: 25718 grad_norm: 3.5265 loss: 1.1672 detection_loss_cls: 0.0272 detection_loss_reg: 0.3210 caption_loss_cls: 2.0265 grounding_loss_reg: 2.2370 semantic_segmentation_loss_cls: 0.0070 instance_segmentation_loss_cls: 0.0260 instance_segmentation_loss_reg: 0.3144 instance_segmentation_loss_poly: 0.8295 +2024/01/10 06:16:53 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240109_143717 +2024/01/10 06:16:53 - mmengine - INFO - Iter(train) [470000/640000] base_lr: 3.4516e-05 lr: 4.9560e-06 eta: 3 days, 2:16:34 time: 1.5458 data_time: 0.0247 memory: 25718 grad_norm: 3.5012 loss: 1.1628 detection_loss_cls: 0.0273 detection_loss_reg: 0.3209 caption_loss_cls: 2.0286 grounding_loss_reg: 2.2360 semantic_segmentation_loss_cls: 0.0070 instance_segmentation_loss_cls: 0.0261 instance_segmentation_loss_reg: 0.3145 instance_segmentation_loss_poly: 0.8309 +2024/01/10 06:16:53 - mmengine - INFO - Saving checkpoint at 470000 iterations +2024/01/10 06:30:10 - mmengine - INFO - Iter(train) [470500/640000] base_lr: 3.4336e-05 lr: 4.9397e-06 eta: 3 days, 2:04:21 time: 1.5381 data_time: 0.0245 memory: 25718 grad_norm: 3.3553 loss: 1.1583 detection_loss_cls: 0.0272 detection_loss_reg: 0.3209 caption_loss_cls: 2.0318 grounding_loss_reg: 2.2339 semantic_segmentation_loss_cls: 0.0070 instance_segmentation_loss_cls: 0.0261 instance_segmentation_loss_reg: 0.3149 instance_segmentation_loss_poly: 0.8313 +2024/01/10 06:43:28 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240109_143717 +2024/01/10 06:43:28 - mmengine - INFO - Iter(train) [471000/640000] base_lr: 3.4157e-05 lr: 4.9233e-06 eta: 3 days, 1:52:06 time: 1.5508 data_time: 0.0247 memory: 25718 grad_norm: 3.3468 loss: 1.1539 detection_loss_cls: 0.0273 detection_loss_reg: 0.3213 caption_loss_cls: 2.0307 grounding_loss_reg: 2.2339 semantic_segmentation_loss_cls: 0.0070 instance_segmentation_loss_cls: 0.0261 instance_segmentation_loss_reg: 0.3154 instance_segmentation_loss_poly: 0.8342 +2024/01/10 06:57:42 - mmengine - INFO - Iter(train) [471500/640000] base_lr: 3.3978e-05 lr: 4.9071e-06 eta: 3 days, 1:44:14 time: 1.5714 data_time: 0.0252 memory: 25718 grad_norm: 3.3294 loss: 1.1481 detection_loss_cls: 0.0272 detection_loss_reg: 0.3209 caption_loss_cls: 2.0289 grounding_loss_reg: 2.2316 semantic_segmentation_loss_cls: 0.0070 instance_segmentation_loss_cls: 0.0262 instance_segmentation_loss_reg: 0.3154 instance_segmentation_loss_poly: 0.8350 +2024/01/10 07:11:19 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240109_143717 +2024/01/10 07:11:19 - mmengine - INFO - Iter(train) [472000/640000] base_lr: 3.3799e-05 lr: 4.8908e-06 eta: 3 days, 1:33:20 time: 1.5882 data_time: 0.0253 memory: 25718 grad_norm: 3.2817 loss: 1.1378 detection_loss_cls: 0.0273 detection_loss_reg: 0.3220 caption_loss_cls: 2.0282 grounding_loss_reg: 2.2330 semantic_segmentation_loss_cls: 0.0070 instance_segmentation_loss_cls: 0.0262 instance_segmentation_loss_reg: 0.3155 instance_segmentation_loss_poly: 0.8343 +2024/01/10 07:11:19 - mmengine - INFO - Saving checkpoint at 472000 iterations +2024/01/10 07:24:07 - mmengine - INFO - Iter(train) [472500/640000] base_lr: 3.3621e-05 lr: 4.8746e-06 eta: 3 days, 1:18:39 time: 1.5894 data_time: 0.0256 memory: 25718 grad_norm: 3.2893 loss: 1.1510 detection_loss_cls: 0.0274 detection_loss_reg: 0.3232 caption_loss_cls: 2.0292 grounding_loss_reg: 2.2320 semantic_segmentation_loss_cls: 0.0070 instance_segmentation_loss_cls: 0.0262 instance_segmentation_loss_reg: 0.3165 instance_segmentation_loss_poly: 0.8358 +2024/01/10 07:36:56 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240109_143717 +2024/01/10 07:36:56 - mmengine - INFO - Iter(train) [473000/640000] base_lr: 3.3443e-05 lr: 4.8585e-06 eta: 3 days, 1:04:07 time: 1.5901 data_time: 0.0256 memory: 25718 grad_norm: 3.3767 loss: 1.1529 detection_loss_cls: 0.0274 detection_loss_reg: 0.3222 caption_loss_cls: 2.0291 grounding_loss_reg: 2.2348 semantic_segmentation_loss_cls: 0.0070 instance_segmentation_loss_cls: 0.0263 instance_segmentation_loss_reg: 0.3170 instance_segmentation_loss_poly: 0.8374 +2024/01/10 07:50:19 - mmengine - INFO - Iter(train) [473500/640000] base_lr: 3.3266e-05 lr: 4.8423e-06 eta: 3 days, 0:52:06 time: 1.5983 data_time: 0.0258 memory: 25718 grad_norm: 3.3700 loss: 1.1533 detection_loss_cls: 0.0274 detection_loss_reg: 0.3219 caption_loss_cls: 2.0240 grounding_loss_reg: 2.2345 semantic_segmentation_loss_cls: 0.0070 instance_segmentation_loss_cls: 0.0264 instance_segmentation_loss_reg: 0.3173 instance_segmentation_loss_poly: 0.8381 +2024/01/10 08:03:15 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240109_143717 +2024/01/10 08:03:15 - mmengine - INFO - Iter(train) [474000/640000] base_lr: 3.3089e-05 lr: 4.8262e-06 eta: 3 days, 0:38:03 time: 1.5947 data_time: 0.0258 memory: 25718 grad_norm: 3.3944 loss: 1.1626 detection_loss_cls: 0.0273 detection_loss_reg: 0.3225 caption_loss_cls: 2.0258 grounding_loss_reg: 2.2364 semantic_segmentation_loss_cls: 0.0070 instance_segmentation_loss_cls: 0.0262 instance_segmentation_loss_reg: 0.3169 instance_segmentation_loss_poly: 0.8373 +2024/01/10 08:03:15 - mmengine - INFO - Saving checkpoint at 474000 iterations +2024/01/10 08:17:11 - mmengine - INFO - Iter(train) [474500/640000] base_lr: 3.2912e-05 lr: 4.8102e-06 eta: 3 days, 0:28:25 time: 1.6044 data_time: 0.0260 memory: 25718 grad_norm: 3.3911 loss: 1.1622 detection_loss_cls: 0.0272 detection_loss_reg: 0.3223 caption_loss_cls: 2.0282 grounding_loss_reg: 2.2371 semantic_segmentation_loss_cls: 0.0070 instance_segmentation_loss_cls: 0.0261 instance_segmentation_loss_reg: 0.3159 instance_segmentation_loss_poly: 0.8352 +2024/01/10 08:30:16 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240109_143717 +2024/01/10 08:30:16 - mmengine - INFO - Iter(train) [475000/640000] base_lr: 3.2736e-05 lr: 4.7942e-06 eta: 3 days, 0:15:00 time: 1.6012 data_time: 0.0260 memory: 25718 grad_norm: 3.3913 loss: 1.1707 detection_loss_cls: 0.0272 detection_loss_reg: 0.3223 caption_loss_cls: 2.0240 grounding_loss_reg: 2.2382 semantic_segmentation_loss_cls: 0.0070 instance_segmentation_loss_cls: 0.0262 instance_segmentation_loss_reg: 0.3161 instance_segmentation_loss_poly: 0.8361 +2024/01/10 08:43:28 - mmengine - INFO - Iter(train) [475500/640000] base_lr: 3.2560e-05 lr: 4.7782e-06 eta: 3 days, 0:02:06 time: 1.5858 data_time: 0.0257 memory: 25718 grad_norm: 3.3762 loss: 1.1742 detection_loss_cls: 0.0272 detection_loss_reg: 0.3223 caption_loss_cls: 2.0234 grounding_loss_reg: 2.2391 semantic_segmentation_loss_cls: 0.0070 instance_segmentation_loss_cls: 0.0262 instance_segmentation_loss_reg: 0.3164 instance_segmentation_loss_poly: 0.8375 +2024/01/10 08:56:56 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240109_143717 +2024/01/10 08:56:56 - mmengine - INFO - Iter(train) [476000/640000] base_lr: 3.2385e-05 lr: 4.7622e-06 eta: 2 days, 23:50:17 time: 1.5836 data_time: 0.0256 memory: 25718 grad_norm: 3.3522 loss: 1.1683 detection_loss_cls: 0.0271 detection_loss_reg: 0.3217 caption_loss_cls: 2.0257 grounding_loss_reg: 2.2389 semantic_segmentation_loss_cls: 0.0070 instance_segmentation_loss_cls: 0.0263 instance_segmentation_loss_reg: 0.3167 instance_segmentation_loss_poly: 0.8373 +2024/01/10 08:56:56 - mmengine - INFO - Saving checkpoint at 476000 iterations +2024/01/10 09:10:40 - mmengine - INFO - Iter(train) [476500/640000] base_lr: 3.2210e-05 lr: 4.7463e-06 eta: 2 days, 23:39:31 time: 1.5976 data_time: 0.0256 memory: 25718 grad_norm: 3.2951 loss: 1.1505 detection_loss_cls: 0.0271 detection_loss_reg: 0.3207 caption_loss_cls: 2.0266 grounding_loss_reg: 2.2369 semantic_segmentation_loss_cls: 0.0070 instance_segmentation_loss_cls: 0.0261 instance_segmentation_loss_reg: 0.3149 instance_segmentation_loss_poly: 0.8335 +2024/01/10 09:24:08 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240109_143717 +2024/01/10 09:24:08 - mmengine - INFO - Iter(train) [477000/640000] base_lr: 3.2035e-05 lr: 4.7305e-06 eta: 2 days, 23:27:35 time: 1.6071 data_time: 0.0255 memory: 25718 grad_norm: 3.1469 loss: 1.1288 detection_loss_cls: 0.0270 detection_loss_reg: 0.3199 caption_loss_cls: 2.0255 grounding_loss_reg: 2.2342 semantic_segmentation_loss_cls: 0.0070 instance_segmentation_loss_cls: 0.0260 instance_segmentation_loss_reg: 0.3140 instance_segmentation_loss_poly: 0.8317 +2024/01/10 09:37:09 - mmengine - INFO - Iter(train) [477500/640000] base_lr: 3.1861e-05 lr: 4.7146e-06 eta: 2 days, 23:13:53 time: 1.6017 data_time: 0.0254 memory: 25718 grad_norm: 3.1616 loss: 1.1370 detection_loss_cls: 0.0269 detection_loss_reg: 0.3189 caption_loss_cls: 2.0287 grounding_loss_reg: 2.2333 semantic_segmentation_loss_cls: 0.0070 instance_segmentation_loss_cls: 0.0259 instance_segmentation_loss_reg: 0.3130 instance_segmentation_loss_poly: 0.8297 +2024/01/10 09:50:19 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240109_143717 +2024/01/10 09:50:19 - mmengine - INFO - Iter(train) [478000/640000] base_lr: 3.1687e-05 lr: 4.6989e-06 eta: 2 days, 23:00:45 time: 1.6052 data_time: 0.0255 memory: 25718 grad_norm: 3.1695 loss: 1.1241 detection_loss_cls: 0.0268 detection_loss_reg: 0.3172 caption_loss_cls: 2.0297 grounding_loss_reg: 2.2325 semantic_segmentation_loss_cls: 0.0070 instance_segmentation_loss_cls: 0.0259 instance_segmentation_loss_reg: 0.3137 instance_segmentation_loss_poly: 0.8309 +2024/01/10 09:50:19 - mmengine - INFO - Saving checkpoint at 478000 iterations +2024/01/10 10:03:59 - mmengine - INFO - Iter(train) [478500/640000] base_lr: 3.1514e-05 lr: 4.6831e-06 eta: 2 days, 22:49:34 time: 1.6011 data_time: 0.0256 memory: 25718 grad_norm: 3.1932 loss: 1.1208 detection_loss_cls: 0.0268 detection_loss_reg: 0.3170 caption_loss_cls: 2.0275 grounding_loss_reg: 2.2281 semantic_segmentation_loss_cls: 0.0070 instance_segmentation_loss_cls: 0.0259 instance_segmentation_loss_reg: 0.3129 instance_segmentation_loss_poly: 0.8301 +2024/01/10 10:17:02 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240109_143717 +2024/01/10 10:17:02 - mmengine - INFO - Iter(train) [479000/640000] base_lr: 3.1341e-05 lr: 4.6674e-06 eta: 2 days, 22:35:59 time: 1.6007 data_time: 0.0255 memory: 25718 grad_norm: 3.2136 loss: 1.1140 detection_loss_cls: 0.0268 detection_loss_reg: 0.3172 caption_loss_cls: 2.0300 grounding_loss_reg: 2.2246 semantic_segmentation_loss_cls: 0.0070 instance_segmentation_loss_cls: 0.0259 instance_segmentation_loss_reg: 0.3133 instance_segmentation_loss_poly: 0.8314 +2024/01/10 10:30:28 - mmengine - INFO - Iter(train) [479500/640000] base_lr: 3.1169e-05 lr: 4.6517e-06 eta: 2 days, 22:23:47 time: 1.6040 data_time: 0.0256 memory: 25718 grad_norm: 3.2323 loss: 1.1093 detection_loss_cls: 0.0269 detection_loss_reg: 0.3182 caption_loss_cls: 2.0277 grounding_loss_reg: 2.2227 semantic_segmentation_loss_cls: 0.0069 instance_segmentation_loss_cls: 0.0259 instance_segmentation_loss_reg: 0.3132 instance_segmentation_loss_poly: 0.8318 +2024/01/10 10:43:04 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240109_143717 +2024/01/10 10:43:04 - mmengine - INFO - Iter(train) [480000/640000] base_lr: 3.0997e-05 lr: 4.6361e-06 eta: 2 days, 22:08:35 time: 1.5910 data_time: 0.0256 memory: 25718 grad_norm: 3.3768 loss: 1.1346 detection_loss_cls: 0.0269 detection_loss_reg: 0.3182 caption_loss_cls: 2.0239 grounding_loss_reg: 2.2226 semantic_segmentation_loss_cls: 0.0070 instance_segmentation_loss_cls: 0.0259 instance_segmentation_loss_reg: 0.3132 instance_segmentation_loss_poly: 0.8313 +2024/01/10 10:43:04 - mmengine - INFO - Saving checkpoint at 480000 iterations +2024/01/10 10:55:26 - mmengine - INFO - Evaluating bbox... +2024/01/10 10:56:23 - mmengine - INFO - bbox_mAP_copypaste: 0.511 0.691 0.558 0.360 0.560 0.655 +2024/01/10 10:56:23 - mmengine - INFO - Evaluating segm... +2024/01/10 10:57:33 - mmengine - INFO - segm_mAP_copypaste: 0.344 0.609 0.339 0.206 0.389 0.524 +2024/01/10 11:05:22 - mmengine - INFO - per class results: +2024/01/10 11:05:22 - mmengine - INFO - ++---------------------+-------+-------+ +| Class | IoU | Acc | ++---------------------+-------+-------+ +| wall | 78.78 | 88.69 | +| building | 83.2 | 92.36 | +| sky | 93.27 | 97.7 | +| floor | 82.25 | 90.73 | +| tree | 73.44 | 87.14 | +| ceiling | 85.55 | 92.75 | +| road | 82.87 | 87.97 | +| bed | 90.57 | 95.89 | +| windowpane | 64.54 | 82.3 | +| grass | 65.88 | 84.59 | +| cabinet | 62.26 | 76.46 | +| sidewalk | 65.27 | 82.14 | +| person | 81.14 | 92.55 | +| earth | 36.19 | 45.39 | +| door | 54.98 | 68.79 | +| table | 66.34 | 79.94 | +| mountain | 60.08 | 70.37 | +| plant | 50.59 | 62.78 | +| curtain | 75.45 | 88.59 | +| chair | 61.44 | 77.7 | +| car | 84.9 | 92.03 | +| water | 49.1 | 61.13 | +| painting | 68.73 | 87.87 | +| sofa | 69.84 | 82.27 | +| shelf | 47.23 | 67.27 | +| house | 43.74 | 58.34 | +| sea | 47.77 | 74.39 | +| mirror | 69.2 | 78.45 | +| rug | 67.62 | 78.85 | +| field | 29.32 | 44.98 | +| armchair | 47.96 | 65.55 | +| seat | 64.55 | 81.91 | +| fence | 46.52 | 62.93 | +| desk | 49.83 | 70.47 | +| rock | 50.36 | 76.16 | +| wardrobe | 46.56 | 69.92 | +| lamp | 62.81 | 77.63 | +| bathtub | 81.48 | 84.93 | +| railing | 38.2 | 55.27 | +| cushion | 60.48 | 75.64 | +| base | 25.27 | 38.06 | +| box | 29.11 | 37.59 | +| column | 50.64 | 68.59 | +| signboard | 37.67 | 48.71 | +| chest of drawers | 40.91 | 55.46 | +| counter | 19.26 | 27.24 | +| sand | 48.52 | 64.08 | +| sink | 76.11 | 84.37 | +| skyscraper | 65.2 | 85.55 | +| fireplace | 77.5 | 89.05 | +| refrigerator | 73.65 | 81.21 | +| grandstand | 38.63 | 77.59 | +| path | 25.37 | 41.24 | +| stairs | 25.07 | 31.52 | +| runway | 72.48 | 88.59 | +| case | 51.5 | 67.48 | +| pool table | 86.79 | 96.76 | +| pillow | 59.91 | 70.58 | +| screen door | 84.43 | 87.59 | +| stairway | 32.15 | 50.03 | +| river | 19.0 | 39.12 | +| bridge | 52.37 | 60.87 | +| bookcase | 38.29 | 57.89 | +| blind | 37.25 | 40.23 | +| coffee table | 67.56 | 83.23 | +| toilet | 87.44 | 91.63 | +| flower | 40.93 | 56.06 | +| book | 51.12 | 73.02 | +| hill | 13.44 | 22.49 | +| bench | 63.35 | 74.15 | +| countertop | 62.49 | 74.48 | +| stove | 74.87 | 83.36 | +| palm | 43.63 | 59.59 | +| kitchen island | 47.08 | 81.84 | +| computer | 70.98 | 82.0 | +| swivel chair | 42.6 | 56.04 | +| boat | 64.73 | 70.94 | +| bar | 26.48 | 36.33 | +| arcade machine | 70.52 | 78.63 | +| hovel | 18.45 | 21.0 | +| bus | 92.63 | 95.34 | +| towel | 68.04 | 80.97 | +| light | 54.99 | 67.09 | +| truck | 47.04 | 56.56 | +| tower | 24.99 | 38.61 | +| chandelier | 67.87 | 85.39 | +| awning | 34.44 | 40.88 | +| streetlight | 32.87 | 44.52 | +| booth | 42.16 | 48.65 | +| television receiver | 68.13 | 78.71 | +| airplane | 62.33 | 71.14 | +| dirt track | 15.44 | 18.48 | +| apparel | 36.92 | 54.85 | +| pole | 29.03 | 40.42 | +| land | 1.99 | 5.44 | +| bannister | 15.54 | 23.21 | +| escalator | 15.22 | 15.87 | +| ottoman | 54.38 | 71.42 | +| bottle | 24.53 | 32.19 | +| buffet | 40.44 | 50.75 | +| poster | 27.68 | 31.74 | +| stage | 9.67 | 14.64 | +| van | 49.8 | 67.36 | +| ship | 8.15 | 9.95 | +| fountain | 23.11 | 23.6 | +| conveyer belt | 75.38 | 89.08 | +| canopy | 24.86 | 31.84 | +| washer | 73.27 | 73.99 | +| plaything | 27.08 | 31.1 | +| swimming pool | 61.22 | 71.52 | +| stool | 48.73 | 59.45 | +| barrel | 11.53 | 33.11 | +| basket | 30.47 | 48.34 | +| waterfall | 54.84 | 80.05 | +| tent | 91.09 | 96.71 | +| bag | 19.35 | 25.44 | +| minibike | 72.62 | 82.68 | +| cradle | 69.08 | 88.21 | +| oven | 51.05 | 65.08 | +| ball | 44.04 | 57.1 | +| food | 55.39 | 60.27 | +| step | 19.44 | 26.33 | +| tank | 34.81 | 44.45 | +| trade name | 24.82 | 29.59 | +| microwave | 83.94 | 93.5 | +| pot | 51.02 | 60.62 | +| animal | 57.2 | 59.75 | +| bicycle | 56.78 | 74.05 | +| lake | 58.51 | 63.17 | +| dishwasher | 56.33 | 65.26 | +| screen | 56.36 | 73.15 | +| blanket | 20.42 | 24.33 | +| sculpture | 48.4 | 73.55 | +| hood | 60.32 | 69.22 | +| sconce | 45.65 | 56.38 | +| vase | 44.44 | 65.54 | +| traffic light | 39.95 | 61.99 | +| tray | 5.07 | 8.44 | +| ashcan | 41.74 | 52.77 | +| fan | 58.08 | 76.32 | +| pier | 42.64 | 56.68 | +| crt screen | 12.27 | 21.05 | +| plate | 54.81 | 78.32 | +| monitor | 43.53 | 60.76 | +| bulletin board | 46.28 | 54.75 | +| shower | 3.49 | 5.76 | +| radiator | 61.67 | 67.83 | +| glass | 19.75 | 21.35 | +| clock | 27.85 | 34.42 | +| flag | 31.3 | 37.17 | ++---------------------+-------+-------+ +2024/01/10 11:05:39 - mmengine - INFO - Iter(val) [209/209] coco/bbox_mAP: 0.5110 coco/bbox_mAP_50: 0.6910 coco/bbox_mAP_75: 0.5580 coco/bbox_mAP_s: 0.3600 coco/bbox_mAP_m: 0.5600 coco/bbox_mAP_l: 0.6550 coco/segm_mAP: 0.3440 coco/segm_mAP_50: 0.6090 coco/segm_mAP_75: 0.3390 coco/segm_mAP_s: 0.2060 coco/segm_mAP_m: 0.3890 coco/segm_mAP_l: 0.5240 Bleu_1: 0.7618 Bleu_2: 0.5990 Bleu_3: 0.4585 Bleu_4: 0.3486 METEOR: 0.2749 ROUGE_L: 0.5627 CIDEr: 1.1229 SPICE: 0.2027 aAcc: 83.5900 mIoU: 50.1200 mAcc: 62.0200 visual-grounding/miou: 0.8192 visual-grounding/acc: 0.8804 data_time: 0.0040 time: 1.3500 +2024/01/10 11:19:47 - mmengine - INFO - Iter(train) [480500/640000] base_lr: 3.0825e-05 lr: 4.6205e-06 eta: 2 days, 21:59:01 time: 1.5974 data_time: 0.0220 memory: 25718 grad_norm: 3.3455 loss: 1.1360 detection_loss_cls: 0.0268 detection_loss_reg: 0.3186 caption_loss_cls: 2.0252 grounding_loss_reg: 2.2200 semantic_segmentation_loss_cls: 0.0069 instance_segmentation_loss_cls: 0.0260 instance_segmentation_loss_reg: 0.3141 instance_segmentation_loss_poly: 0.8336 +2024/01/10 11:33:32 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240109_143717 +2024/01/10 11:33:32 - mmengine - INFO - Iter(train) [481000/640000] base_lr: 3.0654e-05 lr: 4.6049e-06 eta: 2 days, 21:47:56 time: 1.6019 data_time: 0.0221 memory: 25718 grad_norm: 3.3959 loss: 1.1441 detection_loss_cls: 0.0269 detection_loss_reg: 0.3182 caption_loss_cls: 2.0270 grounding_loss_reg: 2.2197 semantic_segmentation_loss_cls: 0.0070 instance_segmentation_loss_cls: 0.0259 instance_segmentation_loss_reg: 0.3136 instance_segmentation_loss_poly: 0.8327 +2024/01/10 11:46:35 - mmengine - INFO - Iter(train) [481500/640000] base_lr: 3.0483e-05 lr: 4.5894e-06 eta: 2 days, 21:34:19 time: 1.6023 data_time: 0.0222 memory: 25718 grad_norm: 3.3993 loss: 1.1411 detection_loss_cls: 0.0269 detection_loss_reg: 0.3189 caption_loss_cls: 2.0314 grounding_loss_reg: 2.2165 semantic_segmentation_loss_cls: 0.0070 instance_segmentation_loss_cls: 0.0259 instance_segmentation_loss_reg: 0.3137 instance_segmentation_loss_poly: 0.8319 +2024/01/10 11:59:51 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240109_143717 +2024/01/10 11:59:51 - mmengine - INFO - Iter(train) [482000/640000] base_lr: 3.0313e-05 lr: 4.5739e-06 eta: 2 days, 21:21:27 time: 1.6038 data_time: 0.0222 memory: 25718 grad_norm: 3.4187 loss: 1.1461 detection_loss_cls: 0.0270 detection_loss_reg: 0.3197 caption_loss_cls: 2.0320 grounding_loss_reg: 2.2173 semantic_segmentation_loss_cls: 0.0070 instance_segmentation_loss_cls: 0.0259 instance_segmentation_loss_reg: 0.3146 instance_segmentation_loss_poly: 0.8339 +2024/01/10 11:59:51 - mmengine - INFO - Saving checkpoint at 482000 iterations +2024/01/10 12:12:55 - mmengine - INFO - Iter(train) [482500/640000] base_lr: 3.0143e-05 lr: 4.5585e-06 eta: 2 days, 21:07:55 time: 1.5947 data_time: 0.0220 memory: 25718 grad_norm: 3.4636 loss: 1.1577 detection_loss_cls: 0.0271 detection_loss_reg: 0.3210 caption_loss_cls: 2.0318 grounding_loss_reg: 2.2145 semantic_segmentation_loss_cls: 0.0070 instance_segmentation_loss_cls: 0.0260 instance_segmentation_loss_reg: 0.3148 instance_segmentation_loss_poly: 0.8345 +2024/01/10 12:26:25 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240109_143717 +2024/01/10 12:26:25 - mmengine - INFO - Iter(train) [483000/640000] base_lr: 2.9974e-05 lr: 4.5430e-06 eta: 2 days, 20:55:50 time: 1.6015 data_time: 0.0221 memory: 25718 grad_norm: 3.4381 loss: 1.1482 detection_loss_cls: 0.0271 detection_loss_reg: 0.3206 caption_loss_cls: 2.0316 grounding_loss_reg: 2.2130 semantic_segmentation_loss_cls: 0.0069 instance_segmentation_loss_cls: 0.0260 instance_segmentation_loss_reg: 0.3152 instance_segmentation_loss_poly: 0.8349 +2024/01/10 12:39:00 - mmengine - INFO - Iter(train) [483500/640000] base_lr: 2.9804e-05 lr: 4.5277e-06 eta: 2 days, 20:40:43 time: 1.5890 data_time: 0.0219 memory: 25718 grad_norm: 3.4714 loss: 1.1547 detection_loss_cls: 0.0271 detection_loss_reg: 0.3211 caption_loss_cls: 2.0327 grounding_loss_reg: 2.2118 semantic_segmentation_loss_cls: 0.0069 instance_segmentation_loss_cls: 0.0260 instance_segmentation_loss_reg: 0.3142 instance_segmentation_loss_poly: 0.8327 +2024/01/10 12:51:55 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240109_143717 +2024/01/10 12:51:55 - mmengine - INFO - Iter(train) [484000/640000] base_lr: 2.9636e-05 lr: 4.5123e-06 eta: 2 days, 20:26:43 time: 1.5937 data_time: 0.0220 memory: 25718 grad_norm: 3.3897 loss: 1.1412 detection_loss_cls: 0.0271 detection_loss_reg: 0.3205 caption_loss_cls: 2.0331 grounding_loss_reg: 2.2081 semantic_segmentation_loss_cls: 0.0069 instance_segmentation_loss_cls: 0.0259 instance_segmentation_loss_reg: 0.3139 instance_segmentation_loss_poly: 0.8315 +2024/01/10 12:51:55 - mmengine - INFO - Saving checkpoint at 484000 iterations +2024/01/10 13:05:21 - mmengine - INFO - Iter(train) [484500/640000] base_lr: 2.9468e-05 lr: 4.4971e-06 eta: 2 days, 20:14:23 time: 1.5827 data_time: 0.0256 memory: 25718 grad_norm: 3.4445 loss: 1.1509 detection_loss_cls: 0.0270 detection_loss_reg: 0.3199 caption_loss_cls: 2.0338 grounding_loss_reg: 2.2072 semantic_segmentation_loss_cls: 0.0069 instance_segmentation_loss_cls: 0.0260 instance_segmentation_loss_reg: 0.3140 instance_segmentation_loss_poly: 0.8328 +2024/01/10 13:18:55 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240109_143717 +2024/01/10 13:18:55 - mmengine - INFO - Iter(train) [485000/640000] base_lr: 2.9300e-05 lr: 4.4818e-06 eta: 2 days, 20:02:30 time: 1.5800 data_time: 0.0258 memory: 25718 grad_norm: 3.4384 loss: 1.1550 detection_loss_cls: 0.0270 detection_loss_reg: 0.3200 caption_loss_cls: 2.0331 grounding_loss_reg: 2.2044 semantic_segmentation_loss_cls: 0.0069 instance_segmentation_loss_cls: 0.0258 instance_segmentation_loss_reg: 0.3128 instance_segmentation_loss_poly: 0.8310 +2024/01/10 13:32:18 - mmengine - INFO - Iter(train) [485500/640000] base_lr: 2.9133e-05 lr: 4.4666e-06 eta: 2 days, 19:49:56 time: 1.5848 data_time: 0.0258 memory: 25718 grad_norm: 3.4073 loss: 1.1506 detection_loss_cls: 0.0270 detection_loss_reg: 0.3194 caption_loss_cls: 2.0287 grounding_loss_reg: 2.2023 semantic_segmentation_loss_cls: 0.0069 instance_segmentation_loss_cls: 0.0258 instance_segmentation_loss_reg: 0.3127 instance_segmentation_loss_poly: 0.8310 +2024/01/10 13:45:24 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240109_143717 +2024/01/10 13:45:24 - mmengine - INFO - Iter(train) [486000/640000] base_lr: 2.8966e-05 lr: 4.4514e-06 eta: 2 days, 19:36:33 time: 1.5826 data_time: 0.0257 memory: 25718 grad_norm: 3.3730 loss: 1.1484 detection_loss_cls: 0.0270 detection_loss_reg: 0.3199 caption_loss_cls: 2.0295 grounding_loss_reg: 2.2031 semantic_segmentation_loss_cls: 0.0069 instance_segmentation_loss_cls: 0.0258 instance_segmentation_loss_reg: 0.3128 instance_segmentation_loss_poly: 0.8311 +2024/01/10 13:45:24 - mmengine - INFO - Saving checkpoint at 486000 iterations +2024/01/10 13:58:47 - mmengine - INFO - Iter(train) [486500/640000] base_lr: 2.8799e-05 lr: 4.4363e-06 eta: 2 days, 19:24:00 time: 1.5873 data_time: 0.0258 memory: 25718 grad_norm: 3.3265 loss: 1.1421 detection_loss_cls: 0.0269 detection_loss_reg: 0.3186 caption_loss_cls: 2.0346 grounding_loss_reg: 2.2041 semantic_segmentation_loss_cls: 0.0069 instance_segmentation_loss_cls: 0.0258 instance_segmentation_loss_reg: 0.3128 instance_segmentation_loss_poly: 0.8306 +2024/01/10 14:11:47 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240109_143717 +2024/01/10 14:11:47 - mmengine - INFO - Iter(train) [487000/640000] base_lr: 2.8633e-05 lr: 4.4212e-06 eta: 2 days, 19:10:17 time: 1.5797 data_time: 0.0257 memory: 25718 grad_norm: 3.3142 loss: 1.1436 detection_loss_cls: 0.0269 detection_loss_reg: 0.3186 caption_loss_cls: 2.0345 grounding_loss_reg: 2.1987 semantic_segmentation_loss_cls: 0.0069 instance_segmentation_loss_cls: 0.0258 instance_segmentation_loss_reg: 0.3133 instance_segmentation_loss_poly: 0.8315 +2024/01/10 14:24:33 - mmengine - INFO - Iter(train) [487500/640000] base_lr: 2.8468e-05 lr: 4.4061e-06 eta: 2 days, 18:55:55 time: 1.5825 data_time: 0.0258 memory: 25718 grad_norm: 3.3012 loss: 1.1419 detection_loss_cls: 0.0269 detection_loss_reg: 0.3183 caption_loss_cls: 2.0343 grounding_loss_reg: 2.1988 semantic_segmentation_loss_cls: 0.0069 instance_segmentation_loss_cls: 0.0257 instance_segmentation_loss_reg: 0.3125 instance_segmentation_loss_poly: 0.8292 +2024/01/11 05:53:43 - mmengine - INFO - Iter(train) [488000/640000] base_lr: 2.8302e-05 lr: 4.3911e-06 eta: 2 days, 13:52:00 time: 1.5346 data_time: 0.0209 memory: 25718 grad_norm: 3.3782 loss: 1.1331 detection_loss_cls: 0.0269 detection_loss_reg: 0.3192 caption_loss_cls: 2.0249 grounding_loss_reg: 2.1918 semantic_segmentation_loss_cls: 0.0069 instance_segmentation_loss_cls: 0.0259 instance_segmentation_loss_reg: 0.3140 instance_segmentation_loss_poly: 0.8311 +2024/01/11 05:53:43 - mmengine - INFO - Saving checkpoint at 488000 iterations +2024/01/11 06:06:29 - mmengine - INFO - Iter(train) [488500/640000] base_lr: 2.8138e-05 lr: 4.3762e-06 eta: 2 days, 14:13:34 time: 1.5247 data_time: 0.0209 memory: 25718 grad_norm: 3.3826 loss: 1.1369 detection_loss_cls: 0.0270 detection_loss_reg: 0.3198 caption_loss_cls: 2.0255 grounding_loss_reg: 2.1882 semantic_segmentation_loss_cls: 0.0069 instance_segmentation_loss_cls: 0.0259 instance_segmentation_loss_reg: 0.3149 instance_segmentation_loss_poly: 0.8332 +2024/01/11 06:18:43 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240111_050137 +2024/01/11 06:18:43 - mmengine - INFO - Iter(train) [489000/640000] base_lr: 2.7973e-05 lr: 4.3612e-06 eta: 2 days, 13:56:07 time: 1.5045 data_time: 0.0206 memory: 25718 grad_norm: 3.3690 loss: 1.1389 detection_loss_cls: 0.0270 detection_loss_reg: 0.3207 caption_loss_cls: 2.0233 grounding_loss_reg: 2.1888 semantic_segmentation_loss_cls: 0.0069 instance_segmentation_loss_cls: 0.0260 instance_segmentation_loss_reg: 0.3158 instance_segmentation_loss_poly: 0.8351 +2024/01/11 06:30:49 - mmengine - INFO - Iter(train) [489500/640000] base_lr: 2.7810e-05 lr: 4.3463e-06 eta: 2 days, 13:35:04 time: 1.4856 data_time: 0.0205 memory: 25718 grad_norm: 3.3889 loss: 1.1392 detection_loss_cls: 0.0271 detection_loss_reg: 0.3212 caption_loss_cls: 2.0223 grounding_loss_reg: 2.1889 semantic_segmentation_loss_cls: 0.0069 instance_segmentation_loss_cls: 0.0259 instance_segmentation_loss_reg: 0.3165 instance_segmentation_loss_poly: 0.8350 +2024/01/11 06:43:26 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240111_050137 +2024/01/11 06:43:26 - mmengine - INFO - Iter(train) [490000/640000] base_lr: 2.7646e-05 lr: 4.3315e-06 eta: 2 days, 13:35:07 time: 1.4781 data_time: 0.0204 memory: 25718 grad_norm: 3.3634 loss: 1.1323 detection_loss_cls: 0.0270 detection_loss_reg: 0.3214 caption_loss_cls: 2.0134 grounding_loss_reg: 2.1887 semantic_segmentation_loss_cls: 0.0069 instance_segmentation_loss_cls: 0.0259 instance_segmentation_loss_reg: 0.3161 instance_segmentation_loss_poly: 0.8350 +2024/01/11 06:43:26 - mmengine - INFO - Saving checkpoint at 490000 iterations +2024/01/11 06:55:09 - mmengine - INFO - Iter(train) [490500/640000] base_lr: 2.7483e-05 lr: 4.3167e-06 eta: 2 days, 13:02:53 time: 1.4715 data_time: 0.0247 memory: 25718 grad_norm: 3.4004 loss: 1.1483 detection_loss_cls: 0.0271 detection_loss_reg: 0.3225 caption_loss_cls: 2.0152 grounding_loss_reg: 2.1874 semantic_segmentation_loss_cls: 0.0069 instance_segmentation_loss_cls: 0.0258 instance_segmentation_loss_reg: 0.3164 instance_segmentation_loss_poly: 0.8347 +2024/01/11 07:08:01 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240111_050137 +2024/01/11 07:08:01 - mmengine - INFO - Iter(train) [491000/640000] base_lr: 2.7321e-05 lr: 4.3019e-06 eta: 2 days, 13:08:28 time: 1.4781 data_time: 0.0248 memory: 25718 grad_norm: 3.3173 loss: 1.1377 detection_loss_cls: 0.0272 detection_loss_reg: 0.3231 caption_loss_cls: 2.0123 grounding_loss_reg: 2.1858 semantic_segmentation_loss_cls: 0.0069 instance_segmentation_loss_cls: 0.0258 instance_segmentation_loss_reg: 0.3169 instance_segmentation_loss_poly: 0.8358 +2024/01/11 07:20:22 - mmengine - INFO - Iter(train) [491500/640000] base_lr: 2.7159e-05 lr: 4.2871e-06 eta: 2 days, 12:57:02 time: 1.4816 data_time: 0.0250 memory: 25718 grad_norm: 3.3299 loss: 1.1437 detection_loss_cls: 0.0271 detection_loss_reg: 0.3225 caption_loss_cls: 2.0099 grounding_loss_reg: 2.1834 semantic_segmentation_loss_cls: 0.0069 instance_segmentation_loss_cls: 0.0258 instance_segmentation_loss_reg: 0.3172 instance_segmentation_loss_poly: 0.8372 +2024/01/11 07:32:38 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240111_050137 +2024/01/11 07:32:38 - mmengine - INFO - Iter(train) [492000/640000] base_lr: 2.6997e-05 lr: 4.2725e-06 eta: 2 days, 12:43:18 time: 1.4829 data_time: 0.0250 memory: 25718 grad_norm: 3.3480 loss: 1.1419 detection_loss_cls: 0.0271 detection_loss_reg: 0.3220 caption_loss_cls: 2.0045 grounding_loss_reg: 2.1826 semantic_segmentation_loss_cls: 0.0069 instance_segmentation_loss_cls: 0.0256 instance_segmentation_loss_reg: 0.3154 instance_segmentation_loss_poly: 0.8345 +2024/01/11 07:32:38 - mmengine - INFO - Saving checkpoint at 492000 iterations +2024/01/11 07:44:34 - mmengine - INFO - Iter(train) [492500/640000] base_lr: 2.6836e-05 lr: 4.2578e-06 eta: 2 days, 12:22:41 time: 1.4705 data_time: 0.0248 memory: 25718 grad_norm: 3.3672 loss: 1.1410 detection_loss_cls: 0.0271 detection_loss_reg: 0.3222 caption_loss_cls: 2.0060 grounding_loss_reg: 2.1801 semantic_segmentation_loss_cls: 0.0069 instance_segmentation_loss_cls: 0.0256 instance_segmentation_loss_reg: 0.3156 instance_segmentation_loss_poly: 0.8348 +2024/01/11 07:56:41 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240111_050137 +2024/01/11 07:56:41 - mmengine - INFO - Iter(train) [493000/640000] base_lr: 2.6675e-05 lr: 4.2432e-06 eta: 2 days, 12:06:49 time: 1.4688 data_time: 0.0248 memory: 25718 grad_norm: 3.4050 loss: 1.1422 detection_loss_cls: 0.0270 detection_loss_reg: 0.3211 caption_loss_cls: 2.0053 grounding_loss_reg: 2.1768 semantic_segmentation_loss_cls: 0.0069 instance_segmentation_loss_cls: 0.0256 instance_segmentation_loss_reg: 0.3155 instance_segmentation_loss_poly: 0.8348 +2024/01/11 08:09:08 - mmengine - INFO - Iter(train) [493500/640000] base_lr: 2.6515e-05 lr: 4.2286e-06 eta: 2 days, 11:57:47 time: 1.4738 data_time: 0.0248 memory: 25718 grad_norm: 3.4016 loss: 1.1385 detection_loss_cls: 0.0270 detection_loss_reg: 0.3215 caption_loss_cls: 2.0036 grounding_loss_reg: 2.1783 semantic_segmentation_loss_cls: 0.0069 instance_segmentation_loss_cls: 0.0255 instance_segmentation_loss_reg: 0.3153 instance_segmentation_loss_poly: 0.8335 +2024/01/11 08:21:25 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240111_050137 +2024/01/11 08:21:25 - mmengine - INFO - Iter(train) [494000/640000] base_lr: 2.6355e-05 lr: 4.2141e-06 eta: 2 days, 11:45:20 time: 1.4688 data_time: 0.0249 memory: 25718 grad_norm: 3.4567 loss: 1.1512 detection_loss_cls: 0.0271 detection_loss_reg: 0.3222 caption_loss_cls: 2.0014 grounding_loss_reg: 2.1737 semantic_segmentation_loss_cls: 0.0069 instance_segmentation_loss_cls: 0.0256 instance_segmentation_loss_reg: 0.3159 instance_segmentation_loss_poly: 0.8346 +2024/01/11 08:21:25 - mmengine - INFO - Saving checkpoint at 494000 iterations +2024/01/11 08:33:51 - mmengine - INFO - Iter(train) [494500/640000] base_lr: 2.6196e-05 lr: 4.1996e-06 eta: 2 days, 11:35:43 time: 1.4796 data_time: 0.0250 memory: 25718 grad_norm: 3.4112 loss: 1.1387 detection_loss_cls: 0.0270 detection_loss_reg: 0.3213 caption_loss_cls: 1.9991 grounding_loss_reg: 2.1716 semantic_segmentation_loss_cls: 0.0069 instance_segmentation_loss_cls: 0.0255 instance_segmentation_loss_reg: 0.3154 instance_segmentation_loss_poly: 0.8343 +2024/01/11 08:46:01 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240111_050137 +2024/01/11 08:46:01 - mmengine - INFO - Iter(train) [495000/640000] base_lr: 2.6037e-05 lr: 4.1851e-06 eta: 2 days, 11:21:15 time: 1.4691 data_time: 0.0247 memory: 25718 grad_norm: 3.4501 loss: 1.1461 detection_loss_cls: 0.0270 detection_loss_reg: 0.3205 caption_loss_cls: 1.9990 grounding_loss_reg: 2.1682 semantic_segmentation_loss_cls: 0.0069 instance_segmentation_loss_cls: 0.0256 instance_segmentation_loss_reg: 0.3154 instance_segmentation_loss_poly: 0.8331 +2024/01/11 08:59:11 - mmengine - INFO - Iter(train) [495500/640000] base_lr: 2.5878e-05 lr: 4.1707e-06 eta: 2 days, 11:22:23 time: 1.4814 data_time: 0.0249 memory: 25718 grad_norm: 3.3875 loss: 1.1397 detection_loss_cls: 0.0270 detection_loss_reg: 0.3199 caption_loss_cls: 1.9974 grounding_loss_reg: 2.1687 semantic_segmentation_loss_cls: 0.0069 instance_segmentation_loss_cls: 0.0256 instance_segmentation_loss_reg: 0.3153 instance_segmentation_loss_poly: 0.8328 +2024/01/11 09:11:23 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240111_050137 +2024/01/11 09:11:23 - mmengine - INFO - Iter(train) [496000/640000] base_lr: 2.5720e-05 lr: 4.1564e-06 eta: 2 days, 11:08:13 time: 1.4805 data_time: 0.0250 memory: 25718 grad_norm: 3.3896 loss: 1.1495 detection_loss_cls: 0.0271 detection_loss_reg: 0.3210 caption_loss_cls: 1.9991 grounding_loss_reg: 2.1675 semantic_segmentation_loss_cls: 0.0069 instance_segmentation_loss_cls: 0.0256 instance_segmentation_loss_reg: 0.3167 instance_segmentation_loss_poly: 0.8362 +2024/01/11 09:11:23 - mmengine - INFO - Saving checkpoint at 496000 iterations +2024/01/11 09:24:27 - mmengine - INFO - Iter(train) [496500/640000] base_lr: 2.5563e-05 lr: 4.1420e-06 eta: 2 days, 11:06:00 time: 1.4973 data_time: 0.0250 memory: 25718 grad_norm: 3.3224 loss: 1.1270 detection_loss_cls: 0.0272 detection_loss_reg: 0.3214 caption_loss_cls: 1.9996 grounding_loss_reg: 2.1673 semantic_segmentation_loss_cls: 0.0069 instance_segmentation_loss_cls: 0.0257 instance_segmentation_loss_reg: 0.3169 instance_segmentation_loss_poly: 0.8367 +2024/01/11 09:37:14 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240111_050137 +2024/01/11 09:37:14 - mmengine - INFO - Iter(train) [497000/640000] base_lr: 2.5405e-05 lr: 4.1278e-06 eta: 2 days, 10:59:11 time: 1.5074 data_time: 0.0251 memory: 25718 grad_norm: 3.2516 loss: 1.1171 detection_loss_cls: 0.0271 detection_loss_reg: 0.3216 caption_loss_cls: 2.0006 grounding_loss_reg: 2.1667 semantic_segmentation_loss_cls: 0.0069 instance_segmentation_loss_cls: 0.0257 instance_segmentation_loss_reg: 0.3179 instance_segmentation_loss_poly: 0.8396 +2024/01/11 09:49:33 - mmengine - INFO - Iter(train) [497500/640000] base_lr: 2.5249e-05 lr: 4.1135e-06 eta: 2 days, 10:45:52 time: 1.5053 data_time: 0.0250 memory: 25718 grad_norm: 3.2672 loss: 1.1175 detection_loss_cls: 0.0272 detection_loss_reg: 0.3229 caption_loss_cls: 1.9946 grounding_loss_reg: 2.1661 semantic_segmentation_loss_cls: 0.0069 instance_segmentation_loss_cls: 0.0258 instance_segmentation_loss_reg: 0.3187 instance_segmentation_loss_poly: 0.8406 +2024/01/11 10:00:56 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240111_050137 +2024/01/11 10:00:56 - mmengine - INFO - Iter(train) [498000/640000] base_lr: 2.5093e-05 lr: 4.0993e-06 eta: 2 days, 10:21:44 time: 1.4920 data_time: 0.0248 memory: 25718 grad_norm: 3.2779 loss: 1.1206 detection_loss_cls: 0.0272 detection_loss_reg: 0.3234 caption_loss_cls: 1.9956 grounding_loss_reg: 2.1635 semantic_segmentation_loss_cls: 0.0069 instance_segmentation_loss_cls: 0.0259 instance_segmentation_loss_reg: 0.3185 instance_segmentation_loss_poly: 0.8405 +2024/01/11 10:00:56 - mmengine - INFO - Saving checkpoint at 498000 iterations +2024/01/11 10:13:39 - mmengine - INFO - Iter(train) [498500/640000] base_lr: 2.4937e-05 lr: 4.0852e-06 eta: 2 days, 10:13:48 time: 1.4962 data_time: 0.0249 memory: 25718 grad_norm: 3.3042 loss: 1.1222 detection_loss_cls: 0.0273 detection_loss_reg: 0.3252 caption_loss_cls: 1.9946 grounding_loss_reg: 2.1625 semantic_segmentation_loss_cls: 0.0069 instance_segmentation_loss_cls: 0.0258 instance_segmentation_loss_reg: 0.3188 instance_segmentation_loss_poly: 0.8412 +2024/01/11 10:25:15 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240111_050137 +2024/01/11 10:25:15 - mmengine - INFO - Iter(train) [499000/640000] base_lr: 2.4781e-05 lr: 4.0710e-06 eta: 2 days, 9:53:16 time: 1.4878 data_time: 0.0248 memory: 25718 grad_norm: 3.3225 loss: 1.1186 detection_loss_cls: 0.0272 detection_loss_reg: 0.3246 caption_loss_cls: 1.9919 grounding_loss_reg: 2.1618 semantic_segmentation_loss_cls: 0.0069 instance_segmentation_loss_cls: 0.0258 instance_segmentation_loss_reg: 0.3189 instance_segmentation_loss_poly: 0.8416 +2024/01/11 10:37:26 - mmengine - INFO - Iter(train) [499500/640000] base_lr: 2.4627e-05 lr: 4.0570e-06 eta: 2 days, 9:39:27 time: 1.4730 data_time: 0.0246 memory: 25718 grad_norm: 3.3877 loss: 1.1359 detection_loss_cls: 0.0272 detection_loss_reg: 0.3251 caption_loss_cls: 2.0000 grounding_loss_reg: 2.1636 semantic_segmentation_loss_cls: 0.0069 instance_segmentation_loss_cls: 0.0258 instance_segmentation_loss_reg: 0.3184 instance_segmentation_loss_poly: 0.8397 +2024/01/11 10:50:05 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240111_050137 +2024/01/11 10:50:05 - mmengine - INFO - Iter(train) [500000/640000] base_lr: 2.4472e-05 lr: 4.0429e-06 eta: 2 days, 9:30:31 time: 1.4797 data_time: 0.0247 memory: 25718 grad_norm: 3.3578 loss: 1.1331 detection_loss_cls: 0.0273 detection_loss_reg: 0.3255 caption_loss_cls: 1.9972 grounding_loss_reg: 2.1596 semantic_segmentation_loss_cls: 0.0069 instance_segmentation_loss_cls: 0.0259 instance_segmentation_loss_reg: 0.3194 instance_segmentation_loss_poly: 0.8420 +2024/01/11 10:50:05 - mmengine - INFO - Saving checkpoint at 500000 iterations +2024/01/11 11:02:25 - mmengine - INFO - Evaluating bbox... +2024/01/11 11:03:21 - mmengine - INFO - bbox_mAP_copypaste: 0.513 0.693 0.561 0.353 0.560 0.654 +2024/01/11 11:03:21 - mmengine - INFO - Evaluating segm... +2024/01/11 11:04:37 - mmengine - INFO - segm_mAP_copypaste: 0.350 0.615 0.347 0.200 0.393 0.527 +2024/01/11 11:12:12 - mmengine - INFO - per class results: +2024/01/11 11:12:12 - mmengine - INFO - ++---------------------+-------+-------+ +| Class | IoU | Acc | ++---------------------+-------+-------+ +| wall | 78.58 | 90.03 | +| building | 82.73 | 92.0 | +| sky | 93.43 | 98.05 | +| floor | 82.75 | 91.17 | +| tree | 74.37 | 87.23 | +| ceiling | 85.63 | 94.78 | +| road | 84.86 | 90.83 | +| bed | 89.99 | 95.95 | +| windowpane | 64.1 | 79.25 | +| grass | 65.09 | 82.93 | +| cabinet | 62.13 | 71.24 | +| sidewalk | 64.79 | 78.58 | +| person | 81.19 | 91.57 | +| earth | 42.48 | 55.18 | +| door | 53.89 | 66.35 | +| table | 65.39 | 81.19 | +| mountain | 61.71 | 72.58 | +| plant | 52.54 | 62.42 | +| curtain | 76.02 | 87.77 | +| chair | 61.91 | 74.81 | +| car | 85.57 | 92.2 | +| water | 57.09 | 74.5 | +| painting | 72.87 | 87.2 | +| sofa | 70.23 | 83.3 | +| shelf | 45.71 | 61.45 | +| house | 43.11 | 59.58 | +| sea | 55.64 | 69.08 | +| mirror | 70.13 | 78.95 | +| rug | 67.84 | 76.28 | +| field | 32.58 | 51.81 | +| armchair | 48.41 | 66.11 | +| seat | 62.97 | 80.12 | +| fence | 45.23 | 64.41 | +| desk | 47.53 | 69.29 | +| rock | 49.39 | 74.38 | +| wardrobe | 44.27 | 61.5 | +| lamp | 64.02 | 77.35 | +| bathtub | 80.37 | 84.98 | +| railing | 37.92 | 53.76 | +| cushion | 60.99 | 70.73 | +| base | 21.23 | 26.96 | +| box | 28.92 | 39.6 | +| column | 52.7 | 63.93 | +| signboard | 37.43 | 53.35 | +| chest of drawers | 40.9 | 59.95 | +| counter | 20.6 | 28.04 | +| sand | 47.64 | 58.13 | +| sink | 77.04 | 83.21 | +| skyscraper | 58.8 | 74.01 | +| fireplace | 75.99 | 88.27 | +| refrigerator | 72.14 | 79.02 | +| grandstand | 42.79 | 75.71 | +| path | 25.45 | 40.13 | +| stairs | 27.82 | 33.06 | +| runway | 76.95 | 88.67 | +| case | 48.88 | 68.03 | +| pool table | 91.26 | 96.55 | +| pillow | 60.67 | 73.38 | +| screen door | 80.44 | 83.24 | +| stairway | 30.55 | 44.56 | +| river | 14.13 | 28.71 | +| bridge | 65.9 | 86.64 | +| bookcase | 37.87 | 58.16 | +| blind | 38.94 | 42.12 | +| coffee table | 68.97 | 83.18 | +| toilet | 87.81 | 91.9 | +| flower | 39.66 | 54.22 | +| book | 51.62 | 68.02 | +| hill | 12.84 | 21.23 | +| bench | 59.61 | 70.91 | +| countertop | 58.59 | 75.28 | +| stove | 75.98 | 82.7 | +| palm | 45.8 | 61.31 | +| kitchen island | 43.75 | 76.13 | +| computer | 71.78 | 80.31 | +| swivel chair | 39.81 | 51.22 | +| boat | 78.55 | 85.29 | +| bar | 40.38 | 60.7 | +| arcade machine | 56.76 | 61.08 | +| hovel | 20.46 | 23.28 | +| bus | 93.14 | 95.56 | +| towel | 64.91 | 78.92 | +| light | 52.69 | 62.08 | +| truck | 45.35 | 55.37 | +| tower | 22.39 | 38.23 | +| chandelier | 64.58 | 78.86 | +| awning | 32.98 | 40.83 | +| streetlight | 32.87 | 42.53 | +| booth | 31.63 | 35.7 | +| television receiver | 71.01 | 81.37 | +| airplane | 65.83 | 79.18 | +| dirt track | 12.13 | 20.18 | +| apparel | 37.24 | 55.66 | +| pole | 27.76 | 40.89 | +| land | 3.38 | 6.9 | +| bannister | 16.88 | 22.89 | +| escalator | 19.17 | 20.93 | +| ottoman | 50.51 | 68.62 | +| bottle | 23.57 | 29.35 | +| buffet | 42.82 | 53.97 | +| poster | 33.3 | 38.58 | +| stage | 10.84 | 17.13 | +| van | 48.03 | 64.35 | +| ship | 9.38 | 9.73 | +| fountain | 19.82 | 20.13 | +| conveyer belt | 81.52 | 90.68 | +| canopy | 30.98 | 38.59 | +| washer | 68.98 | 69.79 | +| plaything | 28.3 | 31.97 | +| swimming pool | 61.19 | 75.36 | +| stool | 51.89 | 65.49 | +| barrel | 24.01 | 70.2 | +| basket | 31.22 | 47.65 | +| waterfall | 61.68 | 88.55 | +| tent | 90.28 | 96.8 | +| bag | 22.09 | 28.85 | +| minibike | 73.12 | 83.63 | +| cradle | 73.14 | 96.51 | +| oven | 53.18 | 74.73 | +| ball | 52.81 | 71.59 | +| food | 47.65 | 51.6 | +| step | 11.87 | 17.02 | +| tank | 31.75 | 43.22 | +| trade name | 21.2 | 23.14 | +| microwave | 84.73 | 89.41 | +| pot | 54.67 | 63.74 | +| animal | 57.67 | 60.58 | +| bicycle | 56.69 | 73.3 | +| lake | 59.06 | 63.25 | +| dishwasher | 60.24 | 71.82 | +| screen | 57.52 | 74.58 | +| blanket | 14.61 | 16.7 | +| sculpture | 58.59 | 67.78 | +| hood | 60.08 | 70.75 | +| sconce | 42.97 | 51.09 | +| vase | 46.13 | 61.95 | +| traffic light | 39.11 | 51.91 | +| tray | 7.83 | 14.49 | +| ashcan | 43.28 | 55.55 | +| fan | 58.86 | 68.66 | +| pier | 45.2 | 56.42 | +| crt screen | 13.16 | 20.06 | +| plate | 56.55 | 72.23 | +| monitor | 40.99 | 54.96 | +| bulletin board | 45.12 | 57.64 | +| shower | 4.17 | 5.85 | +| radiator | 60.61 | 69.04 | +| glass | 19.93 | 21.71 | +| clock | 26.05 | 33.76 | +| flag | 26.35 | 32.18 | ++---------------------+-------+-------+ +2024/01/11 11:12:30 - mmengine - INFO - Iter(val) [209/209] coco/bbox_mAP: 0.5130 coco/bbox_mAP_50: 0.6930 coco/bbox_mAP_75: 0.5610 coco/bbox_mAP_s: 0.3530 coco/bbox_mAP_m: 0.5600 coco/bbox_mAP_l: 0.6540 coco/segm_mAP: 0.3500 coco/segm_mAP_50: 0.6150 coco/segm_mAP_75: 0.3470 coco/segm_mAP_s: 0.2000 coco/segm_mAP_m: 0.3930 coco/segm_mAP_l: 0.5270 Bleu_1: 0.7654 Bleu_2: 0.6035 Bleu_3: 0.4626 Bleu_4: 0.3510 METEOR: 0.2757 ROUGE_L: 0.5641 CIDEr: 1.1305 SPICE: 0.2052 aAcc: 83.9100 mIoU: 50.5500 mAcc: 62.0300 visual-grounding/miou: 0.8230 visual-grounding/acc: 0.8853 data_time: 0.0100 time: 1.3620 +2024/01/11 11:24:22 - mmengine - INFO - Iter(train) [500500/640000] base_lr: 2.4318e-05 lr: 4.0289e-06 eta: 2 days, 9:14:04 time: 1.4623 data_time: 0.0213 memory: 25718 grad_norm: 3.4198 loss: 1.1511 detection_loss_cls: 0.0271 detection_loss_reg: 0.3240 caption_loss_cls: 1.9954 grounding_loss_reg: 2.1585 semantic_segmentation_loss_cls: 0.0069 instance_segmentation_loss_cls: 0.0258 instance_segmentation_loss_reg: 0.3188 instance_segmentation_loss_poly: 0.8406 +2024/01/11 11:36:19 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240111_050137 +2024/01/11 11:36:19 - mmengine - INFO - Iter(train) [501000/640000] base_lr: 2.4165e-05 lr: 4.0150e-06 eta: 2 days, 8:58:19 time: 1.4496 data_time: 0.0213 memory: 25718 grad_norm: 3.4593 loss: 1.1577 detection_loss_cls: 0.0270 detection_loss_reg: 0.3232 caption_loss_cls: 1.9918 grounding_loss_reg: 2.1601 semantic_segmentation_loss_cls: 0.0068 instance_segmentation_loss_cls: 0.0258 instance_segmentation_loss_reg: 0.3180 instance_segmentation_loss_poly: 0.8387 +2024/01/11 11:48:30 - mmengine - INFO - Iter(train) [501500/640000] base_lr: 2.4012e-05 lr: 4.0011e-06 eta: 2 days, 8:45:00 time: 1.4478 data_time: 0.0215 memory: 25718 grad_norm: 3.4683 loss: 1.1588 detection_loss_cls: 0.0270 detection_loss_reg: 0.3236 caption_loss_cls: 1.9926 grounding_loss_reg: 2.1582 semantic_segmentation_loss_cls: 0.0068 instance_segmentation_loss_cls: 0.0258 instance_segmentation_loss_reg: 0.3185 instance_segmentation_loss_poly: 0.8405 +2024/01/11 12:00:46 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240111_050137 +2024/01/11 12:00:46 - mmengine - INFO - Iter(train) [502000/640000] base_lr: 2.3859e-05 lr: 3.9872e-06 eta: 2 days, 8:32:23 time: 1.4610 data_time: 0.0219 memory: 25718 grad_norm: 3.4443 loss: 1.1510 detection_loss_cls: 0.0270 detection_loss_reg: 0.3228 caption_loss_cls: 1.9912 grounding_loss_reg: 2.1558 semantic_segmentation_loss_cls: 0.0068 instance_segmentation_loss_cls: 0.0259 instance_segmentation_loss_reg: 0.3188 instance_segmentation_loss_poly: 0.8411 +2024/01/11 12:00:46 - mmengine - INFO - Saving checkpoint at 502000 iterations +2024/01/11 12:13:02 - mmengine - INFO - Iter(train) [502500/640000] base_lr: 2.3707e-05 lr: 3.9734e-06 eta: 2 days, 8:19:52 time: 1.4542 data_time: 0.0225 memory: 25718 grad_norm: 3.4262 loss: 1.1379 detection_loss_cls: 0.0268 detection_loss_reg: 0.3209 caption_loss_cls: 1.9894 grounding_loss_reg: 2.1552 semantic_segmentation_loss_cls: 0.0068 instance_segmentation_loss_cls: 0.0257 instance_segmentation_loss_reg: 0.3171 instance_segmentation_loss_poly: 0.8385 +2024/01/11 12:26:08 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240111_050137 +2024/01/11 12:26:08 - mmengine - INFO - Iter(train) [503000/640000] base_lr: 2.3556e-05 lr: 3.9596e-06 eta: 2 days, 8:14:03 time: 1.4767 data_time: 0.0231 memory: 25718 grad_norm: 3.3822 loss: 1.1329 detection_loss_cls: 0.0267 detection_loss_reg: 0.3207 caption_loss_cls: 1.9887 grounding_loss_reg: 2.1530 semantic_segmentation_loss_cls: 0.0068 instance_segmentation_loss_cls: 0.0256 instance_segmentation_loss_reg: 0.3163 instance_segmentation_loss_poly: 0.8361 +2024/01/11 12:38:27 - mmengine - INFO - Iter(train) [503500/640000] base_lr: 2.3405e-05 lr: 3.9459e-06 eta: 2 days, 8:01:42 time: 1.4788 data_time: 0.0233 memory: 25718 grad_norm: 3.4171 loss: 1.1234 detection_loss_cls: 0.0266 detection_loss_reg: 0.3201 caption_loss_cls: 1.9876 grounding_loss_reg: 2.1533 semantic_segmentation_loss_cls: 0.0068 instance_segmentation_loss_cls: 0.0255 instance_segmentation_loss_reg: 0.3153 instance_segmentation_loss_poly: 0.8339 +2024/01/11 12:50:15 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240111_050137 +2024/01/11 12:50:15 - mmengine - INFO - Iter(train) [504000/640000] base_lr: 2.3254e-05 lr: 3.9322e-06 eta: 2 days, 7:45:22 time: 1.4658 data_time: 0.0234 memory: 25718 grad_norm: 3.4250 loss: 1.1280 detection_loss_cls: 0.0265 detection_loss_reg: 0.3199 caption_loss_cls: 1.9902 grounding_loss_reg: 2.1534 semantic_segmentation_loss_cls: 0.0068 instance_segmentation_loss_cls: 0.0254 instance_segmentation_loss_reg: 0.3158 instance_segmentation_loss_poly: 0.8353 +2024/01/11 12:50:15 - mmengine - INFO - Saving checkpoint at 504000 iterations +2024/01/11 13:02:17 - mmengine - INFO - Iter(train) [504500/640000] base_lr: 2.3104e-05 lr: 3.9185e-06 eta: 2 days, 7:31:03 time: 1.4677 data_time: 0.0275 memory: 25718 grad_norm: 3.4530 loss: 1.1271 detection_loss_cls: 0.0265 detection_loss_reg: 0.3195 caption_loss_cls: 1.9897 grounding_loss_reg: 2.1497 semantic_segmentation_loss_cls: 0.0068 instance_segmentation_loss_cls: 0.0253 instance_segmentation_loss_reg: 0.3148 instance_segmentation_loss_poly: 0.8331 +2024/01/11 13:15:05 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240111_050137 +2024/01/11 13:15:05 - mmengine - INFO - Iter(train) [505000/640000] base_lr: 2.2954e-05 lr: 3.9049e-06 eta: 2 days, 7:22:23 time: 1.4807 data_time: 0.0278 memory: 25718 grad_norm: 3.4499 loss: 1.1224 detection_loss_cls: 0.0265 detection_loss_reg: 0.3199 caption_loss_cls: 1.9889 grounding_loss_reg: 2.1500 semantic_segmentation_loss_cls: 0.0068 instance_segmentation_loss_cls: 0.0253 instance_segmentation_loss_reg: 0.3149 instance_segmentation_loss_poly: 0.8337 +2024/01/11 13:28:20 - mmengine - INFO - Iter(train) [505500/640000] base_lr: 2.2805e-05 lr: 3.8913e-06 eta: 2 days, 7:16:30 time: 1.4965 data_time: 0.0281 memory: 25718 grad_norm: 3.3821 loss: 1.1150 detection_loss_cls: 0.0264 detection_loss_reg: 0.3195 caption_loss_cls: 1.9845 grounding_loss_reg: 2.1515 semantic_segmentation_loss_cls: 0.0069 instance_segmentation_loss_cls: 0.0253 instance_segmentation_loss_reg: 0.3150 instance_segmentation_loss_poly: 0.8323 +2024/01/11 13:40:37 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240111_050137 +2024/01/11 13:40:37 - mmengine - INFO - Iter(train) [506000/640000] base_lr: 2.2656e-05 lr: 3.8778e-06 eta: 2 days, 7:03:48 time: 1.4968 data_time: 0.0281 memory: 25718 grad_norm: 3.3870 loss: 1.1166 detection_loss_cls: 0.0264 detection_loss_reg: 0.3195 caption_loss_cls: 1.9823 grounding_loss_reg: 2.1503 semantic_segmentation_loss_cls: 0.0069 instance_segmentation_loss_cls: 0.0253 instance_segmentation_loss_reg: 0.3151 instance_segmentation_loss_poly: 0.8325 +2024/01/11 13:40:37 - mmengine - INFO - Saving checkpoint at 506000 iterations +2024/01/11 13:53:36 - mmengine - INFO - Iter(train) [506500/640000] base_lr: 2.2508e-05 lr: 3.8643e-06 eta: 2 days, 6:55:41 time: 1.5074 data_time: 0.0282 memory: 25718 grad_norm: 3.3541 loss: 1.1247 detection_loss_cls: 0.0263 detection_loss_reg: 0.3191 caption_loss_cls: 1.9803 grounding_loss_reg: 2.1513 semantic_segmentation_loss_cls: 0.0068 instance_segmentation_loss_cls: 0.0253 instance_segmentation_loss_reg: 0.3146 instance_segmentation_loss_poly: 0.8316 +2024/01/11 14:05:33 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240111_050137 +2024/01/11 14:05:33 - mmengine - INFO - Iter(train) [507000/640000] base_lr: 2.2360e-05 lr: 3.8509e-06 eta: 2 days, 6:40:50 time: 1.4902 data_time: 0.0279 memory: 25718 grad_norm: 3.3986 loss: 1.1299 detection_loss_cls: 0.0262 detection_loss_reg: 0.3188 caption_loss_cls: 1.9792 grounding_loss_reg: 2.1528 semantic_segmentation_loss_cls: 0.0068 instance_segmentation_loss_cls: 0.0253 instance_segmentation_loss_reg: 0.3145 instance_segmentation_loss_poly: 0.8312 +2024/01/11 14:18:02 - mmengine - INFO - Iter(train) [507500/640000] base_lr: 2.2212e-05 lr: 3.8375e-06 eta: 2 days, 6:29:22 time: 1.4927 data_time: 0.0281 memory: 25718 grad_norm: 3.3599 loss: 1.1323 detection_loss_cls: 0.0264 detection_loss_reg: 0.3206 caption_loss_cls: 1.9815 grounding_loss_reg: 2.1509 semantic_segmentation_loss_cls: 0.0068 instance_segmentation_loss_cls: 0.0253 instance_segmentation_loss_reg: 0.3148 instance_segmentation_loss_poly: 0.8323 +2024/01/11 14:30:53 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240111_050137 +2024/01/11 14:30:53 - mmengine - INFO - Iter(train) [508000/640000] base_lr: 2.2066e-05 lr: 3.8241e-06 eta: 2 days, 6:20:05 time: 1.5087 data_time: 0.0283 memory: 25718 grad_norm: 3.3229 loss: 1.1144 detection_loss_cls: 0.0264 detection_loss_reg: 0.3199 caption_loss_cls: 1.9813 grounding_loss_reg: 2.1505 semantic_segmentation_loss_cls: 0.0068 instance_segmentation_loss_cls: 0.0253 instance_segmentation_loss_reg: 0.3147 instance_segmentation_loss_poly: 0.8324 +2024/01/11 14:30:53 - mmengine - INFO - Saving checkpoint at 508000 iterations +2024/01/11 14:43:28 - mmengine - INFO - Iter(train) [508500/640000] base_lr: 2.1919e-05 lr: 3.8108e-06 eta: 2 days, 6:09:01 time: 1.5168 data_time: 0.0285 memory: 25718 grad_norm: 3.3034 loss: 1.1161 detection_loss_cls: 0.0263 detection_loss_reg: 0.3187 caption_loss_cls: 1.9842 grounding_loss_reg: 2.1508 semantic_segmentation_loss_cls: 0.0068 instance_segmentation_loss_cls: 0.0252 instance_segmentation_loss_reg: 0.3149 instance_segmentation_loss_poly: 0.8316 +2024/01/11 14:55:19 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240111_050137 +2024/01/11 14:55:19 - mmengine - INFO - Iter(train) [509000/640000] base_lr: 2.1773e-05 lr: 3.7976e-06 eta: 2 days, 5:53:46 time: 1.5025 data_time: 0.0282 memory: 25718 grad_norm: 3.2869 loss: 1.1204 detection_loss_cls: 0.0263 detection_loss_reg: 0.3193 caption_loss_cls: 1.9868 grounding_loss_reg: 2.1482 semantic_segmentation_loss_cls: 0.0068 instance_segmentation_loss_cls: 0.0251 instance_segmentation_loss_reg: 0.3140 instance_segmentation_loss_poly: 0.8289 +2024/01/11 15:07:10 - mmengine - INFO - Iter(train) [509500/640000] base_lr: 2.1628e-05 lr: 3.7843e-06 eta: 2 days, 5:38:40 time: 1.4816 data_time: 0.0278 memory: 25718 grad_norm: 3.3506 loss: 1.1250 detection_loss_cls: 0.0264 detection_loss_reg: 0.3192 caption_loss_cls: 1.9894 grounding_loss_reg: 2.1487 semantic_segmentation_loss_cls: 0.0068 instance_segmentation_loss_cls: 0.0252 instance_segmentation_loss_reg: 0.3140 instance_segmentation_loss_poly: 0.8289 +2024/01/11 15:18:38 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240111_050137 +2024/01/11 15:18:38 - mmengine - INFO - Iter(train) [510000/640000] base_lr: 2.1483e-05 lr: 3.7712e-06 eta: 2 days, 5:21:39 time: 1.4695 data_time: 0.0276 memory: 25718 grad_norm: 3.3750 loss: 1.1268 detection_loss_cls: 0.0264 detection_loss_reg: 0.3194 caption_loss_cls: 1.9912 grounding_loss_reg: 2.1445 semantic_segmentation_loss_cls: 0.0068 instance_segmentation_loss_cls: 0.0253 instance_segmentation_loss_reg: 0.3142 instance_segmentation_loss_poly: 0.8287 +2024/01/11 15:18:38 - mmengine - INFO - Saving checkpoint at 510000 iterations +2024/01/11 15:30:56 - mmengine - INFO - Iter(train) [510500/640000] base_lr: 2.1338e-05 lr: 3.7580e-06 eta: 2 days, 5:09:11 time: 1.4592 data_time: 0.0275 memory: 25718 grad_norm: 3.4304 loss: 1.1386 detection_loss_cls: 0.0263 detection_loss_reg: 0.3180 caption_loss_cls: 1.9945 grounding_loss_reg: 2.1460 semantic_segmentation_loss_cls: 0.0068 instance_segmentation_loss_cls: 0.0253 instance_segmentation_loss_reg: 0.3146 instance_segmentation_loss_poly: 0.8282 +2024/01/11 15:43:35 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240111_050137 +2024/01/11 15:43:35 - mmengine - INFO - Iter(train) [511000/640000] base_lr: 2.1194e-05 lr: 3.7449e-06 eta: 2 days, 4:58:32 time: 1.4695 data_time: 0.0277 memory: 25718 grad_norm: 3.4160 loss: 1.1369 detection_loss_cls: 0.0262 detection_loss_reg: 0.3188 caption_loss_cls: 1.9988 grounding_loss_reg: 2.1483 semantic_segmentation_loss_cls: 0.0068 instance_segmentation_loss_cls: 0.0252 instance_segmentation_loss_reg: 0.3132 instance_segmentation_loss_poly: 0.8251 +2024/01/11 15:56:18 - mmengine - INFO - Iter(train) [511500/640000] base_lr: 2.1051e-05 lr: 3.7319e-06 eta: 2 days, 4:48:12 time: 1.4731 data_time: 0.0277 memory: 25718 grad_norm: 3.3874 loss: 1.1306 detection_loss_cls: 0.0262 detection_loss_reg: 0.3188 caption_loss_cls: 1.9970 grounding_loss_reg: 2.1484 semantic_segmentation_loss_cls: 0.0068 instance_segmentation_loss_cls: 0.0253 instance_segmentation_loss_reg: 0.3140 instance_segmentation_loss_poly: 0.8265 +2024/01/11 16:08:58 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240111_050137 +2024/01/11 16:08:58 - mmengine - INFO - Iter(train) [512000/640000] base_lr: 2.0908e-05 lr: 3.7189e-06 eta: 2 days, 4:37:30 time: 1.4703 data_time: 0.0277 memory: 25718 grad_norm: 3.4268 loss: 1.1370 detection_loss_cls: 0.0262 detection_loss_reg: 0.3188 caption_loss_cls: 1.9954 grounding_loss_reg: 2.1487 semantic_segmentation_loss_cls: 0.0068 instance_segmentation_loss_cls: 0.0252 instance_segmentation_loss_reg: 0.3137 instance_segmentation_loss_poly: 0.8254 +2024/01/11 16:08:58 - mmengine - INFO - Saving checkpoint at 512000 iterations +2024/01/11 16:22:03 - mmengine - INFO - Iter(train) [512500/640000] base_lr: 2.0765e-05 lr: 3.7059e-06 eta: 2 days, 4:28:42 time: 1.4778 data_time: 0.0276 memory: 25718 grad_norm: 3.3885 loss: 1.1242 detection_loss_cls: 0.0261 detection_loss_reg: 0.3176 caption_loss_cls: 1.9922 grounding_loss_reg: 2.1487 semantic_segmentation_loss_cls: 0.0068 instance_segmentation_loss_cls: 0.0252 instance_segmentation_loss_reg: 0.3133 instance_segmentation_loss_poly: 0.8243 +2024/01/11 16:34:46 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240111_050137 +2024/01/11 16:34:46 - mmengine - INFO - Iter(train) [513000/640000] base_lr: 2.0623e-05 lr: 3.6930e-06 eta: 2 days, 4:18:05 time: 1.4909 data_time: 0.0279 memory: 25718 grad_norm: 3.3841 loss: 1.1193 detection_loss_cls: 0.0261 detection_loss_reg: 0.3168 caption_loss_cls: 1.9953 grounding_loss_reg: 2.1484 semantic_segmentation_loss_cls: 0.0068 instance_segmentation_loss_cls: 0.0251 instance_segmentation_loss_reg: 0.3120 instance_segmentation_loss_poly: 0.8216 +2024/01/11 16:48:10 - mmengine - INFO - Iter(train) [513500/640000] base_lr: 2.0481e-05 lr: 3.6801e-06 eta: 2 days, 4:10:31 time: 1.5141 data_time: 0.0283 memory: 25718 grad_norm: 3.3539 loss: 1.1148 detection_loss_cls: 0.0260 detection_loss_reg: 0.3171 caption_loss_cls: 1.9962 grounding_loss_reg: 2.1475 semantic_segmentation_loss_cls: 0.0068 instance_segmentation_loss_cls: 0.0252 instance_segmentation_loss_reg: 0.3125 instance_segmentation_loss_poly: 0.8233 +2024/01/11 17:00:06 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240111_050137 +2024/01/11 17:00:06 - mmengine - INFO - Iter(train) [514000/640000] base_lr: 2.0340e-05 lr: 3.6673e-06 eta: 2 days, 3:56:06 time: 1.5209 data_time: 0.0285 memory: 25718 grad_norm: 3.3296 loss: 1.1153 detection_loss_cls: 0.0259 detection_loss_reg: 0.3176 caption_loss_cls: 1.9969 grounding_loss_reg: 2.1477 semantic_segmentation_loss_cls: 0.0068 instance_segmentation_loss_cls: 0.0251 instance_segmentation_loss_reg: 0.3124 instance_segmentation_loss_poly: 0.8231 +2024/01/11 17:00:06 - mmengine - INFO - Saving checkpoint at 514000 iterations +2024/01/11 17:12:34 - mmengine - INFO - Iter(train) [514500/640000] base_lr: 2.0200e-05 lr: 3.6545e-06 eta: 2 days, 3:44:11 time: 1.5236 data_time: 0.0285 memory: 25718 grad_norm: 3.3946 loss: 1.1082 detection_loss_cls: 0.0259 detection_loss_reg: 0.3167 caption_loss_cls: 1.9982 grounding_loss_reg: 2.1488 semantic_segmentation_loss_cls: 0.0068 instance_segmentation_loss_cls: 0.0251 instance_segmentation_loss_reg: 0.3122 instance_segmentation_loss_poly: 0.8218 +2024/01/11 17:25:06 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240111_050137 +2024/01/11 17:25:06 - mmengine - INFO - Iter(train) [515000/640000] base_lr: 2.0059e-05 lr: 3.6418e-06 eta: 2 days, 3:32:29 time: 1.5219 data_time: 0.0285 memory: 25718 grad_norm: 3.3874 loss: 1.1120 detection_loss_cls: 0.0259 detection_loss_reg: 0.3174 caption_loss_cls: 1.9983 grounding_loss_reg: 2.1488 semantic_segmentation_loss_cls: 0.0068 instance_segmentation_loss_cls: 0.0252 instance_segmentation_loss_reg: 0.3126 instance_segmentation_loss_poly: 0.8227 +2024/01/11 17:37:11 - mmengine - INFO - Iter(train) [515500/640000] base_lr: 1.9920e-05 lr: 3.6291e-06 eta: 2 days, 3:18:51 time: 1.5122 data_time: 0.0284 memory: 25718 grad_norm: 3.4278 loss: 1.1207 detection_loss_cls: 0.0260 detection_loss_reg: 0.3182 caption_loss_cls: 1.9927 grounding_loss_reg: 2.1469 semantic_segmentation_loss_cls: 0.0068 instance_segmentation_loss_cls: 0.0251 instance_segmentation_loss_reg: 0.3128 instance_segmentation_loss_poly: 0.8235 +2024/01/11 17:49:09 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240111_050137 +2024/01/11 17:49:09 - mmengine - INFO - Iter(train) [516000/640000] base_lr: 1.9781e-05 lr: 3.6164e-06 eta: 2 days, 3:04:51 time: 1.5019 data_time: 0.0281 memory: 25718 grad_norm: 3.4303 loss: 1.1153 detection_loss_cls: 0.0258 detection_loss_reg: 0.3162 caption_loss_cls: 1.9899 grounding_loss_reg: 2.1423 semantic_segmentation_loss_cls: 0.0067 instance_segmentation_loss_cls: 0.0251 instance_segmentation_loss_reg: 0.3113 instance_segmentation_loss_poly: 0.8212 +2024/01/11 17:49:09 - mmengine - INFO - Saving checkpoint at 516000 iterations +2024/01/11 18:02:08 - mmengine - INFO - Iter(train) [516500/640000] base_lr: 1.9642e-05 lr: 3.6038e-06 eta: 2 days, 2:54:58 time: 1.5004 data_time: 0.0281 memory: 25718 grad_norm: 3.4500 loss: 1.1193 detection_loss_cls: 0.0257 detection_loss_reg: 0.3157 caption_loss_cls: 1.9905 grounding_loss_reg: 2.1399 semantic_segmentation_loss_cls: 0.0068 instance_segmentation_loss_cls: 0.0251 instance_segmentation_loss_reg: 0.3113 instance_segmentation_loss_poly: 0.8207 +2024/01/11 18:13:44 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240111_050137 +2024/01/11 18:13:44 - mmengine - INFO - Iter(train) [517000/640000] base_lr: 1.9504e-05 lr: 3.5912e-06 eta: 2 days, 2:39:32 time: 1.4837 data_time: 0.0278 memory: 25718 grad_norm: 3.5244 loss: 1.1261 detection_loss_cls: 0.0257 detection_loss_reg: 0.3155 caption_loss_cls: 1.9923 grounding_loss_reg: 2.1393 semantic_segmentation_loss_cls: 0.0068 instance_segmentation_loss_cls: 0.0250 instance_segmentation_loss_reg: 0.3105 instance_segmentation_loss_poly: 0.8193 +2024/01/11 18:25:51 - mmengine - INFO - Iter(train) [517500/640000] base_lr: 1.9366e-05 lr: 3.5787e-06 eta: 2 days, 2:26:14 time: 1.4644 data_time: 0.0275 memory: 25718 grad_norm: 3.5487 loss: 1.1332 detection_loss_cls: 0.0256 detection_loss_reg: 0.3155 caption_loss_cls: 1.9914 grounding_loss_reg: 2.1386 semantic_segmentation_loss_cls: 0.0067 instance_segmentation_loss_cls: 0.0251 instance_segmentation_loss_reg: 0.3109 instance_segmentation_loss_poly: 0.8203 +2024/01/11 18:37:34 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240111_050137 +2024/01/11 18:37:34 - mmengine - INFO - Iter(train) [518000/640000] base_lr: 1.9229e-05 lr: 3.5662e-06 eta: 2 days, 2:11:22 time: 1.4610 data_time: 0.0274 memory: 25718 grad_norm: 3.5681 loss: 1.1324 detection_loss_cls: 0.0255 detection_loss_reg: 0.3147 caption_loss_cls: 1.9935 grounding_loss_reg: 2.1375 semantic_segmentation_loss_cls: 0.0067 instance_segmentation_loss_cls: 0.0249 instance_segmentation_loss_reg: 0.3097 instance_segmentation_loss_poly: 0.8185 +2024/01/11 18:37:34 - mmengine - INFO - Saving checkpoint at 518000 iterations +2024/01/11 18:49:23 - mmengine - INFO - Iter(train) [518500/640000] base_lr: 1.9092e-05 lr: 3.5538e-06 eta: 2 days, 1:57:05 time: 1.4513 data_time: 0.0274 memory: 25718 grad_norm: 3.5290 loss: 1.1252 detection_loss_cls: 0.0254 detection_loss_reg: 0.3139 caption_loss_cls: 1.9889 grounding_loss_reg: 2.1364 semantic_segmentation_loss_cls: 0.0067 instance_segmentation_loss_cls: 0.0249 instance_segmentation_loss_reg: 0.3095 instance_segmentation_loss_poly: 0.8184 +2024/01/11 19:01:22 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240111_050137 +2024/01/11 19:01:22 - mmengine - INFO - Iter(train) [519000/640000] base_lr: 1.8956e-05 lr: 3.5414e-06 eta: 2 days, 1:43:24 time: 1.4430 data_time: 0.0271 memory: 25718 grad_norm: 3.5848 loss: 1.1234 detection_loss_cls: 0.0254 detection_loss_reg: 0.3134 caption_loss_cls: 1.9847 grounding_loss_reg: 2.1400 semantic_segmentation_loss_cls: 0.0067 instance_segmentation_loss_cls: 0.0248 instance_segmentation_loss_reg: 0.3088 instance_segmentation_loss_poly: 0.8173 +2024/01/11 19:13:22 - mmengine - INFO - Iter(train) [519500/640000] base_lr: 1.8820e-05 lr: 3.5291e-06 eta: 2 days, 1:29:55 time: 1.4420 data_time: 0.0270 memory: 25718 grad_norm: 3.5769 loss: 1.1150 detection_loss_cls: 0.0254 detection_loss_reg: 0.3139 caption_loss_cls: 1.9776 grounding_loss_reg: 2.1367 semantic_segmentation_loss_cls: 0.0067 instance_segmentation_loss_cls: 0.0248 instance_segmentation_loss_reg: 0.3094 instance_segmentation_loss_poly: 0.8189 +2024/01/11 19:25:42 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240111_050137 +2024/01/11 19:25:42 - mmengine - INFO - Iter(train) [520000/640000] base_lr: 1.8685e-05 lr: 3.5168e-06 eta: 2 days, 1:17:33 time: 1.4471 data_time: 0.0271 memory: 25718 grad_norm: 3.5474 loss: 1.1157 detection_loss_cls: 0.0253 detection_loss_reg: 0.3134 caption_loss_cls: 1.9770 grounding_loss_reg: 2.1382 semantic_segmentation_loss_cls: 0.0068 instance_segmentation_loss_cls: 0.0247 instance_segmentation_loss_reg: 0.3090 instance_segmentation_loss_poly: 0.8178 +2024/01/11 19:25:42 - mmengine - INFO - Saving checkpoint at 520000 iterations +2024/01/11 19:38:30 - mmengine - INFO - Evaluating bbox... +2024/01/11 19:39:26 - mmengine - INFO - bbox_mAP_copypaste: 0.510 0.692 0.556 0.349 0.558 0.654 +2024/01/11 19:39:26 - mmengine - INFO - Evaluating segm... +2024/01/11 19:40:39 - mmengine - INFO - segm_mAP_copypaste: 0.347 0.612 0.342 0.197 0.393 0.526 +2024/01/11 19:46:53 - mmengine - INFO - per class results: +2024/01/11 19:46:53 - mmengine - INFO - ++---------------------+-------+-------+ +| Class | IoU | Acc | ++---------------------+-------+-------+ +| wall | 78.73 | 89.49 | +| building | 83.06 | 92.23 | +| sky | 93.32 | 97.12 | +| floor | 83.13 | 90.73 | +| tree | 73.76 | 89.02 | +| ceiling | 85.15 | 93.84 | +| road | 83.04 | 89.93 | +| bed | 91.11 | 96.37 | +| windowpane | 63.61 | 77.9 | +| grass | 66.36 | 82.27 | +| cabinet | 65.8 | 78.18 | +| sidewalk | 66.37 | 82.64 | +| person | 81.57 | 91.87 | +| earth | 39.14 | 50.75 | +| door | 54.01 | 67.93 | +| table | 66.69 | 78.36 | +| mountain | 61.77 | 72.03 | +| plant | 51.98 | 62.89 | +| curtain | 75.66 | 88.27 | +| chair | 61.36 | 74.07 | +| car | 84.79 | 92.07 | +| water | 56.69 | 73.05 | +| painting | 71.66 | 86.87 | +| sofa | 70.98 | 82.67 | +| shelf | 46.18 | 63.83 | +| house | 42.3 | 56.86 | +| sea | 55.3 | 70.55 | +| mirror | 71.45 | 80.26 | +| rug | 69.01 | 81.97 | +| field | 31.65 | 50.1 | +| armchair | 48.49 | 68.99 | +| seat | 63.15 | 80.77 | +| fence | 45.6 | 62.6 | +| desk | 48.69 | 69.8 | +| rock | 49.86 | 70.64 | +| wardrobe | 52.81 | 61.93 | +| lamp | 63.76 | 77.11 | +| bathtub | 82.07 | 84.72 | +| railing | 38.7 | 54.54 | +| cushion | 61.01 | 74.52 | +| base | 22.22 | 29.01 | +| box | 28.95 | 37.76 | +| column | 52.33 | 65.95 | +| signboard | 36.95 | 51.49 | +| chest of drawers | 40.98 | 60.99 | +| counter | 31.29 | 46.53 | +| sand | 50.53 | 71.82 | +| sink | 76.09 | 83.99 | +| skyscraper | 62.41 | 78.01 | +| fireplace | 77.69 | 90.27 | +| refrigerator | 72.3 | 80.59 | +| grandstand | 43.59 | 76.43 | +| path | 25.46 | 38.72 | +| stairs | 33.35 | 39.01 | +| runway | 71.08 | 85.91 | +| case | 50.44 | 66.19 | +| pool table | 87.35 | 96.84 | +| pillow | 59.59 | 71.39 | +| screen door | 79.55 | 83.04 | +| stairway | 30.78 | 43.74 | +| river | 14.07 | 29.98 | +| bridge | 60.01 | 75.1 | +| bookcase | 37.51 | 56.62 | +| blind | 40.79 | 48.17 | +| coffee table | 67.82 | 83.82 | +| toilet | 87.08 | 91.68 | +| flower | 41.54 | 56.41 | +| book | 52.1 | 72.35 | +| hill | 12.17 | 19.5 | +| bench | 58.64 | 67.09 | +| countertop | 58.74 | 75.12 | +| stove | 78.62 | 85.48 | +| palm | 47.49 | 70.74 | +| kitchen island | 42.75 | 75.32 | +| computer | 74.75 | 85.46 | +| swivel chair | 45.85 | 66.2 | +| boat | 70.31 | 75.84 | +| bar | 33.39 | 41.8 | +| arcade machine | 60.82 | 65.45 | +| hovel | 24.11 | 30.57 | +| bus | 92.83 | 95.18 | +| towel | 64.59 | 80.93 | +| light | 52.16 | 62.25 | +| truck | 43.45 | 60.89 | +| tower | 25.34 | 38.26 | +| chandelier | 65.74 | 81.03 | +| awning | 35.28 | 44.25 | +| streetlight | 33.64 | 45.28 | +| booth | 39.43 | 46.23 | +| television receiver | 68.78 | 83.79 | +| airplane | 60.41 | 75.53 | +| dirt track | 9.97 | 13.46 | +| apparel | 36.41 | 51.03 | +| pole | 27.22 | 39.55 | +| land | 3.34 | 5.82 | +| bannister | 17.48 | 24.16 | +| escalator | 25.08 | 26.37 | +| ottoman | 50.7 | 68.45 | +| bottle | 23.52 | 29.75 | +| buffet | 43.99 | 55.68 | +| poster | 37.12 | 45.2 | +| stage | 10.21 | 17.08 | +| van | 46.94 | 61.03 | +| ship | 9.36 | 10.68 | +| fountain | 21.14 | 22.21 | +| conveyer belt | 75.94 | 90.93 | +| canopy | 24.56 | 33.1 | +| washer | 72.88 | 74.55 | +| plaything | 32.74 | 39.42 | +| swimming pool | 56.97 | 58.68 | +| stool | 50.61 | 62.98 | +| barrel | 50.18 | 67.97 | +| basket | 28.54 | 42.62 | +| waterfall | 47.86 | 65.23 | +| tent | 73.14 | 96.53 | +| bag | 21.49 | 28.6 | +| minibike | 72.66 | 84.44 | +| cradle | 79.27 | 96.44 | +| oven | 53.66 | 74.25 | +| ball | 53.05 | 67.01 | +| food | 54.24 | 60.26 | +| step | 13.19 | 18.78 | +| tank | 37.18 | 45.23 | +| trade name | 30.15 | 39.08 | +| microwave | 84.05 | 89.84 | +| pot | 51.88 | 61.45 | +| animal | 57.12 | 59.8 | +| bicycle | 57.54 | 75.97 | +| lake | 57.59 | 63.84 | +| dishwasher | 64.49 | 74.99 | +| screen | 53.5 | 71.71 | +| blanket | 21.21 | 25.27 | +| sculpture | 54.98 | 69.23 | +| hood | 62.3 | 68.61 | +| sconce | 45.36 | 55.79 | +| vase | 45.43 | 61.36 | +| traffic light | 41.72 | 61.69 | +| tray | 7.88 | 14.88 | +| ashcan | 48.31 | 62.53 | +| fan | 60.78 | 72.2 | +| pier | 29.08 | 63.05 | +| crt screen | 9.72 | 20.69 | +| plate | 55.59 | 75.18 | +| monitor | 37.69 | 46.15 | +| bulletin board | 35.58 | 42.64 | +| shower | 4.05 | 10.0 | +| radiator | 59.7 | 68.78 | +| glass | 20.83 | 22.86 | +| clock | 26.93 | 33.55 | +| flag | 31.79 | 37.53 | ++---------------------+-------+-------+ +2024/01/11 19:47:10 - mmengine - INFO - Iter(val) [209/209] coco/bbox_mAP: 0.5100 coco/bbox_mAP_50: 0.6920 coco/bbox_mAP_75: 0.5560 coco/bbox_mAP_s: 0.3490 coco/bbox_mAP_m: 0.5580 coco/bbox_mAP_l: 0.6540 coco/segm_mAP: 0.3470 coco/segm_mAP_50: 0.6120 coco/segm_mAP_75: 0.3420 coco/segm_mAP_s: 0.1970 coco/segm_mAP_m: 0.3930 coco/segm_mAP_l: 0.5260 Bleu_1: 0.7691 Bleu_2: 0.6068 Bleu_3: 0.4645 Bleu_4: 0.3511 METEOR: 0.2767 ROUGE_L: 0.5650 CIDEr: 1.1397 SPICE: 0.2069 aAcc: 83.9700 mIoU: 50.7900 mAcc: 62.6700 visual-grounding/miou: 0.8263 visual-grounding/acc: 0.8874 data_time: 0.0045 time: 1.3579 +2024/01/11 19:59:23 - mmengine - INFO - Iter(train) [520500/640000] base_lr: 1.8550e-05 lr: 3.5045e-06 eta: 2 days, 1:04:58 time: 1.4364 data_time: 0.0231 memory: 25718 grad_norm: 3.5247 loss: 1.1262 detection_loss_cls: 0.0254 detection_loss_reg: 0.3141 caption_loss_cls: 1.9802 grounding_loss_reg: 2.1397 semantic_segmentation_loss_cls: 0.0068 instance_segmentation_loss_cls: 0.0248 instance_segmentation_loss_reg: 0.3095 instance_segmentation_loss_poly: 0.8183 +2024/01/11 20:11:46 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240111_050137 +2024/01/11 20:11:46 - mmengine - INFO - Iter(train) [521000/640000] base_lr: 1.8416e-05 lr: 3.4923e-06 eta: 2 days, 0:52:52 time: 1.4481 data_time: 0.0233 memory: 25718 grad_norm: 3.4860 loss: 1.1217 detection_loss_cls: 0.0254 detection_loss_reg: 0.3143 caption_loss_cls: 1.9799 grounding_loss_reg: 2.1358 semantic_segmentation_loss_cls: 0.0068 instance_segmentation_loss_cls: 0.0247 instance_segmentation_loss_reg: 0.3091 instance_segmentation_loss_poly: 0.8168 +2024/01/11 20:25:10 - mmengine - INFO - Iter(train) [521500/640000] base_lr: 1.8282e-05 lr: 3.4802e-06 eta: 2 days, 0:44:06 time: 1.4674 data_time: 0.0237 memory: 25718 grad_norm: 3.4338 loss: 1.1126 detection_loss_cls: 0.0254 detection_loss_reg: 0.3137 caption_loss_cls: 1.9810 grounding_loss_reg: 2.1343 semantic_segmentation_loss_cls: 0.0068 instance_segmentation_loss_cls: 0.0248 instance_segmentation_loss_reg: 0.3097 instance_segmentation_loss_poly: 0.8177 +2024/01/11 20:38:01 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240111_050137 +2024/01/11 20:38:01 - mmengine - INFO - Iter(train) [522000/640000] base_lr: 1.8149e-05 lr: 3.4681e-06 eta: 2 days, 0:33:23 time: 1.4844 data_time: 0.0238 memory: 25718 grad_norm: 3.3758 loss: 1.0991 detection_loss_cls: 0.0255 detection_loss_reg: 0.3144 caption_loss_cls: 1.9762 grounding_loss_reg: 2.1360 semantic_segmentation_loss_cls: 0.0068 instance_segmentation_loss_cls: 0.0247 instance_segmentation_loss_reg: 0.3088 instance_segmentation_loss_poly: 0.8161 +2024/01/11 20:38:01 - mmengine - INFO - Saving checkpoint at 522000 iterations +2024/01/11 20:50:02 - mmengine - INFO - Iter(train) [522500/640000] base_lr: 1.8016e-05 lr: 3.4560e-06 eta: 2 days, 0:19:58 time: 1.4873 data_time: 0.0239 memory: 25718 grad_norm: 3.3643 loss: 1.1141 detection_loss_cls: 0.0256 detection_loss_reg: 0.3157 caption_loss_cls: 1.9794 grounding_loss_reg: 2.1354 semantic_segmentation_loss_cls: 0.0068 instance_segmentation_loss_cls: 0.0249 instance_segmentation_loss_reg: 0.3113 instance_segmentation_loss_poly: 0.8206 +2024/01/11 21:02:04 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240111_050137 +2024/01/11 21:02:04 - mmengine - INFO - Iter(train) [523000/640000] base_lr: 1.7884e-05 lr: 3.4440e-06 eta: 2 days, 0:06:38 time: 1.4882 data_time: 0.0239 memory: 25718 grad_norm: 3.3459 loss: 1.1138 detection_loss_cls: 0.0257 detection_loss_reg: 0.3163 caption_loss_cls: 1.9758 grounding_loss_reg: 2.1343 semantic_segmentation_loss_cls: 0.0068 instance_segmentation_loss_cls: 0.0250 instance_segmentation_loss_reg: 0.3113 instance_segmentation_loss_poly: 0.8208 +2024/01/11 21:14:38 - mmengine - INFO - Iter(train) [523500/640000] base_lr: 1.7752e-05 lr: 3.4320e-06 eta: 1 day, 23:55:00 time: 1.4966 data_time: 0.0242 memory: 25718 grad_norm: 3.3442 loss: 1.1184 detection_loss_cls: 0.0256 detection_loss_reg: 0.3157 caption_loss_cls: 1.9784 grounding_loss_reg: 2.1339 semantic_segmentation_loss_cls: 0.0068 instance_segmentation_loss_cls: 0.0250 instance_segmentation_loss_reg: 0.3124 instance_segmentation_loss_poly: 0.8230 +2024/01/11 21:26:41 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240111_050137 +2024/01/11 21:26:41 - mmengine - INFO - Iter(train) [524000/640000] base_lr: 1.7621e-05 lr: 3.4201e-06 eta: 1 day, 23:41:46 time: 1.4926 data_time: 0.0242 memory: 25718 grad_norm: 3.4000 loss: 1.1207 detection_loss_cls: 0.0256 detection_loss_reg: 0.3160 caption_loss_cls: 1.9703 grounding_loss_reg: 2.1302 semantic_segmentation_loss_cls: 0.0068 instance_segmentation_loss_cls: 0.0250 instance_segmentation_loss_reg: 0.3119 instance_segmentation_loss_poly: 0.8211 +2024/01/11 21:26:41 - mmengine - INFO - Saving checkpoint at 524000 iterations +2024/01/11 21:39:50 - mmengine - INFO - Iter(train) [524500/640000] base_lr: 1.7490e-05 lr: 3.4082e-06 eta: 1 day, 23:31:52 time: 1.5060 data_time: 0.0284 memory: 25718 grad_norm: 3.4025 loss: 1.1101 detection_loss_cls: 0.0257 detection_loss_reg: 0.3167 caption_loss_cls: 1.9714 grounding_loss_reg: 2.1283 semantic_segmentation_loss_cls: 0.0068 instance_segmentation_loss_cls: 0.0251 instance_segmentation_loss_reg: 0.3129 instance_segmentation_loss_poly: 0.8226 +2024/01/11 21:52:03 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240111_050137 +2024/01/11 21:52:03 - mmengine - INFO - Iter(train) [525000/640000] base_lr: 1.7360e-05 lr: 3.3963e-06 eta: 1 day, 23:19:07 time: 1.5034 data_time: 0.0284 memory: 25718 grad_norm: 3.4129 loss: 1.1165 detection_loss_cls: 0.0256 detection_loss_reg: 0.3153 caption_loss_cls: 1.9742 grounding_loss_reg: 2.1288 semantic_segmentation_loss_cls: 0.0067 instance_segmentation_loss_cls: 0.0251 instance_segmentation_loss_reg: 0.3128 instance_segmentation_loss_poly: 0.8226 +2024/01/11 22:04:23 - mmengine - INFO - Iter(train) [525500/640000] base_lr: 1.7230e-05 lr: 3.3845e-06 eta: 1 day, 23:06:43 time: 1.4874 data_time: 0.0280 memory: 25718 grad_norm: 3.4495 loss: 1.1167 detection_loss_cls: 0.0257 detection_loss_reg: 0.3148 caption_loss_cls: 1.9783 grounding_loss_reg: 2.1293 semantic_segmentation_loss_cls: 0.0067 instance_segmentation_loss_cls: 0.0250 instance_segmentation_loss_reg: 0.3114 instance_segmentation_loss_poly: 0.8203 +2024/01/11 22:16:55 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240111_050137 +2024/01/11 22:16:55 - mmengine - INFO - Iter(train) [526000/640000] base_lr: 1.7101e-05 lr: 3.3728e-06 eta: 1 day, 22:54:51 time: 1.4826 data_time: 0.0280 memory: 25718 grad_norm: 3.4390 loss: 1.1194 detection_loss_cls: 0.0257 detection_loss_reg: 0.3152 caption_loss_cls: 1.9828 grounding_loss_reg: 2.1263 semantic_segmentation_loss_cls: 0.0067 instance_segmentation_loss_cls: 0.0250 instance_segmentation_loss_reg: 0.3115 instance_segmentation_loss_poly: 0.8197 +2024/01/11 22:16:55 - mmengine - INFO - Saving checkpoint at 526000 iterations +2024/01/11 22:29:51 - mmengine - INFO - Iter(train) [526500/640000] base_lr: 1.6972e-05 lr: 3.3611e-06 eta: 1 day, 22:44:09 time: 1.4964 data_time: 0.0283 memory: 25718 grad_norm: 3.4043 loss: 1.1112 detection_loss_cls: 0.0257 detection_loss_reg: 0.3151 caption_loss_cls: 1.9862 grounding_loss_reg: 2.1242 semantic_segmentation_loss_cls: 0.0067 instance_segmentation_loss_cls: 0.0250 instance_segmentation_loss_reg: 0.3115 instance_segmentation_loss_poly: 0.8199 +2024/01/11 22:42:31 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240111_050137 +2024/01/11 22:42:31 - mmengine - INFO - Iter(train) [527000/640000] base_lr: 1.6844e-05 lr: 3.3494e-06 eta: 1 day, 22:32:39 time: 1.5059 data_time: 0.0285 memory: 25718 grad_norm: 3.3322 loss: 1.1057 detection_loss_cls: 0.0257 detection_loss_reg: 0.3158 caption_loss_cls: 1.9893 grounding_loss_reg: 2.1239 semantic_segmentation_loss_cls: 0.0067 instance_segmentation_loss_cls: 0.0250 instance_segmentation_loss_reg: 0.3118 instance_segmentation_loss_poly: 0.8204 +2024/01/11 22:54:46 - mmengine - INFO - Iter(train) [527500/640000] base_lr: 1.6716e-05 lr: 3.3378e-06 eta: 1 day, 22:19:59 time: 1.5011 data_time: 0.0283 memory: 25718 grad_norm: 3.3783 loss: 1.1150 detection_loss_cls: 0.0258 detection_loss_reg: 0.3149 caption_loss_cls: 1.9923 grounding_loss_reg: 2.1240 semantic_segmentation_loss_cls: 0.0067 instance_segmentation_loss_cls: 0.0250 instance_segmentation_loss_reg: 0.3107 instance_segmentation_loss_poly: 0.8176 +2024/01/11 23:07:09 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240111_050137 +2024/01/11 23:07:09 - mmengine - INFO - Iter(train) [528000/640000] base_lr: 1.6589e-05 lr: 3.3263e-06 eta: 1 day, 22:07:39 time: 1.5059 data_time: 0.0286 memory: 25718 grad_norm: 3.3414 loss: 1.1130 detection_loss_cls: 0.0257 detection_loss_reg: 0.3151 caption_loss_cls: 1.9894 grounding_loss_reg: 2.1240 semantic_segmentation_loss_cls: 0.0067 instance_segmentation_loss_cls: 0.0251 instance_segmentation_loss_reg: 0.3113 instance_segmentation_loss_poly: 0.8184 +2024/01/11 23:07:09 - mmengine - INFO - Saving checkpoint at 528000 iterations +2024/01/11 23:20:02 - mmengine - INFO - Iter(train) [528500/640000] base_lr: 1.6462e-05 lr: 3.3147e-06 eta: 1 day, 21:56:40 time: 1.5019 data_time: 0.0285 memory: 25718 grad_norm: 3.3652 loss: 1.1132 detection_loss_cls: 0.0258 detection_loss_reg: 0.3163 caption_loss_cls: 1.9882 grounding_loss_reg: 2.1221 semantic_segmentation_loss_cls: 0.0067 instance_segmentation_loss_cls: 0.0251 instance_segmentation_loss_reg: 0.3107 instance_segmentation_loss_poly: 0.8182 +2024/01/11 23:32:16 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240111_050137 +2024/01/11 23:32:16 - mmengine - INFO - Iter(train) [529000/640000] base_lr: 1.6336e-05 lr: 3.3033e-06 eta: 1 day, 21:43:57 time: 1.5022 data_time: 0.0286 memory: 25718 grad_norm: 3.3652 loss: 1.1146 detection_loss_cls: 0.0258 detection_loss_reg: 0.3165 caption_loss_cls: 1.9856 grounding_loss_reg: 2.1222 semantic_segmentation_loss_cls: 0.0067 instance_segmentation_loss_cls: 0.0251 instance_segmentation_loss_reg: 0.3119 instance_segmentation_loss_poly: 0.8206 +2024/01/11 23:44:54 - mmengine - INFO - Iter(train) [529500/640000] base_lr: 1.6210e-05 lr: 3.2918e-06 eta: 1 day, 21:32:16 time: 1.5067 data_time: 0.0287 memory: 25718 grad_norm: 3.3599 loss: 1.1194 detection_loss_cls: 0.0258 detection_loss_reg: 0.3158 caption_loss_cls: 1.9836 grounding_loss_reg: 2.1234 semantic_segmentation_loss_cls: 0.0067 instance_segmentation_loss_cls: 0.0251 instance_segmentation_loss_reg: 0.3112 instance_segmentation_loss_poly: 0.8194 +2024/01/11 23:56:42 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240111_050137 +2024/01/11 23:56:42 - mmengine - INFO - Iter(train) [530000/640000] base_lr: 1.6085e-05 lr: 3.2805e-06 eta: 1 day, 21:18:29 time: 1.4959 data_time: 0.0287 memory: 25718 grad_norm: 3.4600 loss: 1.1303 detection_loss_cls: 0.0257 detection_loss_reg: 0.3157 caption_loss_cls: 1.9772 grounding_loss_reg: 2.1215 semantic_segmentation_loss_cls: 0.0067 instance_segmentation_loss_cls: 0.0251 instance_segmentation_loss_reg: 0.3113 instance_segmentation_loss_poly: 0.8210 +2024/01/11 23:56:42 - mmengine - INFO - Saving checkpoint at 530000 iterations +2024/01/12 00:10:22 - mmengine - INFO - Iter(train) [530500/640000] base_lr: 1.5960e-05 lr: 3.2691e-06 eta: 1 day, 21:09:19 time: 1.5067 data_time: 0.0288 memory: 25718 grad_norm: 3.4099 loss: 1.1158 detection_loss_cls: 0.0257 detection_loss_reg: 0.3160 caption_loss_cls: 1.9737 grounding_loss_reg: 2.1190 semantic_segmentation_loss_cls: 0.0067 instance_segmentation_loss_cls: 0.0250 instance_segmentation_loss_reg: 0.3113 instance_segmentation_loss_poly: 0.8210 +2024/01/12 00:23:20 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240111_050137 +2024/01/12 00:23:20 - mmengine - INFO - Iter(train) [531000/640000] base_lr: 1.5836e-05 lr: 3.2578e-06 eta: 1 day, 20:58:21 time: 1.5111 data_time: 0.0289 memory: 25718 grad_norm: 3.4545 loss: 1.1214 detection_loss_cls: 0.0257 detection_loss_reg: 0.3157 caption_loss_cls: 1.9774 grounding_loss_reg: 2.1171 semantic_segmentation_loss_cls: 0.0067 instance_segmentation_loss_cls: 0.0250 instance_segmentation_loss_reg: 0.3099 instance_segmentation_loss_poly: 0.8184 +2024/01/12 00:35:31 - mmengine - INFO - Iter(train) [531500/640000] base_lr: 1.5713e-05 lr: 3.2466e-06 eta: 1 day, 20:45:31 time: 1.5102 data_time: 0.0290 memory: 25718 grad_norm: 3.4348 loss: 1.1216 detection_loss_cls: 0.0257 detection_loss_reg: 0.3158 caption_loss_cls: 1.9809 grounding_loss_reg: 2.1153 semantic_segmentation_loss_cls: 0.0067 instance_segmentation_loss_cls: 0.0251 instance_segmentation_loss_reg: 0.3112 instance_segmentation_loss_poly: 0.8210 +2024/01/12 00:47:58 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240111_050137 +2024/01/12 00:47:58 - mmengine - INFO - Iter(train) [532000/640000] base_lr: 1.5590e-05 lr: 3.2354e-06 eta: 1 day, 20:33:16 time: 1.5112 data_time: 0.0290 memory: 25718 grad_norm: 3.4496 loss: 1.1242 detection_loss_cls: 0.0257 detection_loss_reg: 0.3156 caption_loss_cls: 1.9809 grounding_loss_reg: 2.1139 semantic_segmentation_loss_cls: 0.0067 instance_segmentation_loss_cls: 0.0252 instance_segmentation_loss_reg: 0.3127 instance_segmentation_loss_poly: 0.8245 +2024/01/12 00:47:58 - mmengine - INFO - Saving checkpoint at 532000 iterations +2024/01/12 01:00:15 - mmengine - INFO - Iter(train) [532500/640000] base_lr: 1.5467e-05 lr: 3.2243e-06 eta: 1 day, 20:20:40 time: 1.5022 data_time: 0.0289 memory: 25718 grad_norm: 3.4897 loss: 1.1346 detection_loss_cls: 0.0258 detection_loss_reg: 0.3165 caption_loss_cls: 1.9804 grounding_loss_reg: 2.1144 semantic_segmentation_loss_cls: 0.0067 instance_segmentation_loss_cls: 0.0253 instance_segmentation_loss_reg: 0.3137 instance_segmentation_loss_poly: 0.8268 +2024/01/12 01:12:58 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240111_050137 +2024/01/12 01:12:58 - mmengine - INFO - Iter(train) [533000/640000] base_lr: 1.5345e-05 lr: 3.2132e-06 eta: 1 day, 20:09:04 time: 1.5095 data_time: 0.0288 memory: 25718 grad_norm: 3.4555 loss: 1.1209 detection_loss_cls: 0.0258 detection_loss_reg: 0.3165 caption_loss_cls: 1.9793 grounding_loss_reg: 2.1161 semantic_segmentation_loss_cls: 0.0067 instance_segmentation_loss_cls: 0.0253 instance_segmentation_loss_reg: 0.3135 instance_segmentation_loss_poly: 0.8264 +2024/01/12 01:24:48 - mmengine - INFO - Iter(train) [533500/640000] base_lr: 1.5223e-05 lr: 3.2021e-06 eta: 1 day, 19:55:26 time: 1.4974 data_time: 0.0286 memory: 25718 grad_norm: 3.4819 loss: 1.1226 detection_loss_cls: 0.0258 detection_loss_reg: 0.3165 caption_loss_cls: 1.9727 grounding_loss_reg: 2.1144 semantic_segmentation_loss_cls: 0.0067 instance_segmentation_loss_cls: 0.0253 instance_segmentation_loss_reg: 0.3137 instance_segmentation_loss_poly: 0.8270 +2024/01/12 01:36:53 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240111_050137 +2024/01/12 01:36:53 - mmengine - INFO - Iter(train) [534000/640000] base_lr: 1.5102e-05 lr: 3.1911e-06 eta: 1 day, 19:42:24 time: 1.5016 data_time: 0.0287 memory: 25718 grad_norm: 3.4401 loss: 1.1200 detection_loss_cls: 0.0259 detection_loss_reg: 0.3167 caption_loss_cls: 1.9725 grounding_loss_reg: 2.1128 semantic_segmentation_loss_cls: 0.0066 instance_segmentation_loss_cls: 0.0253 instance_segmentation_loss_reg: 0.3140 instance_segmentation_loss_poly: 0.8276 +2024/01/12 01:36:53 - mmengine - INFO - Saving checkpoint at 534000 iterations +2024/01/12 01:49:25 - mmengine - INFO - Iter(train) [534500/640000] base_lr: 1.4982e-05 lr: 3.1802e-06 eta: 1 day, 19:30:23 time: 1.4848 data_time: 0.0283 memory: 25718 grad_norm: 3.5032 loss: 1.1256 detection_loss_cls: 0.0259 detection_loss_reg: 0.3157 caption_loss_cls: 1.9705 grounding_loss_reg: 2.1102 semantic_segmentation_loss_cls: 0.0066 instance_segmentation_loss_cls: 0.0253 instance_segmentation_loss_reg: 0.3129 instance_segmentation_loss_poly: 0.8248 +2024/01/12 02:02:16 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240111_050137 +2024/01/12 02:02:16 - mmengine - INFO - Iter(train) [535000/640000] base_lr: 1.4862e-05 lr: 3.1692e-06 eta: 1 day, 19:19:01 time: 1.4831 data_time: 0.0284 memory: 25718 grad_norm: 3.5240 loss: 1.1255 detection_loss_cls: 0.0259 detection_loss_reg: 0.3164 caption_loss_cls: 1.9721 grounding_loss_reg: 2.1110 semantic_segmentation_loss_cls: 0.0066 instance_segmentation_loss_cls: 0.0252 instance_segmentation_loss_reg: 0.3116 instance_segmentation_loss_poly: 0.8221 +2024/01/12 02:14:52 - mmengine - INFO - Iter(train) [535500/640000] base_lr: 1.4742e-05 lr: 3.1584e-06 eta: 1 day, 19:07:06 time: 1.4893 data_time: 0.0282 memory: 25718 grad_norm: 3.4972 loss: 1.1082 detection_loss_cls: 0.0258 detection_loss_reg: 0.3149 caption_loss_cls: 1.9712 grounding_loss_reg: 2.1080 semantic_segmentation_loss_cls: 0.0067 instance_segmentation_loss_cls: 0.0252 instance_segmentation_loss_reg: 0.3114 instance_segmentation_loss_poly: 0.8211 +2024/01/12 02:27:15 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240111_050137 +2024/01/12 02:27:15 - mmengine - INFO - Iter(train) [536000/640000] base_lr: 1.4623e-05 lr: 3.1476e-06 eta: 1 day, 18:54:43 time: 1.4885 data_time: 0.0280 memory: 25718 grad_norm: 3.4853 loss: 1.1022 detection_loss_cls: 0.0257 detection_loss_reg: 0.3140 caption_loss_cls: 1.9729 grounding_loss_reg: 2.1080 semantic_segmentation_loss_cls: 0.0066 instance_segmentation_loss_cls: 0.0252 instance_segmentation_loss_reg: 0.3119 instance_segmentation_loss_poly: 0.8217 +2024/01/12 02:27:15 - mmengine - INFO - Saving checkpoint at 536000 iterations +2024/01/12 02:39:53 - mmengine - INFO - Iter(train) [536500/640000] base_lr: 1.4505e-05 lr: 3.1368e-06 eta: 1 day, 18:42:50 time: 1.4936 data_time: 0.0279 memory: 25718 grad_norm: 3.4395 loss: 1.0853 detection_loss_cls: 0.0256 detection_loss_reg: 0.3145 caption_loss_cls: 1.9702 grounding_loss_reg: 2.1081 semantic_segmentation_loss_cls: 0.0066 instance_segmentation_loss_cls: 0.0252 instance_segmentation_loss_reg: 0.3123 instance_segmentation_loss_poly: 0.8226 +2024/01/12 02:52:09 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240111_050137 +2024/01/12 02:52:09 - mmengine - INFO - Iter(train) [537000/640000] base_lr: 1.4387e-05 lr: 3.1261e-06 eta: 1 day, 18:30:13 time: 1.4868 data_time: 0.0278 memory: 25718 grad_norm: 3.4552 loss: 1.0913 detection_loss_cls: 0.0257 detection_loss_reg: 0.3152 caption_loss_cls: 1.9729 grounding_loss_reg: 2.1085 semantic_segmentation_loss_cls: 0.0066 instance_segmentation_loss_cls: 0.0251 instance_segmentation_loss_reg: 0.3116 instance_segmentation_loss_poly: 0.8214 +2024/01/12 03:04:07 - mmengine - INFO - Iter(train) [537500/640000] base_lr: 1.4269e-05 lr: 3.1154e-06 eta: 1 day, 18:16:59 time: 1.4888 data_time: 0.0279 memory: 25718 grad_norm: 3.4566 loss: 1.0930 detection_loss_cls: 0.0257 detection_loss_reg: 0.3147 caption_loss_cls: 1.9715 grounding_loss_reg: 2.1076 semantic_segmentation_loss_cls: 0.0067 instance_segmentation_loss_cls: 0.0252 instance_segmentation_loss_reg: 0.3124 instance_segmentation_loss_poly: 0.8222 +2024/01/12 03:16:21 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240111_050137 +2024/01/12 03:16:21 - mmengine - INFO - Iter(train) [538000/640000] base_lr: 1.4152e-05 lr: 3.1048e-06 eta: 1 day, 18:04:19 time: 1.4911 data_time: 0.0278 memory: 25718 grad_norm: 3.4581 loss: 1.0869 detection_loss_cls: 0.0258 detection_loss_reg: 0.3150 caption_loss_cls: 1.9739 grounding_loss_reg: 2.1045 semantic_segmentation_loss_cls: 0.0067 instance_segmentation_loss_cls: 0.0252 instance_segmentation_loss_reg: 0.3125 instance_segmentation_loss_poly: 0.8210 +2024/01/12 03:16:21 - mmengine - INFO - Saving checkpoint at 538000 iterations +2024/01/12 03:29:14 - mmengine - INFO - Iter(train) [538500/640000] base_lr: 1.4036e-05 lr: 3.0942e-06 eta: 1 day, 17:52:54 time: 1.4962 data_time: 0.0280 memory: 25718 grad_norm: 3.4589 loss: 1.0953 detection_loss_cls: 0.0259 detection_loss_reg: 0.3165 caption_loss_cls: 1.9757 grounding_loss_reg: 2.1058 semantic_segmentation_loss_cls: 0.0067 instance_segmentation_loss_cls: 0.0253 instance_segmentation_loss_reg: 0.3138 instance_segmentation_loss_poly: 0.8237 +2024/01/12 03:41:45 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240111_050137 +2024/01/12 03:41:45 - mmengine - INFO - Iter(train) [539000/640000] base_lr: 1.3920e-05 lr: 3.0837e-06 eta: 1 day, 17:40:46 time: 1.4912 data_time: 0.0280 memory: 25718 grad_norm: 3.4645 loss: 1.0981 detection_loss_cls: 0.0261 detection_loss_reg: 0.3178 caption_loss_cls: 1.9782 grounding_loss_reg: 2.1055 semantic_segmentation_loss_cls: 0.0067 instance_segmentation_loss_cls: 0.0254 instance_segmentation_loss_reg: 0.3142 instance_segmentation_loss_poly: 0.8245 +2024/01/12 03:53:41 - mmengine - INFO - Iter(train) [539500/640000] base_lr: 1.3805e-05 lr: 3.0732e-06 eta: 1 day, 17:27:33 time: 1.4813 data_time: 0.0277 memory: 25718 grad_norm: 3.4568 loss: 1.0990 detection_loss_cls: 0.0262 detection_loss_reg: 0.3192 caption_loss_cls: 1.9812 grounding_loss_reg: 2.1031 semantic_segmentation_loss_cls: 0.0067 instance_segmentation_loss_cls: 0.0254 instance_segmentation_loss_reg: 0.3150 instance_segmentation_loss_poly: 0.8266 +2024/01/12 04:06:12 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240111_050137 +2024/01/12 04:06:12 - mmengine - INFO - Iter(train) [540000/640000] base_lr: 1.3690e-05 lr: 3.0627e-06 eta: 1 day, 17:15:25 time: 1.4833 data_time: 0.0279 memory: 25718 grad_norm: 3.4650 loss: 1.1106 detection_loss_cls: 0.0263 detection_loss_reg: 0.3197 caption_loss_cls: 1.9848 grounding_loss_reg: 2.1034 semantic_segmentation_loss_cls: 0.0066 instance_segmentation_loss_cls: 0.0255 instance_segmentation_loss_reg: 0.3150 instance_segmentation_loss_poly: 0.8268 +2024/01/12 04:06:12 - mmengine - INFO - Saving checkpoint at 540000 iterations +2024/01/12 04:19:08 - mmengine - INFO - Evaluating bbox... +2024/01/12 04:20:06 - mmengine - INFO - bbox_mAP_copypaste: 0.513 0.693 0.561 0.352 0.561 0.653 +2024/01/12 04:20:06 - mmengine - INFO - Evaluating segm... +2024/01/12 04:21:18 - mmengine - INFO - segm_mAP_copypaste: 0.352 0.616 0.351 0.202 0.396 0.530 +2024/01/12 04:28:39 - mmengine - INFO - per class results: +2024/01/12 04:28:39 - mmengine - INFO - ++---------------------+-------+-------+ +| Class | IoU | Acc | ++---------------------+-------+-------+ +| wall | 78.78 | 89.13 | +| building | 83.24 | 92.01 | +| sky | 93.31 | 97.75 | +| floor | 83.37 | 90.48 | +| tree | 74.1 | 87.88 | +| ceiling | 85.07 | 95.16 | +| road | 83.95 | 90.85 | +| bed | 90.24 | 95.84 | +| windowpane | 63.75 | 78.91 | +| grass | 65.42 | 84.82 | +| cabinet | 66.18 | 78.2 | +| sidewalk | 67.23 | 80.89 | +| person | 81.66 | 92.04 | +| earth | 39.39 | 48.65 | +| door | 53.55 | 68.62 | +| table | 66.66 | 80.93 | +| mountain | 62.83 | 73.73 | +| plant | 50.92 | 62.87 | +| curtain | 76.41 | 87.08 | +| chair | 61.46 | 76.59 | +| car | 85.27 | 92.8 | +| water | 53.3 | 67.9 | +| painting | 71.73 | 87.9 | +| sofa | 70.23 | 82.6 | +| shelf | 46.79 | 66.57 | +| house | 42.65 | 57.49 | +| sea | 51.94 | 77.77 | +| mirror | 68.86 | 78.96 | +| rug | 69.37 | 78.72 | +| field | 31.04 | 46.91 | +| armchair | 48.0 | 68.49 | +| seat | 61.49 | 80.56 | +| fence | 42.63 | 60.52 | +| desk | 49.8 | 70.81 | +| rock | 49.45 | 73.36 | +| wardrobe | 49.42 | 59.37 | +| lamp | 63.36 | 75.91 | +| bathtub | 81.25 | 84.9 | +| railing | 39.31 | 56.5 | +| cushion | 61.7 | 74.32 | +| base | 24.55 | 35.39 | +| box | 27.75 | 37.59 | +| column | 52.41 | 66.95 | +| signboard | 38.44 | 52.58 | +| chest of drawers | 39.89 | 58.91 | +| counter | 29.34 | 43.18 | +| sand | 53.9 | 68.86 | +| sink | 76.13 | 83.53 | +| skyscraper | 65.35 | 81.79 | +| fireplace | 77.48 | 86.84 | +| refrigerator | 74.46 | 78.95 | +| grandstand | 41.81 | 77.13 | +| path | 26.12 | 38.37 | +| stairs | 28.55 | 34.93 | +| runway | 65.54 | 86.61 | +| case | 48.38 | 68.71 | +| pool table | 90.3 | 96.82 | +| pillow | 60.55 | 72.73 | +| screen door | 84.63 | 87.51 | +| stairway | 31.61 | 45.58 | +| river | 20.71 | 32.11 | +| bridge | 60.16 | 78.27 | +| bookcase | 37.76 | 59.69 | +| blind | 40.14 | 45.75 | +| coffee table | 69.29 | 82.87 | +| toilet | 87.23 | 91.32 | +| flower | 40.06 | 53.96 | +| book | 51.85 | 72.26 | +| hill | 13.65 | 23.74 | +| bench | 60.71 | 68.01 | +| countertop | 62.78 | 75.77 | +| stove | 75.76 | 82.16 | +| palm | 46.17 | 62.53 | +| kitchen island | 45.89 | 79.58 | +| computer | 68.58 | 77.11 | +| swivel chair | 41.15 | 54.74 | +| boat | 57.49 | 61.03 | +| bar | 34.26 | 46.93 | +| arcade machine | 59.28 | 62.87 | +| hovel | 18.99 | 21.18 | +| bus | 92.87 | 95.56 | +| towel | 65.01 | 78.78 | +| light | 51.56 | 61.05 | +| truck | 46.04 | 57.32 | +| tower | 22.53 | 38.89 | +| chandelier | 65.05 | 79.48 | +| awning | 34.32 | 39.37 | +| streetlight | 33.91 | 46.95 | +| booth | 35.66 | 41.34 | +| television receiver | 72.49 | 80.91 | +| airplane | 64.39 | 75.95 | +| dirt track | 14.91 | 21.3 | +| apparel | 34.3 | 44.25 | +| pole | 26.91 | 37.4 | +| land | 2.37 | 3.92 | +| bannister | 19.46 | 26.42 | +| escalator | 34.76 | 35.71 | +| ottoman | 50.15 | 64.29 | +| bottle | 24.13 | 30.23 | +| buffet | 44.19 | 53.46 | +| poster | 32.39 | 38.96 | +| stage | 10.14 | 18.93 | +| van | 44.44 | 58.25 | +| ship | 8.59 | 11.19 | +| fountain | 21.25 | 22.32 | +| conveyer belt | 69.15 | 91.43 | +| canopy | 32.08 | 35.55 | +| washer | 69.59 | 70.29 | +| plaything | 29.95 | 35.32 | +| swimming pool | 67.14 | 73.1 | +| stool | 51.45 | 65.43 | +| barrel | 11.47 | 27.86 | +| basket | 30.31 | 48.88 | +| waterfall | 59.41 | 82.16 | +| tent | 93.63 | 96.65 | +| bag | 22.14 | 28.82 | +| minibike | 72.71 | 83.94 | +| cradle | 74.49 | 96.27 | +| oven | 54.5 | 73.61 | +| ball | 57.41 | 76.07 | +| food | 55.11 | 60.89 | +| step | 11.56 | 16.72 | +| tank | 32.65 | 41.04 | +| trade name | 30.34 | 39.14 | +| microwave | 85.41 | 90.72 | +| pot | 52.35 | 61.79 | +| animal | 57.23 | 60.59 | +| bicycle | 57.76 | 74.89 | +| lake | 59.47 | 63.14 | +| dishwasher | 63.24 | 73.0 | +| screen | 55.76 | 71.45 | +| blanket | 13.93 | 16.07 | +| sculpture | 57.0 | 70.93 | +| hood | 56.77 | 69.36 | +| sconce | 45.43 | 56.48 | +| vase | 46.59 | 60.84 | +| traffic light | 41.37 | 61.31 | +| tray | 7.04 | 11.48 | +| ashcan | 48.25 | 63.88 | +| fan | 59.79 | 71.94 | +| pier | 26.9 | 41.77 | +| crt screen | 11.37 | 20.02 | +| plate | 56.53 | 75.51 | +| monitor | 32.14 | 46.96 | +| bulletin board | 51.61 | 71.31 | +| shower | 2.31 | 2.8 | +| radiator | 58.31 | 65.87 | +| glass | 20.9 | 23.03 | +| clock | 27.26 | 32.94 | +| flag | 36.02 | 42.71 | ++---------------------+-------+-------+ +2024/01/12 04:28:55 - mmengine - INFO - Iter(val) [209/209] coco/bbox_mAP: 0.5130 coco/bbox_mAP_50: 0.6930 coco/bbox_mAP_75: 0.5610 coco/bbox_mAP_s: 0.3520 coco/bbox_mAP_m: 0.5610 coco/bbox_mAP_l: 0.6530 coco/segm_mAP: 0.3520 coco/segm_mAP_50: 0.6160 coco/segm_mAP_75: 0.3510 coco/segm_mAP_s: 0.2020 coco/segm_mAP_m: 0.3960 coco/segm_mAP_l: 0.5300 Bleu_1: 0.7656 Bleu_2: 0.6026 Bleu_3: 0.4607 Bleu_4: 0.3489 METEOR: 0.2766 ROUGE_L: 0.5636 CIDEr: 1.1426 SPICE: 0.2065 aAcc: 83.9800 mIoU: 50.6800 mAcc: 62.2400 visual-grounding/miou: 0.8270 visual-grounding/acc: 0.8874 data_time: 0.0042 time: 1.3567 +2024/01/12 04:40:55 - mmengine - INFO - Iter(train) [540500/640000] base_lr: 1.3576e-05 lr: 3.0523e-06 eta: 1 day, 17:02:23 time: 1.4741 data_time: 0.0236 memory: 25718 grad_norm: 3.5093 loss: 1.1227 detection_loss_cls: 0.0262 detection_loss_reg: 0.3195 caption_loss_cls: 1.9807 grounding_loss_reg: 2.1009 semantic_segmentation_loss_cls: 0.0066 instance_segmentation_loss_cls: 0.0255 instance_segmentation_loss_reg: 0.3154 instance_segmentation_loss_poly: 0.8272 +2024/01/12 04:53:45 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240111_050137 +2024/01/12 04:53:45 - mmengine - INFO - Iter(train) [541000/640000] base_lr: 1.3462e-05 lr: 3.0420e-06 eta: 1 day, 16:50:49 time: 1.4825 data_time: 0.0237 memory: 25718 grad_norm: 3.5046 loss: 1.1189 detection_loss_cls: 0.0262 detection_loss_reg: 0.3197 caption_loss_cls: 1.9766 grounding_loss_reg: 2.0996 semantic_segmentation_loss_cls: 0.0066 instance_segmentation_loss_cls: 0.0254 instance_segmentation_loss_reg: 0.3157 instance_segmentation_loss_poly: 0.8290 +2024/01/12 05:42:04 - mmengine - INFO - Iter(train) [541500/640000] base_lr: 1.3349e-05 lr: 3.0317e-06 eta: 1 day, 16:20:50 time: 1.4837 data_time: 0.0223 memory: 25721 grad_norm: 3.4927 loss: 1.1219 detection_loss_cls: 0.0263 detection_loss_reg: 0.3213 caption_loss_cls: 1.9819 grounding_loss_reg: 2.0994 semantic_segmentation_loss_cls: 0.0066 instance_segmentation_loss_cls: 0.0255 instance_segmentation_loss_reg: 0.3168 instance_segmentation_loss_poly: 0.8306 +2024/01/12 05:54:16 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240112_050200 +2024/01/12 05:54:16 - mmengine - INFO - Iter(train) [542000/640000] base_lr: 1.3236e-05 lr: 3.0215e-06 eta: 1 day, 16:04:29 time: 1.4834 data_time: 0.0220 memory: 25721 grad_norm: 3.4956 loss: 1.1213 detection_loss_cls: 0.0263 detection_loss_reg: 0.3208 caption_loss_cls: 1.9819 grounding_loss_reg: 2.0976 semantic_segmentation_loss_cls: 0.0066 instance_segmentation_loss_cls: 0.0255 instance_segmentation_loss_reg: 0.3164 instance_segmentation_loss_poly: 0.8295 +2024/01/12 05:54:16 - mmengine - INFO - Saving checkpoint at 542000 iterations +2024/01/12 06:07:02 - mmengine - INFO - Iter(train) [542500/640000] base_lr: 1.3124e-05 lr: 3.0113e-06 eta: 1 day, 16:11:18 time: 1.4817 data_time: 0.0215 memory: 25721 grad_norm: 3.4982 loss: 1.1261 detection_loss_cls: 0.0263 detection_loss_reg: 0.3221 caption_loss_cls: 1.9798 grounding_loss_reg: 2.0964 semantic_segmentation_loss_cls: 0.0066 instance_segmentation_loss_cls: 0.0256 instance_segmentation_loss_reg: 0.3172 instance_segmentation_loss_poly: 0.8302 +2024/01/12 06:19:16 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240112_050200 +2024/01/12 06:19:16 - mmengine - INFO - Iter(train) [543000/640000] base_lr: 1.3012e-05 lr: 3.0011e-06 eta: 1 day, 15:54:05 time: 1.4773 data_time: 0.0211 memory: 25721 grad_norm: 3.4723 loss: 1.1225 detection_loss_cls: 0.0262 detection_loss_reg: 0.3218 caption_loss_cls: 1.9780 grounding_loss_reg: 2.0979 semantic_segmentation_loss_cls: 0.0066 instance_segmentation_loss_cls: 0.0255 instance_segmentation_loss_reg: 0.3168 instance_segmentation_loss_poly: 0.8298 +2024/01/12 06:31:19 - mmengine - INFO - Iter(train) [543500/640000] base_lr: 1.2901e-05 lr: 2.9910e-06 eta: 1 day, 15:33:31 time: 1.4789 data_time: 0.0209 memory: 25721 grad_norm: 3.5115 loss: 1.1268 detection_loss_cls: 0.0262 detection_loss_reg: 0.3214 caption_loss_cls: 1.9765 grounding_loss_reg: 2.0985 semantic_segmentation_loss_cls: 0.0066 instance_segmentation_loss_cls: 0.0255 instance_segmentation_loss_reg: 0.3167 instance_segmentation_loss_poly: 0.8295 +2024/01/12 06:44:46 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240112_050200 +2024/01/12 06:44:46 - mmengine - INFO - Iter(train) [544000/640000] base_lr: 1.2791e-05 lr: 2.9810e-06 eta: 1 day, 15:48:38 time: 1.4929 data_time: 0.0205 memory: 25721 grad_norm: 3.5062 loss: 1.1136 detection_loss_cls: 0.0261 detection_loss_reg: 0.3205 caption_loss_cls: 1.9780 grounding_loss_reg: 2.0979 semantic_segmentation_loss_cls: 0.0066 instance_segmentation_loss_cls: 0.0255 instance_segmentation_loss_reg: 0.3164 instance_segmentation_loss_poly: 0.8293 +2024/01/12 06:44:46 - mmengine - INFO - Saving checkpoint at 544000 iterations +2024/01/12 06:57:07 - mmengine - INFO - Iter(train) [544500/640000] base_lr: 1.2681e-05 lr: 2.9710e-06 eta: 1 day, 15:34:08 time: 1.4968 data_time: 0.0249 memory: 25721 grad_norm: 3.5645 loss: 1.1261 detection_loss_cls: 0.0261 detection_loss_reg: 0.3208 caption_loss_cls: 1.9808 grounding_loss_reg: 2.0985 semantic_segmentation_loss_cls: 0.0066 instance_segmentation_loss_cls: 0.0255 instance_segmentation_loss_reg: 0.3156 instance_segmentation_loss_poly: 0.8271 +2024/01/12 07:09:53 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240112_050200 +2024/01/12 07:09:54 - mmengine - INFO - Iter(train) [545000/640000] base_lr: 1.2571e-05 lr: 2.9610e-06 eta: 1 day, 15:28:10 time: 1.4999 data_time: 0.0248 memory: 25721 grad_norm: 3.5291 loss: 1.1094 detection_loss_cls: 0.0261 detection_loss_reg: 0.3200 caption_loss_cls: 1.9819 grounding_loss_reg: 2.0982 semantic_segmentation_loss_cls: 0.0066 instance_segmentation_loss_cls: 0.0255 instance_segmentation_loss_reg: 0.3158 instance_segmentation_loss_poly: 0.8272 +2024/01/12 07:22:13 - mmengine - INFO - Iter(train) [545500/640000] base_lr: 1.2462e-05 lr: 2.9511e-06 eta: 1 day, 15:13:11 time: 1.5014 data_time: 0.0250 memory: 25721 grad_norm: 3.5445 loss: 1.1180 detection_loss_cls: 0.0260 detection_loss_reg: 0.3207 caption_loss_cls: 1.9806 grounding_loss_reg: 2.0966 semantic_segmentation_loss_cls: 0.0066 instance_segmentation_loss_cls: 0.0255 instance_segmentation_loss_reg: 0.3168 instance_segmentation_loss_poly: 0.8290 +2024/01/12 07:34:32 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240112_050200 +2024/01/12 07:34:32 - mmengine - INFO - Iter(train) [546000/640000] base_lr: 1.2354e-05 lr: 2.9412e-06 eta: 1 day, 14:58:34 time: 1.5030 data_time: 0.0251 memory: 25721 grad_norm: 3.5632 loss: 1.1185 detection_loss_cls: 0.0260 detection_loss_reg: 0.3203 caption_loss_cls: 1.9779 grounding_loss_reg: 2.0926 semantic_segmentation_loss_cls: 0.0066 instance_segmentation_loss_cls: 0.0254 instance_segmentation_loss_reg: 0.3161 instance_segmentation_loss_poly: 0.8280 +2024/01/12 07:34:32 - mmengine - INFO - Saving checkpoint at 546000 iterations +2024/01/12 07:46:35 - mmengine - INFO - Iter(train) [546500/640000] base_lr: 1.2246e-05 lr: 2.9314e-06 eta: 1 day, 14:40:20 time: 1.4922 data_time: 0.0248 memory: 25721 grad_norm: 3.5880 loss: 1.1168 detection_loss_cls: 0.0259 detection_loss_reg: 0.3199 caption_loss_cls: 1.9752 grounding_loss_reg: 2.0946 semantic_segmentation_loss_cls: 0.0066 instance_segmentation_loss_cls: 0.0254 instance_segmentation_loss_reg: 0.3165 instance_segmentation_loss_poly: 0.8286 +2024/01/12 07:58:42 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240112_050200 +2024/01/12 07:58:42 - mmengine - INFO - Iter(train) [547000/640000] base_lr: 1.2138e-05 lr: 2.9217e-06 eta: 1 day, 14:24:01 time: 1.4907 data_time: 0.0247 memory: 25721 grad_norm: 3.6216 loss: 1.1081 detection_loss_cls: 0.0258 detection_loss_reg: 0.3188 caption_loss_cls: 1.9734 grounding_loss_reg: 2.0911 semantic_segmentation_loss_cls: 0.0066 instance_segmentation_loss_cls: 0.0253 instance_segmentation_loss_reg: 0.3155 instance_segmentation_loss_poly: 0.8266 +2024/01/12 08:11:10 - mmengine - INFO - Iter(train) [547500/640000] base_lr: 1.2031e-05 lr: 2.9119e-06 eta: 1 day, 14:12:25 time: 1.4968 data_time: 0.0249 memory: 25721 grad_norm: 3.5963 loss: 1.1066 detection_loss_cls: 0.0258 detection_loss_reg: 0.3181 caption_loss_cls: 1.9674 grounding_loss_reg: 2.0870 semantic_segmentation_loss_cls: 0.0066 instance_segmentation_loss_cls: 0.0253 instance_segmentation_loss_reg: 0.3155 instance_segmentation_loss_poly: 0.8270 +2024/01/12 08:23:26 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240112_050200 +2024/01/12 08:23:26 - mmengine - INFO - Iter(train) [548000/640000] base_lr: 1.1925e-05 lr: 2.9023e-06 eta: 1 day, 13:58:26 time: 1.4790 data_time: 0.0249 memory: 25721 grad_norm: 3.6372 loss: 1.1178 detection_loss_cls: 0.0256 detection_loss_reg: 0.3179 caption_loss_cls: 1.9678 grounding_loss_reg: 2.0847 semantic_segmentation_loss_cls: 0.0066 instance_segmentation_loss_cls: 0.0252 instance_segmentation_loss_reg: 0.3146 instance_segmentation_loss_poly: 0.8253 +2024/01/12 08:23:26 - mmengine - INFO - Saving checkpoint at 548000 iterations +2024/01/12 08:35:53 - mmengine - INFO - Iter(train) [548500/640000] base_lr: 1.1819e-05 lr: 2.8927e-06 eta: 1 day, 13:46:44 time: 1.4805 data_time: 0.0250 memory: 25721 grad_norm: 3.5689 loss: 1.1020 detection_loss_cls: 0.0255 detection_loss_reg: 0.3165 caption_loss_cls: 1.9639 grounding_loss_reg: 2.0862 semantic_segmentation_loss_cls: 0.0066 instance_segmentation_loss_cls: 0.0251 instance_segmentation_loss_reg: 0.3138 instance_segmentation_loss_poly: 0.8234 +2024/01/12 08:48:06 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240112_050200 +2024/01/12 08:48:06 - mmengine - INFO - Iter(train) [549000/640000] base_lr: 1.1714e-05 lr: 2.8831e-06 eta: 1 day, 13:32:36 time: 1.4722 data_time: 0.0248 memory: 25721 grad_norm: 3.5948 loss: 1.0998 detection_loss_cls: 0.0254 detection_loss_reg: 0.3146 caption_loss_cls: 1.9634 grounding_loss_reg: 2.0855 semantic_segmentation_loss_cls: 0.0066 instance_segmentation_loss_cls: 0.0249 instance_segmentation_loss_reg: 0.3121 instance_segmentation_loss_poly: 0.8209 +2024/01/12 09:01:14 - mmengine - INFO - Iter(train) [549500/640000] base_lr: 1.1609e-05 lr: 2.8736e-06 eta: 1 day, 13:27:24 time: 1.4844 data_time: 0.0250 memory: 25721 grad_norm: 3.5392 loss: 1.0885 detection_loss_cls: 0.0253 detection_loss_reg: 0.3150 caption_loss_cls: 1.9647 grounding_loss_reg: 2.0834 semantic_segmentation_loss_cls: 0.0066 instance_segmentation_loss_cls: 0.0249 instance_segmentation_loss_reg: 0.3121 instance_segmentation_loss_poly: 0.8212 +2024/01/12 09:13:30 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240112_050200 +2024/01/12 09:13:30 - mmengine - INFO - Iter(train) [550000/640000] base_lr: 1.1505e-05 lr: 2.8641e-06 eta: 1 day, 13:13:34 time: 1.4836 data_time: 0.0250 memory: 25721 grad_norm: 3.5340 loss: 1.0891 detection_loss_cls: 0.0252 detection_loss_reg: 0.3145 caption_loss_cls: 1.9673 grounding_loss_reg: 2.0829 semantic_segmentation_loss_cls: 0.0066 instance_segmentation_loss_cls: 0.0249 instance_segmentation_loss_reg: 0.3126 instance_segmentation_loss_poly: 0.8212 +2024/01/12 09:13:30 - mmengine - INFO - Saving checkpoint at 550000 iterations +2024/01/12 09:26:40 - mmengine - INFO - Iter(train) [550500/640000] base_lr: 1.1402e-05 lr: 2.8547e-06 eta: 1 day, 13:07:25 time: 1.5002 data_time: 0.0251 memory: 25721 grad_norm: 3.4896 loss: 1.0711 detection_loss_cls: 0.0253 detection_loss_reg: 0.3145 caption_loss_cls: 1.9683 grounding_loss_reg: 2.0835 semantic_segmentation_loss_cls: 0.0066 instance_segmentation_loss_cls: 0.0249 instance_segmentation_loss_reg: 0.3123 instance_segmentation_loss_poly: 0.8204 +2024/01/12 09:39:28 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240112_050200 +2024/01/12 09:39:28 - mmengine - INFO - Iter(train) [551000/640000] base_lr: 1.1299e-05 lr: 2.8453e-06 eta: 1 day, 12:57:51 time: 1.5104 data_time: 0.0252 memory: 25721 grad_norm: 3.4257 loss: 1.0686 detection_loss_cls: 0.0254 detection_loss_reg: 0.3152 caption_loss_cls: 1.9636 grounding_loss_reg: 2.0827 semantic_segmentation_loss_cls: 0.0066 instance_segmentation_loss_cls: 0.0249 instance_segmentation_loss_reg: 0.3121 instance_segmentation_loss_poly: 0.8206 +2024/01/12 09:51:43 - mmengine - INFO - Iter(train) [551500/640000] base_lr: 1.1196e-05 lr: 2.8360e-06 eta: 1 day, 12:43:45 time: 1.5074 data_time: 0.0251 memory: 25721 grad_norm: 3.4406 loss: 1.0712 detection_loss_cls: 0.0253 detection_loss_reg: 0.3144 caption_loss_cls: 1.9599 grounding_loss_reg: 2.0800 semantic_segmentation_loss_cls: 0.0066 instance_segmentation_loss_cls: 0.0249 instance_segmentation_loss_reg: 0.3120 instance_segmentation_loss_poly: 0.8203 +2024/01/12 10:03:10 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240112_050200 +2024/01/12 10:03:10 - mmengine - INFO - Iter(train) [552000/640000] base_lr: 1.1094e-05 lr: 2.8267e-06 eta: 1 day, 12:23:52 time: 1.4951 data_time: 0.0249 memory: 25721 grad_norm: 3.4548 loss: 1.0685 detection_loss_cls: 0.0252 detection_loss_reg: 0.3143 caption_loss_cls: 1.9584 grounding_loss_reg: 2.0781 semantic_segmentation_loss_cls: 0.0066 instance_segmentation_loss_cls: 0.0248 instance_segmentation_loss_reg: 0.3112 instance_segmentation_loss_poly: 0.8188 +2024/01/12 10:03:10 - mmengine - INFO - Saving checkpoint at 552000 iterations +2024/01/12 10:15:53 - mmengine - INFO - Iter(train) [552500/640000] base_lr: 1.0993e-05 lr: 2.8175e-06 eta: 1 day, 12:13:34 time: 1.4991 data_time: 0.0252 memory: 25721 grad_norm: 3.4873 loss: 1.0762 detection_loss_cls: 0.0251 detection_loss_reg: 0.3137 caption_loss_cls: 1.9554 grounding_loss_reg: 2.0788 semantic_segmentation_loss_cls: 0.0066 instance_segmentation_loss_cls: 0.0247 instance_segmentation_loss_reg: 0.3106 instance_segmentation_loss_poly: 0.8175 +2024/01/12 10:27:31 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240112_050200 +2024/01/12 10:27:31 - mmengine - INFO - Iter(train) [553000/640000] base_lr: 1.0892e-05 lr: 2.8083e-06 eta: 1 day, 11:55:46 time: 1.4901 data_time: 0.0251 memory: 25721 grad_norm: 3.5247 loss: 1.0811 detection_loss_cls: 0.0252 detection_loss_reg: 0.3140 caption_loss_cls: 1.9569 grounding_loss_reg: 2.0726 semantic_segmentation_loss_cls: 0.0066 instance_segmentation_loss_cls: 0.0247 instance_segmentation_loss_reg: 0.3101 instance_segmentation_loss_poly: 0.8165 +2024/01/12 10:39:43 - mmengine - INFO - Iter(train) [553500/640000] base_lr: 1.0791e-05 lr: 2.7992e-06 eta: 1 day, 11:42:10 time: 1.4762 data_time: 0.0250 memory: 25721 grad_norm: 3.5887 loss: 1.0903 detection_loss_cls: 0.0251 detection_loss_reg: 0.3137 caption_loss_cls: 1.9613 grounding_loss_reg: 2.0715 semantic_segmentation_loss_cls: 0.0066 instance_segmentation_loss_cls: 0.0247 instance_segmentation_loss_reg: 0.3097 instance_segmentation_loss_poly: 0.8155 +2024/01/12 10:52:19 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240112_050200 +2024/01/12 10:52:19 - mmengine - INFO - Iter(train) [554000/640000] base_lr: 1.0691e-05 lr: 2.7901e-06 eta: 1 day, 11:31:01 time: 1.4811 data_time: 0.0250 memory: 25721 grad_norm: 3.5707 loss: 1.0902 detection_loss_cls: 0.0249 detection_loss_reg: 0.3117 caption_loss_cls: 1.9602 grounding_loss_reg: 2.0712 semantic_segmentation_loss_cls: 0.0066 instance_segmentation_loss_cls: 0.0245 instance_segmentation_loss_reg: 0.3081 instance_segmentation_loss_poly: 0.8125 +2024/01/12 10:52:19 - mmengine - INFO - Saving checkpoint at 554000 iterations +2024/01/12 11:04:33 - mmengine - INFO - Iter(train) [554500/640000] base_lr: 1.0592e-05 lr: 2.7811e-06 eta: 1 day, 11:17:43 time: 1.4674 data_time: 0.0250 memory: 25721 grad_norm: 3.6263 loss: 1.1067 detection_loss_cls: 0.0248 detection_loss_reg: 0.3122 caption_loss_cls: 1.9603 grounding_loss_reg: 2.0697 semantic_segmentation_loss_cls: 0.0066 instance_segmentation_loss_cls: 0.0244 instance_segmentation_loss_reg: 0.3074 instance_segmentation_loss_poly: 0.8105 +2024/01/12 11:16:39 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240112_050200 +2024/01/12 11:16:39 - mmengine - INFO - Iter(train) [555000/640000] base_lr: 1.0493e-05 lr: 2.7721e-06 eta: 1 day, 11:03:40 time: 1.4568 data_time: 0.0249 memory: 25721 grad_norm: 3.6539 loss: 1.1136 detection_loss_cls: 0.0248 detection_loss_reg: 0.3118 caption_loss_cls: 1.9627 grounding_loss_reg: 2.0703 semantic_segmentation_loss_cls: 0.0066 instance_segmentation_loss_cls: 0.0244 instance_segmentation_loss_reg: 0.3077 instance_segmentation_loss_poly: 0.8113 +2024/01/12 11:28:59 - mmengine - INFO - Iter(train) [555500/640000] base_lr: 1.0395e-05 lr: 2.7632e-06 eta: 1 day, 10:51:03 time: 1.4580 data_time: 0.0250 memory: 25721 grad_norm: 3.6748 loss: 1.1156 detection_loss_cls: 0.0249 detection_loss_reg: 0.3123 caption_loss_cls: 1.9638 grounding_loss_reg: 2.0685 semantic_segmentation_loss_cls: 0.0066 instance_segmentation_loss_cls: 0.0244 instance_segmentation_loss_reg: 0.3078 instance_segmentation_loss_poly: 0.8118 +2024/01/12 11:41:20 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240112_050200 +2024/01/12 11:41:20 - mmengine - INFO - Iter(train) [556000/640000] base_lr: 1.0298e-05 lr: 2.7543e-06 eta: 1 day, 10:38:28 time: 1.4715 data_time: 0.0252 memory: 25721 grad_norm: 3.6336 loss: 1.1149 detection_loss_cls: 0.0250 detection_loss_reg: 0.3139 caption_loss_cls: 1.9619 grounding_loss_reg: 2.0684 semantic_segmentation_loss_cls: 0.0066 instance_segmentation_loss_cls: 0.0244 instance_segmentation_loss_reg: 0.3091 instance_segmentation_loss_poly: 0.8144 +2024/01/12 11:41:20 - mmengine - INFO - Saving checkpoint at 556000 iterations +2024/01/12 11:53:41 - mmengine - INFO - Iter(train) [556500/640000] base_lr: 1.0200e-05 lr: 2.7455e-06 eta: 1 day, 10:25:57 time: 1.4660 data_time: 0.0249 memory: 25721 grad_norm: 3.6198 loss: 1.1040 detection_loss_cls: 0.0250 detection_loss_reg: 0.3139 caption_loss_cls: 1.9594 grounding_loss_reg: 2.0665 semantic_segmentation_loss_cls: 0.0066 instance_segmentation_loss_cls: 0.0244 instance_segmentation_loss_reg: 0.3092 instance_segmentation_loss_poly: 0.8146 +2024/01/12 12:06:53 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240112_050200 +2024/01/12 12:06:53 - mmengine - INFO - Iter(train) [557000/640000] base_lr: 1.0104e-05 lr: 2.7367e-06 eta: 1 day, 10:17:36 time: 1.4897 data_time: 0.0254 memory: 25721 grad_norm: 3.5569 loss: 1.1040 detection_loss_cls: 0.0250 detection_loss_reg: 0.3140 caption_loss_cls: 1.9595 grounding_loss_reg: 2.0667 semantic_segmentation_loss_cls: 0.0066 instance_segmentation_loss_cls: 0.0245 instance_segmentation_loss_reg: 0.3100 instance_segmentation_loss_poly: 0.8166 +2024/01/12 12:19:20 - mmengine - INFO - Iter(train) [557500/640000] base_lr: 1.0008e-05 lr: 2.7280e-06 eta: 1 day, 10:05:22 time: 1.4931 data_time: 0.0254 memory: 25721 grad_norm: 3.5430 loss: 1.1003 detection_loss_cls: 0.0250 detection_loss_reg: 0.3137 caption_loss_cls: 1.9569 grounding_loss_reg: 2.0635 semantic_segmentation_loss_cls: 0.0066 instance_segmentation_loss_cls: 0.0244 instance_segmentation_loss_reg: 0.3099 instance_segmentation_loss_poly: 0.8167 +2024/01/12 12:31:15 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240112_050200 +2024/01/12 12:31:15 - mmengine - INFO - Iter(train) [558000/640000] base_lr: 9.9125e-06 lr: 2.7193e-06 eta: 1 day, 9:50:47 time: 1.4831 data_time: 0.0253 memory: 25721 grad_norm: 3.5585 loss: 1.1062 detection_loss_cls: 0.0249 detection_loss_reg: 0.3136 caption_loss_cls: 1.9573 grounding_loss_reg: 2.0639 semantic_segmentation_loss_cls: 0.0066 instance_segmentation_loss_cls: 0.0244 instance_segmentation_loss_reg: 0.3092 instance_segmentation_loss_poly: 0.8160 +2024/01/12 12:31:15 - mmengine - INFO - Saving checkpoint at 558000 iterations +2024/01/12 12:43:20 - mmengine - INFO - Iter(train) [558500/640000] base_lr: 9.8175e-06 lr: 2.7107e-06 eta: 1 day, 9:37:04 time: 1.4808 data_time: 0.0254 memory: 25721 grad_norm: 3.5826 loss: 1.1078 detection_loss_cls: 0.0249 detection_loss_reg: 0.3135 caption_loss_cls: 1.9553 grounding_loss_reg: 2.0601 semantic_segmentation_loss_cls: 0.0066 instance_segmentation_loss_cls: 0.0244 instance_segmentation_loss_reg: 0.3105 instance_segmentation_loss_poly: 0.8194 +2024/01/12 12:56:11 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240112_050200 +2024/01/12 12:56:11 - mmengine - INFO - Iter(train) [559000/640000] base_lr: 9.7232e-06 lr: 2.7021e-06 eta: 1 day, 9:26:40 time: 1.4920 data_time: 0.0255 memory: 25721 grad_norm: 3.6054 loss: 1.0980 detection_loss_cls: 0.0247 detection_loss_reg: 0.3119 caption_loss_cls: 1.9546 grounding_loss_reg: 2.0584 semantic_segmentation_loss_cls: 0.0066 instance_segmentation_loss_cls: 0.0243 instance_segmentation_loss_reg: 0.3088 instance_segmentation_loss_poly: 0.8156 +2024/01/12 13:09:23 - mmengine - INFO - Iter(train) [559500/640000] base_lr: 9.6294e-06 lr: 2.6936e-06 eta: 1 day, 9:17:35 time: 1.5048 data_time: 0.0258 memory: 25721 grad_norm: 3.5401 loss: 1.0843 detection_loss_cls: 0.0246 detection_loss_reg: 0.3106 caption_loss_cls: 1.9502 grounding_loss_reg: 2.0544 semantic_segmentation_loss_cls: 0.0066 instance_segmentation_loss_cls: 0.0242 instance_segmentation_loss_reg: 0.3084 instance_segmentation_loss_poly: 0.8146 +2024/01/12 13:21:40 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240112_050200 +2024/01/12 13:21:40 - mmengine - INFO - Iter(train) [560000/640000] base_lr: 9.5361e-06 lr: 2.6851e-06 eta: 1 day, 9:04:40 time: 1.5041 data_time: 0.0257 memory: 25721 grad_norm: 3.5634 loss: 1.0825 detection_loss_cls: 0.0245 detection_loss_reg: 0.3091 caption_loss_cls: 1.9464 grounding_loss_reg: 2.0522 semantic_segmentation_loss_cls: 0.0066 instance_segmentation_loss_cls: 0.0241 instance_segmentation_loss_reg: 0.3065 instance_segmentation_loss_poly: 0.8101 +2024/01/12 13:21:40 - mmengine - INFO - Saving checkpoint at 560000 iterations +2024/01/12 13:33:57 - mmengine - INFO - Evaluating bbox... +2024/01/12 13:34:55 - mmengine - INFO - bbox_mAP_copypaste: 0.513 0.693 0.560 0.352 0.559 0.649 +2024/01/12 13:34:55 - mmengine - INFO - Evaluating segm... +2024/01/12 13:36:09 - mmengine - INFO - segm_mAP_copypaste: 0.348 0.612 0.344 0.197 0.393 0.527 +2024/01/12 13:43:24 - mmengine - INFO - per class results: +2024/01/12 13:43:24 - mmengine - INFO - ++---------------------+-------+-------+ +| Class | IoU | Acc | ++---------------------+-------+-------+ +| wall | 78.54 | 89.59 | +| building | 83.25 | 92.41 | +| sky | 93.39 | 97.73 | +| floor | 83.06 | 90.73 | +| tree | 73.86 | 86.77 | +| ceiling | 85.32 | 94.44 | +| road | 83.7 | 88.97 | +| bed | 90.86 | 95.98 | +| windowpane | 64.35 | 78.78 | +| grass | 66.05 | 83.0 | +| cabinet | 64.96 | 79.96 | +| sidewalk | 66.9 | 82.85 | +| person | 81.42 | 92.33 | +| earth | 43.08 | 56.65 | +| door | 53.91 | 67.08 | +| table | 66.58 | 81.58 | +| mountain | 60.48 | 73.44 | +| plant | 51.27 | 61.38 | +| curtain | 75.19 | 86.93 | +| chair | 61.9 | 76.2 | +| car | 85.02 | 92.11 | +| water | 53.99 | 68.58 | +| painting | 72.41 | 88.04 | +| sofa | 70.91 | 81.81 | +| shelf | 46.86 | 65.8 | +| house | 47.55 | 64.27 | +| sea | 52.18 | 69.24 | +| mirror | 69.04 | 77.62 | +| rug | 68.89 | 79.62 | +| field | 29.34 | 48.39 | +| armchair | 51.09 | 70.55 | +| seat | 62.49 | 79.86 | +| fence | 45.41 | 62.81 | +| desk | 47.86 | 69.74 | +| rock | 45.17 | 64.61 | +| wardrobe | 52.04 | 59.74 | +| lamp | 64.18 | 76.62 | +| bathtub | 80.05 | 83.58 | +| railing | 37.9 | 53.78 | +| cushion | 58.7 | 67.32 | +| base | 23.05 | 30.78 | +| box | 28.39 | 36.99 | +| column | 52.04 | 65.9 | +| signboard | 38.08 | 49.74 | +| chest of drawers | 42.95 | 59.76 | +| counter | 22.35 | 31.78 | +| sand | 47.6 | 65.01 | +| sink | 76.33 | 83.77 | +| skyscraper | 64.15 | 80.64 | +| fireplace | 78.55 | 90.83 | +| refrigerator | 71.99 | 79.49 | +| grandstand | 42.18 | 76.95 | +| path | 25.94 | 39.19 | +| stairs | 26.33 | 31.9 | +| runway | 72.97 | 86.39 | +| case | 50.95 | 68.14 | +| pool table | 92.44 | 96.52 | +| pillow | 58.76 | 72.27 | +| screen door | 74.9 | 83.38 | +| stairway | 30.12 | 44.85 | +| river | 14.65 | 32.72 | +| bridge | 62.97 | 80.36 | +| bookcase | 39.71 | 58.09 | +| blind | 40.43 | 45.4 | +| coffee table | 68.76 | 83.03 | +| toilet | 86.89 | 91.92 | +| flower | 39.32 | 51.13 | +| book | 51.88 | 69.34 | +| hill | 12.66 | 22.94 | +| bench | 59.97 | 66.82 | +| countertop | 63.93 | 75.02 | +| stove | 78.56 | 84.9 | +| palm | 45.33 | 61.7 | +| kitchen island | 43.16 | 72.57 | +| computer | 73.37 | 83.92 | +| swivel chair | 40.16 | 52.82 | +| boat | 71.89 | 79.54 | +| bar | 31.86 | 42.91 | +| arcade machine | 44.7 | 47.9 | +| hovel | 8.79 | 9.55 | +| bus | 92.85 | 95.71 | +| towel | 63.78 | 77.87 | +| light | 53.05 | 63.75 | +| truck | 41.08 | 60.87 | +| tower | 22.85 | 40.29 | +| chandelier | 64.77 | 77.89 | +| awning | 35.8 | 43.73 | +| streetlight | 32.6 | 42.83 | +| booth | 36.76 | 42.27 | +| television receiver | 69.26 | 84.48 | +| airplane | 62.34 | 77.13 | +| dirt track | 14.66 | 19.54 | +| apparel | 32.88 | 44.5 | +| pole | 28.14 | 42.27 | +| land | 2.6 | 4.53 | +| bannister | 16.62 | 21.67 | +| escalator | 24.11 | 25.37 | +| ottoman | 49.16 | 65.75 | +| bottle | 23.17 | 30.0 | +| buffet | 40.29 | 48.09 | +| poster | 27.99 | 33.58 | +| stage | 9.82 | 17.65 | +| van | 48.86 | 63.31 | +| ship | 9.75 | 11.18 | +| fountain | 21.99 | 23.14 | +| conveyer belt | 78.19 | 90.89 | +| canopy | 28.96 | 31.61 | +| washer | 70.27 | 71.02 | +| plaything | 27.09 | 29.92 | +| swimming pool | 65.51 | 72.33 | +| stool | 50.69 | 63.85 | +| barrel | 17.04 | 70.95 | +| basket | 29.97 | 43.7 | +| waterfall | 56.65 | 75.68 | +| tent | 92.43 | 96.9 | +| bag | 20.48 | 24.04 | +| minibike | 73.07 | 82.82 | +| cradle | 72.09 | 96.57 | +| oven | 56.57 | 76.61 | +| ball | 54.2 | 69.02 | +| food | 54.21 | 59.66 | +| step | 10.42 | 15.37 | +| tank | 36.2 | 45.6 | +| trade name | 28.53 | 35.09 | +| microwave | 84.7 | 90.65 | +| pot | 53.37 | 62.18 | +| animal | 57.37 | 60.47 | +| bicycle | 58.13 | 75.88 | +| lake | 56.13 | 63.2 | +| dishwasher | 64.26 | 75.69 | +| screen | 52.85 | 74.32 | +| blanket | 16.43 | 18.9 | +| sculpture | 57.18 | 67.4 | +| hood | 60.2 | 69.3 | +| sconce | 45.52 | 55.16 | +| vase | 46.02 | 61.35 | +| traffic light | 39.84 | 56.08 | +| tray | 6.87 | 11.35 | +| ashcan | 44.4 | 56.22 | +| fan | 59.91 | 72.19 | +| pier | 46.95 | 65.17 | +| crt screen | 9.24 | 19.93 | +| plate | 55.85 | 73.94 | +| monitor | 32.84 | 41.62 | +| bulletin board | 38.01 | 48.46 | +| shower | 2.6 | 5.9 | +| radiator | 58.86 | 67.44 | +| glass | 20.12 | 21.89 | +| clock | 26.11 | 32.49 | +| flag | 34.07 | 39.99 | ++---------------------+-------+-------+ +2024/01/12 13:43:42 - mmengine - INFO - Iter(val) [209/209] coco/bbox_mAP: 0.5130 coco/bbox_mAP_50: 0.6930 coco/bbox_mAP_75: 0.5600 coco/bbox_mAP_s: 0.3520 coco/bbox_mAP_m: 0.5590 coco/bbox_mAP_l: 0.6490 coco/segm_mAP: 0.3480 coco/segm_mAP_50: 0.6120 coco/segm_mAP_75: 0.3440 coco/segm_mAP_s: 0.1970 coco/segm_mAP_m: 0.3930 coco/segm_mAP_l: 0.5270 Bleu_1: 0.7676 Bleu_2: 0.6056 Bleu_3: 0.4639 Bleu_4: 0.3514 METEOR: 0.2774 ROUGE_L: 0.5654 CIDEr: 1.1412 SPICE: 0.2063 aAcc: 83.9400 mIoU: 50.2900 mAcc: 61.7600 visual-grounding/miou: 0.8256 visual-grounding/acc: 0.8833 data_time: 0.0100 time: 1.3576 +2024/01/12 13:56:21 - mmengine - INFO - Iter(train) [560500/640000] base_lr: 9.4434e-06 lr: 2.6767e-06 eta: 1 day, 8:53:22 time: 1.5093 data_time: 0.0224 memory: 25722 grad_norm: 3.5374 loss: 1.0843 detection_loss_cls: 0.0245 detection_loss_reg: 0.3086 caption_loss_cls: 1.9451 grounding_loss_reg: 2.0516 semantic_segmentation_loss_cls: 0.0066 instance_segmentation_loss_cls: 0.0241 instance_segmentation_loss_reg: 0.3067 instance_segmentation_loss_poly: 0.8098 +2024/01/12 14:08:20 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240112_050200 +2024/01/12 14:08:20 - mmengine - INFO - Iter(train) [561000/640000] base_lr: 9.3512e-06 lr: 2.6683e-06 eta: 1 day, 8:39:20 time: 1.4910 data_time: 0.0222 memory: 25722 grad_norm: 3.5905 loss: 1.0804 detection_loss_cls: 0.0245 detection_loss_reg: 0.3078 caption_loss_cls: 1.9401 grounding_loss_reg: 2.0525 semantic_segmentation_loss_cls: 0.0066 instance_segmentation_loss_cls: 0.0241 instance_segmentation_loss_reg: 0.3056 instance_segmentation_loss_poly: 0.8075 +2024/01/12 14:20:47 - mmengine - INFO - Iter(train) [561500/640000] base_lr: 9.2596e-06 lr: 2.6600e-06 eta: 1 day, 8:27:05 time: 1.4912 data_time: 0.0225 memory: 25722 grad_norm: 3.5896 loss: 1.0798 detection_loss_cls: 0.0244 detection_loss_reg: 0.3061 caption_loss_cls: 1.9407 grounding_loss_reg: 2.0507 semantic_segmentation_loss_cls: 0.0066 instance_segmentation_loss_cls: 0.0239 instance_segmentation_loss_reg: 0.3033 instance_segmentation_loss_poly: 0.8025 +2024/01/12 14:33:43 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240112_050200 +2024/01/12 14:33:43 - mmengine - INFO - Iter(train) [562000/640000] base_lr: 9.1686e-06 lr: 2.6517e-06 eta: 1 day, 8:16:30 time: 1.5062 data_time: 0.0228 memory: 25722 grad_norm: 3.5405 loss: 1.0641 detection_loss_cls: 0.0243 detection_loss_reg: 0.3057 caption_loss_cls: 1.9444 grounding_loss_reg: 2.0501 semantic_segmentation_loss_cls: 0.0066 instance_segmentation_loss_cls: 0.0239 instance_segmentation_loss_reg: 0.3028 instance_segmentation_loss_poly: 0.8013 +2024/01/12 14:33:43 - mmengine - INFO - Saving checkpoint at 562000 iterations +2024/01/12 14:46:24 - mmengine - INFO - Iter(train) [562500/640000] base_lr: 9.0781e-06 lr: 2.6435e-06 eta: 1 day, 8:05:01 time: 1.5152 data_time: 0.0237 memory: 25722 grad_norm: 3.5160 loss: 1.0535 detection_loss_cls: 0.0243 detection_loss_reg: 0.3044 caption_loss_cls: 1.9423 grounding_loss_reg: 2.0476 semantic_segmentation_loss_cls: 0.0066 instance_segmentation_loss_cls: 0.0237 instance_segmentation_loss_reg: 0.3018 instance_segmentation_loss_poly: 0.7995 +2024/01/12 14:58:19 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240112_050200 +2024/01/12 14:58:19 - mmengine - INFO - Iter(train) [563000/640000] base_lr: 8.9881e-06 lr: 2.6353e-06 eta: 1 day, 7:50:52 time: 1.5012 data_time: 0.0237 memory: 25722 grad_norm: 3.4877 loss: 1.0600 detection_loss_cls: 0.0242 detection_loss_reg: 0.3034 caption_loss_cls: 1.9445 grounding_loss_reg: 2.0458 semantic_segmentation_loss_cls: 0.0066 instance_segmentation_loss_cls: 0.0237 instance_segmentation_loss_reg: 0.3011 instance_segmentation_loss_poly: 0.7987 +2024/01/12 15:10:14 - mmengine - INFO - Iter(train) [563500/640000] base_lr: 8.8987e-06 lr: 2.6272e-06 eta: 1 day, 7:36:49 time: 1.4819 data_time: 0.0235 memory: 25722 grad_norm: 3.5723 loss: 1.0667 detection_loss_cls: 0.0241 detection_loss_reg: 0.3020 caption_loss_cls: 1.9478 grounding_loss_reg: 2.0423 semantic_segmentation_loss_cls: 0.0066 instance_segmentation_loss_cls: 0.0236 instance_segmentation_loss_reg: 0.3008 instance_segmentation_loss_poly: 0.7979 +2024/01/12 15:21:43 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240112_050200 +2024/01/12 15:21:43 - mmengine - INFO - Iter(train) [564000/640000] base_lr: 8.8099e-06 lr: 2.6191e-06 eta: 1 day, 7:21:30 time: 1.4699 data_time: 0.0235 memory: 25722 grad_norm: 3.5910 loss: 1.0701 detection_loss_cls: 0.0242 detection_loss_reg: 0.3029 caption_loss_cls: 1.9450 grounding_loss_reg: 2.0401 semantic_segmentation_loss_cls: 0.0066 instance_segmentation_loss_cls: 0.0236 instance_segmentation_loss_reg: 0.2997 instance_segmentation_loss_poly: 0.7959 +2024/01/12 15:21:43 - mmengine - INFO - Saving checkpoint at 564000 iterations +2024/01/12 15:34:05 - mmengine - INFO - Iter(train) [564500/640000] base_lr: 8.7216e-06 lr: 2.6111e-06 eta: 1 day, 7:09:03 time: 1.4649 data_time: 0.0276 memory: 25722 grad_norm: 3.6489 loss: 1.0812 detection_loss_cls: 0.0243 detection_loss_reg: 0.3034 caption_loss_cls: 1.9461 grounding_loss_reg: 2.0386 semantic_segmentation_loss_cls: 0.0066 instance_segmentation_loss_cls: 0.0237 instance_segmentation_loss_reg: 0.3010 instance_segmentation_loss_poly: 0.7979 +2024/01/12 15:46:43 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240112_050200 +2024/01/12 15:46:43 - mmengine - INFO - Iter(train) [565000/640000] base_lr: 8.6339e-06 lr: 2.6031e-06 eta: 1 day, 6:57:27 time: 1.4747 data_time: 0.0280 memory: 25722 grad_norm: 3.6238 loss: 1.0783 detection_loss_cls: 0.0243 detection_loss_reg: 0.3047 caption_loss_cls: 1.9420 grounding_loss_reg: 2.0360 semantic_segmentation_loss_cls: 0.0066 instance_segmentation_loss_cls: 0.0237 instance_segmentation_loss_reg: 0.3013 instance_segmentation_loss_poly: 0.7992 +2024/01/12 15:59:28 - mmengine - INFO - Iter(train) [565500/640000] base_lr: 8.5467e-06 lr: 2.5952e-06 eta: 1 day, 6:46:07 time: 1.4792 data_time: 0.0281 memory: 25722 grad_norm: 3.5933 loss: 1.0747 detection_loss_cls: 0.0243 detection_loss_reg: 0.3035 caption_loss_cls: 1.9392 grounding_loss_reg: 2.0340 semantic_segmentation_loss_cls: 0.0066 instance_segmentation_loss_cls: 0.0238 instance_segmentation_loss_reg: 0.3017 instance_segmentation_loss_poly: 0.7995 +2024/01/12 16:12:10 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240112_050200 +2024/01/12 16:12:10 - mmengine - INFO - Iter(train) [566000/640000] base_lr: 8.4601e-06 lr: 2.5873e-06 eta: 1 day, 6:34:33 time: 1.4756 data_time: 0.0281 memory: 25722 grad_norm: 3.6287 loss: 1.0808 detection_loss_cls: 0.0243 detection_loss_reg: 0.3041 caption_loss_cls: 1.9369 grounding_loss_reg: 2.0345 semantic_segmentation_loss_cls: 0.0066 instance_segmentation_loss_cls: 0.0238 instance_segmentation_loss_reg: 0.3016 instance_segmentation_loss_poly: 0.7997 +2024/01/12 16:12:10 - mmengine - INFO - Saving checkpoint at 566000 iterations +2024/01/12 16:25:07 - mmengine - INFO - Iter(train) [566500/640000] base_lr: 8.3740e-06 lr: 2.5795e-06 eta: 1 day, 6:23:41 time: 1.4797 data_time: 0.0279 memory: 25722 grad_norm: 3.5900 loss: 1.0847 detection_loss_cls: 0.0243 detection_loss_reg: 0.3044 caption_loss_cls: 1.9385 grounding_loss_reg: 2.0349 semantic_segmentation_loss_cls: 0.0066 instance_segmentation_loss_cls: 0.0237 instance_segmentation_loss_reg: 0.3014 instance_segmentation_loss_poly: 0.7984 +2024/01/12 16:37:57 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240112_050200 +2024/01/12 16:37:57 - mmengine - INFO - Iter(train) [567000/640000] base_lr: 8.2885e-06 lr: 2.5717e-06 eta: 1 day, 6:12:23 time: 1.4934 data_time: 0.0282 memory: 25722 grad_norm: 3.5735 loss: 1.0795 detection_loss_cls: 0.0244 detection_loss_reg: 0.3053 caption_loss_cls: 1.9387 grounding_loss_reg: 2.0338 semantic_segmentation_loss_cls: 0.0066 instance_segmentation_loss_cls: 0.0238 instance_segmentation_loss_reg: 0.3023 instance_segmentation_loss_poly: 0.8004 +2024/01/12 16:51:21 - mmengine - INFO - Iter(train) [567500/640000] base_lr: 8.2036e-06 lr: 2.5640e-06 eta: 1 day, 6:02:34 time: 1.5158 data_time: 0.0287 memory: 25722 grad_norm: 3.5051 loss: 1.0706 detection_loss_cls: 0.0243 detection_loss_reg: 0.3056 caption_loss_cls: 1.9347 grounding_loss_reg: 2.0338 semantic_segmentation_loss_cls: 0.0065 instance_segmentation_loss_cls: 0.0237 instance_segmentation_loss_reg: 0.3024 instance_segmentation_loss_poly: 0.8001 +2024/01/12 17:03:18 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240112_050200 +2024/01/12 17:03:18 - mmengine - INFO - Iter(train) [568000/640000] base_lr: 8.1192e-06 lr: 2.5563e-06 eta: 1 day, 5:48:52 time: 1.5226 data_time: 0.0291 memory: 25722 grad_norm: 3.4888 loss: 1.0745 detection_loss_cls: 0.0243 detection_loss_reg: 0.3062 caption_loss_cls: 1.9358 grounding_loss_reg: 2.0347 semantic_segmentation_loss_cls: 0.0065 instance_segmentation_loss_cls: 0.0238 instance_segmentation_loss_reg: 0.3030 instance_segmentation_loss_poly: 0.8012 +2024/01/12 17:03:18 - mmengine - INFO - Saving checkpoint at 568000 iterations +2024/01/12 17:15:41 - mmengine - INFO - Iter(train) [568500/640000] base_lr: 8.0354e-06 lr: 2.5487e-06 eta: 1 day, 5:36:21 time: 1.5231 data_time: 0.0291 memory: 25722 grad_norm: 3.4745 loss: 1.0761 detection_loss_cls: 0.0244 detection_loss_reg: 0.3065 caption_loss_cls: 1.9383 grounding_loss_reg: 2.0372 semantic_segmentation_loss_cls: 0.0065 instance_segmentation_loss_cls: 0.0240 instance_segmentation_loss_reg: 0.3046 instance_segmentation_loss_poly: 0.8041 +2024/01/12 17:28:11 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240112_050200 +2024/01/12 17:28:11 - mmengine - INFO - Iter(train) [569000/640000] base_lr: 7.9521e-06 lr: 2.5411e-06 eta: 1 day, 5:24:06 time: 1.5209 data_time: 0.0290 memory: 25722 grad_norm: 3.5271 loss: 1.0786 detection_loss_cls: 0.0245 detection_loss_reg: 0.3068 caption_loss_cls: 1.9394 grounding_loss_reg: 2.0360 semantic_segmentation_loss_cls: 0.0066 instance_segmentation_loss_cls: 0.0240 instance_segmentation_loss_reg: 0.3047 instance_segmentation_loss_poly: 0.8041 +2024/01/12 17:40:15 - mmengine - INFO - Iter(train) [569500/640000] base_lr: 7.8694e-06 lr: 2.5336e-06 eta: 1 day, 5:10:48 time: 1.5107 data_time: 0.0288 memory: 25722 grad_norm: 3.5943 loss: 1.0909 detection_loss_cls: 0.0245 detection_loss_reg: 0.3073 caption_loss_cls: 1.9378 grounding_loss_reg: 2.0360 semantic_segmentation_loss_cls: 0.0066 instance_segmentation_loss_cls: 0.0240 instance_segmentation_loss_reg: 0.3046 instance_segmentation_loss_poly: 0.8041 +2024/01/12 17:52:14 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240112_050200 +2024/01/12 17:52:14 - mmengine - INFO - Iter(train) [570000/640000] base_lr: 7.7873e-06 lr: 2.5261e-06 eta: 1 day, 4:57:21 time: 1.5001 data_time: 0.0287 memory: 25722 grad_norm: 3.6135 loss: 1.0966 detection_loss_cls: 0.0245 detection_loss_reg: 0.3068 caption_loss_cls: 1.9372 grounding_loss_reg: 2.0346 semantic_segmentation_loss_cls: 0.0066 instance_segmentation_loss_cls: 0.0240 instance_segmentation_loss_reg: 0.3050 instance_segmentation_loss_poly: 0.8053 +2024/01/12 17:52:14 - mmengine - INFO - Saving checkpoint at 570000 iterations +2024/01/12 18:05:16 - mmengine - INFO - Iter(train) [570500/640000] base_lr: 7.7057e-06 lr: 2.5187e-06 eta: 1 day, 4:46:20 time: 1.5012 data_time: 0.0287 memory: 25722 grad_norm: 3.6274 loss: 1.0913 detection_loss_cls: 0.0244 detection_loss_reg: 0.3069 caption_loss_cls: 1.9362 grounding_loss_reg: 2.0342 semantic_segmentation_loss_cls: 0.0066 instance_segmentation_loss_cls: 0.0240 instance_segmentation_loss_reg: 0.3043 instance_segmentation_loss_poly: 0.8043 +2024/01/12 18:16:56 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240112_050200 +2024/01/12 18:16:56 - mmengine - INFO - Iter(train) [571000/640000] base_lr: 7.6247e-06 lr: 2.5113e-06 eta: 1 day, 4:32:14 time: 1.4839 data_time: 0.0285 memory: 25722 grad_norm: 3.6936 loss: 1.1042 detection_loss_cls: 0.0244 detection_loss_reg: 0.3063 caption_loss_cls: 1.9369 grounding_loss_reg: 2.0355 semantic_segmentation_loss_cls: 0.0066 instance_segmentation_loss_cls: 0.0240 instance_segmentation_loss_reg: 0.3042 instance_segmentation_loss_poly: 0.8044 +2024/01/12 18:26:55 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240112_050200 +2024/01/12 18:29:01 - mmengine - INFO - Iter(train) [571500/640000] base_lr: 7.5443e-06 lr: 2.5040e-06 eta: 1 day, 4:19:04 time: 1.4638 data_time: 0.0280 memory: 25722 grad_norm: 3.7278 loss: 1.1192 detection_loss_cls: 0.0243 detection_loss_reg: 0.3058 caption_loss_cls: 1.9438 grounding_loss_reg: 2.0374 semantic_segmentation_loss_cls: 0.0066 instance_segmentation_loss_cls: 0.0239 instance_segmentation_loss_reg: 0.3039 instance_segmentation_loss_poly: 0.8034 +2024/01/12 18:40:42 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240112_050200 +2024/01/12 18:40:42 - mmengine - INFO - Iter(train) [572000/640000] base_lr: 7.4644e-06 lr: 2.4968e-06 eta: 1 day, 4:05:08 time: 1.4600 data_time: 0.0279 memory: 25722 grad_norm: 3.7459 loss: 1.1137 detection_loss_cls: 0.0242 detection_loss_reg: 0.3047 caption_loss_cls: 1.9443 grounding_loss_reg: 2.0361 semantic_segmentation_loss_cls: 0.0066 instance_segmentation_loss_cls: 0.0239 instance_segmentation_loss_reg: 0.3033 instance_segmentation_loss_poly: 0.8026 +2024/01/12 18:40:42 - mmengine - INFO - Saving checkpoint at 572000 iterations +2024/01/12 18:52:34 - mmengine - INFO - Iter(train) [572500/640000] base_lr: 7.3850e-06 lr: 2.4895e-06 eta: 1 day, 3:51:38 time: 1.4521 data_time: 0.0275 memory: 25722 grad_norm: 3.7698 loss: 1.1041 detection_loss_cls: 0.0242 detection_loss_reg: 0.3045 caption_loss_cls: 1.9437 grounding_loss_reg: 2.0318 semantic_segmentation_loss_cls: 0.0066 instance_segmentation_loss_cls: 0.0239 instance_segmentation_loss_reg: 0.3030 instance_segmentation_loss_poly: 0.8018 +2024/01/12 19:04:30 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240112_050200 +2024/01/12 19:04:30 - mmengine - INFO - Iter(train) [573000/640000] base_lr: 7.3063e-06 lr: 2.4824e-06 eta: 1 day, 3:38:19 time: 1.4436 data_time: 0.0273 memory: 25722 grad_norm: 3.7571 loss: 1.1063 detection_loss_cls: 0.0242 detection_loss_reg: 0.3046 caption_loss_cls: 1.9428 grounding_loss_reg: 2.0313 semantic_segmentation_loss_cls: 0.0066 instance_segmentation_loss_cls: 0.0238 instance_segmentation_loss_reg: 0.3024 instance_segmentation_loss_poly: 0.8006 +2024/01/12 19:16:30 - mmengine - INFO - Iter(train) [573500/640000] base_lr: 7.2281e-06 lr: 2.4753e-06 eta: 1 day, 3:25:10 time: 1.4425 data_time: 0.0273 memory: 25722 grad_norm: 3.7442 loss: 1.1016 detection_loss_cls: 0.0242 detection_loss_reg: 0.3045 caption_loss_cls: 1.9433 grounding_loss_reg: 2.0305 semantic_segmentation_loss_cls: 0.0065 instance_segmentation_loss_cls: 0.0238 instance_segmentation_loss_reg: 0.3029 instance_segmentation_loss_poly: 0.8021 +2024/01/12 19:28:45 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240112_050200 +2024/01/12 19:28:45 - mmengine - INFO - Iter(train) [574000/640000] base_lr: 7.1504e-06 lr: 2.4682e-06 eta: 1 day, 3:12:34 time: 1.4466 data_time: 0.0272 memory: 25722 grad_norm: 3.7178 loss: 1.0913 detection_loss_cls: 0.0243 detection_loss_reg: 0.3061 caption_loss_cls: 1.9444 grounding_loss_reg: 2.0273 semantic_segmentation_loss_cls: 0.0065 instance_segmentation_loss_cls: 0.0237 instance_segmentation_loss_reg: 0.3027 instance_segmentation_loss_poly: 0.8017 +2024/01/12 19:28:45 - mmengine - INFO - Saving checkpoint at 574000 iterations +2024/01/12 19:41:13 - mmengine - INFO - Iter(train) [574500/640000] base_lr: 7.0734e-06 lr: 2.4612e-06 eta: 1 day, 3:00:22 time: 1.4381 data_time: 0.0271 memory: 25722 grad_norm: 3.6956 loss: 1.0942 detection_loss_cls: 0.0243 detection_loss_reg: 0.3058 caption_loss_cls: 1.9391 grounding_loss_reg: 2.0267 semantic_segmentation_loss_cls: 0.0065 instance_segmentation_loss_cls: 0.0238 instance_segmentation_loss_reg: 0.3039 instance_segmentation_loss_poly: 0.8035 +2024/01/12 19:53:43 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240112_050200 +2024/01/12 19:53:43 - mmengine - INFO - Iter(train) [575000/640000] base_lr: 6.9969e-06 lr: 2.4543e-06 eta: 1 day, 2:48:14 time: 1.4507 data_time: 0.0273 memory: 25722 grad_norm: 3.6834 loss: 1.0878 detection_loss_cls: 0.0244 detection_loss_reg: 0.3067 caption_loss_cls: 1.9395 grounding_loss_reg: 2.0226 semantic_segmentation_loss_cls: 0.0065 instance_segmentation_loss_cls: 0.0238 instance_segmentation_loss_reg: 0.3041 instance_segmentation_loss_poly: 0.8045 +2024/01/12 20:07:10 - mmengine - INFO - Iter(train) [575500/640000] base_lr: 6.9209e-06 lr: 2.4474e-06 eta: 1 day, 2:37:47 time: 1.4712 data_time: 0.0278 memory: 25722 grad_norm: 3.6230 loss: 1.0817 detection_loss_cls: 0.0245 detection_loss_reg: 0.3070 caption_loss_cls: 1.9417 grounding_loss_reg: 2.0218 semantic_segmentation_loss_cls: 0.0065 instance_segmentation_loss_cls: 0.0238 instance_segmentation_loss_reg: 0.3041 instance_segmentation_loss_poly: 0.8036 +2024/01/12 20:19:57 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240112_050200 +2024/01/12 20:19:57 - mmengine - INFO - Iter(train) [576000/640000] base_lr: 6.8456e-06 lr: 2.4405e-06 eta: 1 day, 2:26:07 time: 1.4879 data_time: 0.0280 memory: 25722 grad_norm: 3.5520 loss: 1.0739 detection_loss_cls: 0.0244 detection_loss_reg: 0.3064 caption_loss_cls: 1.9441 grounding_loss_reg: 2.0199 semantic_segmentation_loss_cls: 0.0065 instance_segmentation_loss_cls: 0.0238 instance_segmentation_loss_reg: 0.3038 instance_segmentation_loss_poly: 0.8031 +2024/01/12 20:19:57 - mmengine - INFO - Saving checkpoint at 576000 iterations +2024/01/12 20:32:01 - mmengine - INFO - Iter(train) [576500/640000] base_lr: 6.7708e-06 lr: 2.4337e-06 eta: 1 day, 2:13:09 time: 1.4908 data_time: 0.0282 memory: 25722 grad_norm: 3.5977 loss: 1.0815 detection_loss_cls: 0.0243 detection_loss_reg: 0.3051 caption_loss_cls: 1.9443 grounding_loss_reg: 2.0193 semantic_segmentation_loss_cls: 0.0065 instance_segmentation_loss_cls: 0.0239 instance_segmentation_loss_reg: 0.3043 instance_segmentation_loss_poly: 0.8045 +2024/01/12 20:43:59 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240112_050200 +2024/01/12 20:43:59 - mmengine - INFO - Iter(train) [577000/640000] base_lr: 6.6965e-06 lr: 2.4270e-06 eta: 1 day, 2:00:01 time: 1.4913 data_time: 0.0282 memory: 25722 grad_norm: 3.5980 loss: 1.0817 detection_loss_cls: 0.0243 detection_loss_reg: 0.3060 caption_loss_cls: 1.9428 grounding_loss_reg: 2.0180 semantic_segmentation_loss_cls: 0.0065 instance_segmentation_loss_cls: 0.0239 instance_segmentation_loss_reg: 0.3038 instance_segmentation_loss_poly: 0.8033 +2024/01/12 20:56:33 - mmengine - INFO - Iter(train) [577500/640000] base_lr: 6.6228e-06 lr: 2.4203e-06 eta: 1 day, 1:47:55 time: 1.4997 data_time: 0.0284 memory: 25722 grad_norm: 3.5789 loss: 1.0803 detection_loss_cls: 0.0244 detection_loss_reg: 0.3065 caption_loss_cls: 1.9410 grounding_loss_reg: 2.0207 semantic_segmentation_loss_cls: 0.0066 instance_segmentation_loss_cls: 0.0238 instance_segmentation_loss_reg: 0.3042 instance_segmentation_loss_poly: 0.8034 +2024/01/12 21:08:37 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240112_050200 +2024/01/12 21:08:37 - mmengine - INFO - Iter(train) [578000/640000] base_lr: 6.5497e-06 lr: 2.4136e-06 eta: 1 day, 1:35:01 time: 1.4970 data_time: 0.0285 memory: 25722 grad_norm: 3.6055 loss: 1.0942 detection_loss_cls: 0.0245 detection_loss_reg: 0.3075 caption_loss_cls: 1.9368 grounding_loss_reg: 2.0206 semantic_segmentation_loss_cls: 0.0066 instance_segmentation_loss_cls: 0.0239 instance_segmentation_loss_reg: 0.3051 instance_segmentation_loss_poly: 0.8055 +2024/01/12 21:08:37 - mmengine - INFO - Saving checkpoint at 578000 iterations +2024/01/12 21:21:46 - mmengine - INFO - Iter(train) [578500/640000] base_lr: 6.4772e-06 lr: 2.4070e-06 eta: 1 day, 1:23:51 time: 1.5072 data_time: 0.0288 memory: 25722 grad_norm: 3.6068 loss: 1.0903 detection_loss_cls: 0.0244 detection_loss_reg: 0.3070 caption_loss_cls: 1.9349 grounding_loss_reg: 2.0208 semantic_segmentation_loss_cls: 0.0066 instance_segmentation_loss_cls: 0.0239 instance_segmentation_loss_reg: 0.3047 instance_segmentation_loss_poly: 0.8042 +2024/01/12 21:33:58 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240112_050200 +2024/01/12 21:33:58 - mmengine - INFO - Iter(train) [579000/640000] base_lr: 6.4053e-06 lr: 2.4005e-06 eta: 1 day, 1:11:09 time: 1.5026 data_time: 0.0287 memory: 25722 grad_norm: 3.5982 loss: 1.0936 detection_loss_cls: 0.0245 detection_loss_reg: 0.3077 caption_loss_cls: 1.9350 grounding_loss_reg: 2.0210 semantic_segmentation_loss_cls: 0.0065 instance_segmentation_loss_cls: 0.0239 instance_segmentation_loss_reg: 0.3055 instance_segmentation_loss_poly: 0.8060 +2024/01/12 21:46:19 - mmengine - INFO - Iter(train) [579500/640000] base_lr: 6.3339e-06 lr: 2.3940e-06 eta: 1 day, 0:58:42 time: 1.4863 data_time: 0.0284 memory: 25722 grad_norm: 3.6329 loss: 1.0894 detection_loss_cls: 0.0244 detection_loss_reg: 0.3070 caption_loss_cls: 1.9388 grounding_loss_reg: 2.0215 semantic_segmentation_loss_cls: 0.0065 instance_segmentation_loss_cls: 0.0239 instance_segmentation_loss_reg: 0.3050 instance_segmentation_loss_poly: 0.8056 +2024/01/12 21:58:59 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240112_050200 +2024/01/12 21:58:59 - mmengine - INFO - Iter(train) [580000/640000] base_lr: 6.2630e-06 lr: 2.3875e-06 eta: 1 day, 0:46:44 time: 1.4844 data_time: 0.0283 memory: 25722 grad_norm: 3.6322 loss: 1.0898 detection_loss_cls: 0.0244 detection_loss_reg: 0.3076 caption_loss_cls: 1.9395 grounding_loss_reg: 2.0221 semantic_segmentation_loss_cls: 0.0065 instance_segmentation_loss_cls: 0.0239 instance_segmentation_loss_reg: 0.3055 instance_segmentation_loss_poly: 0.8073 +2024/01/12 21:58:59 - mmengine - INFO - Saving checkpoint at 580000 iterations +2024/01/12 22:11:33 - mmengine - INFO - Evaluating bbox... +2024/01/12 22:12:31 - mmengine - INFO - bbox_mAP_copypaste: 0.514 0.694 0.561 0.353 0.563 0.650 +2024/01/12 22:12:31 - mmengine - INFO - Evaluating segm... +2024/01/12 22:13:44 - mmengine - INFO - segm_mAP_copypaste: 0.348 0.613 0.345 0.197 0.395 0.533 +2024/01/12 22:19:56 - mmengine - INFO - per class results: +2024/01/12 22:19:56 - mmengine - INFO - ++---------------------+-------+-------+ +| Class | IoU | Acc | ++---------------------+-------+-------+ +| wall | 78.81 | 89.11 | +| building | 83.31 | 91.63 | +| sky | 93.49 | 97.77 | +| floor | 83.01 | 90.84 | +| tree | 74.04 | 86.74 | +| ceiling | 85.03 | 94.3 | +| road | 83.79 | 90.28 | +| bed | 90.48 | 95.89 | +| windowpane | 64.24 | 79.77 | +| grass | 65.75 | 82.92 | +| cabinet | 64.19 | 77.5 | +| sidewalk | 66.86 | 80.98 | +| person | 81.52 | 91.97 | +| earth | 41.14 | 53.53 | +| door | 54.12 | 68.24 | +| table | 66.67 | 81.62 | +| mountain | 62.61 | 74.54 | +| plant | 51.96 | 63.95 | +| curtain | 75.96 | 87.06 | +| chair | 61.29 | 75.2 | +| car | 84.82 | 92.49 | +| water | 56.74 | 72.69 | +| painting | 71.55 | 87.5 | +| sofa | 71.22 | 84.09 | +| shelf | 46.54 | 65.43 | +| house | 48.0 | 67.77 | +| sea | 55.08 | 70.88 | +| mirror | 69.44 | 76.16 | +| rug | 68.92 | 78.05 | +| field | 29.47 | 46.74 | +| armchair | 48.33 | 66.03 | +| seat | 61.72 | 80.44 | +| fence | 45.9 | 66.33 | +| desk | 48.77 | 69.96 | +| rock | 47.18 | 71.68 | +| wardrobe | 51.77 | 63.32 | +| lamp | 63.73 | 76.68 | +| bathtub | 80.79 | 84.26 | +| railing | 37.54 | 53.22 | +| cushion | 62.47 | 75.09 | +| base | 23.49 | 31.46 | +| box | 28.16 | 37.36 | +| column | 53.16 | 66.29 | +| signboard | 38.42 | 57.26 | +| chest of drawers | 40.04 | 59.64 | +| counter | 25.01 | 34.33 | +| sand | 47.73 | 64.8 | +| sink | 76.16 | 83.72 | +| skyscraper | 64.31 | 81.42 | +| fireplace | 79.41 | 90.39 | +| refrigerator | 73.99 | 81.37 | +| grandstand | 41.98 | 77.63 | +| path | 26.14 | 37.98 | +| stairs | 31.86 | 38.19 | +| runway | 68.14 | 86.65 | +| case | 55.15 | 71.29 | +| pool table | 91.47 | 96.64 | +| pillow | 60.66 | 72.59 | +| screen door | 80.28 | 83.6 | +| stairway | 34.3 | 46.35 | +| river | 15.4 | 33.61 | +| bridge | 62.37 | 82.25 | +| bookcase | 38.99 | 58.19 | +| blind | 41.12 | 46.13 | +| coffee table | 68.91 | 83.39 | +| toilet | 87.66 | 91.96 | +| flower | 41.07 | 55.83 | +| book | 52.59 | 73.63 | +| hill | 12.46 | 20.32 | +| bench | 58.65 | 67.26 | +| countertop | 62.05 | 80.23 | +| stove | 76.72 | 85.8 | +| palm | 46.17 | 64.05 | +| kitchen island | 48.6 | 84.07 | +| computer | 74.4 | 85.56 | +| swivel chair | 39.45 | 51.89 | +| boat | 76.42 | 85.23 | +| bar | 31.97 | 42.75 | +| arcade machine | 44.48 | 48.31 | +| hovel | 21.68 | 28.49 | +| bus | 92.02 | 95.39 | +| towel | 64.42 | 80.43 | +| light | 53.05 | 63.89 | +| truck | 42.14 | 58.22 | +| tower | 22.84 | 38.2 | +| chandelier | 64.76 | 77.64 | +| awning | 37.4 | 45.31 | +| streetlight | 33.19 | 44.79 | +| booth | 33.82 | 39.19 | +| television receiver | 70.95 | 86.14 | +| airplane | 61.51 | 76.01 | +| dirt track | 14.27 | 21.85 | +| apparel | 34.7 | 46.9 | +| pole | 27.37 | 39.47 | +| land | 2.3 | 4.4 | +| bannister | 16.57 | 21.92 | +| escalator | 24.87 | 25.81 | +| ottoman | 49.34 | 67.57 | +| bottle | 23.03 | 29.57 | +| buffet | 39.19 | 46.72 | +| poster | 34.34 | 41.4 | +| stage | 11.0 | 18.04 | +| van | 43.91 | 58.66 | +| ship | 23.34 | 25.78 | +| fountain | 21.1 | 21.86 | +| conveyer belt | 73.69 | 91.3 | +| canopy | 32.73 | 36.54 | +| washer | 72.92 | 73.79 | +| plaything | 26.31 | 29.93 | +| swimming pool | 69.84 | 72.85 | +| stool | 50.13 | 65.17 | +| barrel | 14.49 | 61.95 | +| basket | 29.85 | 45.76 | +| waterfall | 50.69 | 69.89 | +| tent | 68.85 | 96.81 | +| bag | 22.97 | 30.28 | +| minibike | 72.94 | 84.13 | +| cradle | 73.51 | 95.67 | +| oven | 54.83 | 69.6 | +| ball | 56.71 | 75.59 | +| food | 54.27 | 60.31 | +| step | 12.3 | 17.25 | +| tank | 35.7 | 45.19 | +| trade name | 26.52 | 31.81 | +| microwave | 86.24 | 93.92 | +| pot | 51.05 | 59.61 | +| animal | 56.33 | 59.32 | +| bicycle | 57.09 | 74.61 | +| lake | 56.01 | 63.72 | +| dishwasher | 62.53 | 73.8 | +| screen | 52.43 | 71.66 | +| blanket | 17.63 | 19.81 | +| sculpture | 57.69 | 68.79 | +| hood | 58.25 | 69.74 | +| sconce | 44.05 | 52.39 | +| vase | 46.92 | 62.25 | +| traffic light | 41.27 | 61.84 | +| tray | 8.46 | 16.61 | +| ashcan | 46.04 | 58.67 | +| fan | 59.6 | 71.15 | +| pier | 41.35 | 67.89 | +| crt screen | 9.19 | 23.45 | +| plate | 56.81 | 75.07 | +| monitor | 27.19 | 34.42 | +| bulletin board | 41.9 | 59.22 | +| shower | 3.12 | 4.21 | +| radiator | 57.14 | 64.83 | +| glass | 20.46 | 22.3 | +| clock | 27.46 | 34.03 | +| flag | 34.06 | 38.92 | ++---------------------+-------+-------+ +2024/01/12 22:20:13 - mmengine - INFO - Iter(val) [209/209] coco/bbox_mAP: 0.5140 coco/bbox_mAP_50: 0.6940 coco/bbox_mAP_75: 0.5610 coco/bbox_mAP_s: 0.3530 coco/bbox_mAP_m: 0.5630 coco/bbox_mAP_l: 0.6500 coco/segm_mAP: 0.3480 coco/segm_mAP_50: 0.6130 coco/segm_mAP_75: 0.3450 coco/segm_mAP_s: 0.1970 coco/segm_mAP_m: 0.3950 coco/segm_mAP_l: 0.5330 Bleu_1: 0.7657 Bleu_2: 0.6036 Bleu_3: 0.4625 Bleu_4: 0.3512 METEOR: 0.2766 ROUGE_L: 0.5646 CIDEr: 1.1417 SPICE: 0.2057 aAcc: 84.0000 mIoU: 50.5300 mAcc: 62.6800 visual-grounding/miou: 0.8289 visual-grounding/acc: 0.8877 data_time: 0.0041 time: 1.3532 +2024/01/12 22:32:54 - mmengine - INFO - Iter(train) [580500/640000] base_lr: 6.1928e-06 lr: 2.3812e-06 eta: 1 day, 0:34:48 time: 1.4942 data_time: 0.0242 memory: 25722 grad_norm: 3.5449 loss: 1.0858 detection_loss_cls: 0.0245 detection_loss_reg: 0.3091 caption_loss_cls: 1.9438 grounding_loss_reg: 2.0230 semantic_segmentation_loss_cls: 0.0065 instance_segmentation_loss_cls: 0.0240 instance_segmentation_loss_reg: 0.3060 instance_segmentation_loss_poly: 0.8087 +2024/01/12 22:45:34 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240112_050200 +2024/01/12 22:45:34 - mmengine - INFO - Iter(train) [581000/640000] base_lr: 6.1231e-06 lr: 2.3748e-06 eta: 1 day, 0:22:47 time: 1.5047 data_time: 0.0244 memory: 25722 grad_norm: 3.4853 loss: 1.0789 detection_loss_cls: 0.0245 detection_loss_reg: 0.3099 caption_loss_cls: 1.9433 grounding_loss_reg: 2.0223 semantic_segmentation_loss_cls: 0.0065 instance_segmentation_loss_cls: 0.0240 instance_segmentation_loss_reg: 0.3070 instance_segmentation_loss_poly: 0.8112 +2024/01/12 22:57:50 - mmengine - INFO - Iter(train) [581500/640000] base_lr: 6.0540e-06 lr: 2.3685e-06 eta: 1 day, 0:10:12 time: 1.5005 data_time: 0.0244 memory: 25722 grad_norm: 3.5128 loss: 1.0892 detection_loss_cls: 0.0246 detection_loss_reg: 0.3102 caption_loss_cls: 1.9422 grounding_loss_reg: 2.0200 semantic_segmentation_loss_cls: 0.0066 instance_segmentation_loss_cls: 0.0241 instance_segmentation_loss_reg: 0.3086 instance_segmentation_loss_poly: 0.8148 +2024/01/12 23:10:11 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240112_050200 +2024/01/12 23:10:11 - mmengine - INFO - Iter(train) [582000/640000] base_lr: 5.9855e-06 lr: 2.3623e-06 eta: 23:57:44 time: 1.5045 data_time: 0.0243 memory: 25722 grad_norm: 3.4882 loss: 1.0779 detection_loss_cls: 0.0247 detection_loss_reg: 0.3109 caption_loss_cls: 1.9457 grounding_loss_reg: 2.0214 semantic_segmentation_loss_cls: 0.0066 instance_segmentation_loss_cls: 0.0242 instance_segmentation_loss_reg: 0.3085 instance_segmentation_loss_poly: 0.8158 +2024/01/12 23:10:11 - mmengine - INFO - Saving checkpoint at 582000 iterations +2024/01/12 23:23:09 - mmengine - INFO - Iter(train) [582500/640000] base_lr: 5.9175e-06 lr: 2.3561e-06 eta: 23:46:07 time: 1.5019 data_time: 0.0242 memory: 25722 grad_norm: 3.5196 loss: 1.0806 detection_loss_cls: 0.0248 detection_loss_reg: 0.3120 caption_loss_cls: 1.9438 grounding_loss_reg: 2.0211 semantic_segmentation_loss_cls: 0.0066 instance_segmentation_loss_cls: 0.0242 instance_segmentation_loss_reg: 0.3089 instance_segmentation_loss_poly: 0.8161 +2024/01/12 23:35:24 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240112_050200 +2024/01/12 23:35:24 - mmengine - INFO - Iter(train) [583000/640000] base_lr: 5.8501e-06 lr: 2.3500e-06 eta: 23:33:30 time: 1.5027 data_time: 0.0244 memory: 25722 grad_norm: 3.5208 loss: 1.0873 detection_loss_cls: 0.0248 detection_loss_reg: 0.3126 caption_loss_cls: 1.9447 grounding_loss_reg: 2.0225 semantic_segmentation_loss_cls: 0.0066 instance_segmentation_loss_cls: 0.0243 instance_segmentation_loss_reg: 0.3106 instance_segmentation_loss_poly: 0.8193 +2024/01/12 23:48:01 - mmengine - INFO - Iter(train) [583500/640000] base_lr: 5.7833e-06 lr: 2.3439e-06 eta: 23:21:22 time: 1.5067 data_time: 0.0245 memory: 25722 grad_norm: 3.5286 loss: 1.0930 detection_loss_cls: 0.0249 detection_loss_reg: 0.3131 caption_loss_cls: 1.9456 grounding_loss_reg: 2.0229 semantic_segmentation_loss_cls: 0.0066 instance_segmentation_loss_cls: 0.0243 instance_segmentation_loss_reg: 0.3107 instance_segmentation_loss_poly: 0.8195 +2024/01/12 23:59:51 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240112_050200 +2024/01/12 23:59:51 - mmengine - INFO - Iter(train) [584000/640000] base_lr: 5.7171e-06 lr: 2.3379e-06 eta: 23:08:13 time: 1.4939 data_time: 0.0243 memory: 25722 grad_norm: 3.6342 loss: 1.1066 detection_loss_cls: 0.0249 detection_loss_reg: 0.3132 caption_loss_cls: 1.9457 grounding_loss_reg: 2.0227 semantic_segmentation_loss_cls: 0.0066 instance_segmentation_loss_cls: 0.0244 instance_segmentation_loss_reg: 0.3103 instance_segmentation_loss_poly: 0.8189 +2024/01/12 23:59:51 - mmengine - INFO - Saving checkpoint at 584000 iterations +2024/01/13 00:13:33 - mmengine - INFO - Iter(train) [584500/640000] base_lr: 5.6514e-06 lr: 2.3319e-06 eta: 22:57:26 time: 1.5086 data_time: 0.0288 memory: 25722 grad_norm: 3.5882 loss: 1.0977 detection_loss_cls: 0.0248 detection_loss_reg: 0.3129 caption_loss_cls: 1.9438 grounding_loss_reg: 2.0224 semantic_segmentation_loss_cls: 0.0065 instance_segmentation_loss_cls: 0.0243 instance_segmentation_loss_reg: 0.3101 instance_segmentation_loss_poly: 0.8194 +2024/01/13 00:26:33 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240112_050200 +2024/01/13 00:26:33 - mmengine - INFO - Iter(train) [585000/640000] base_lr: 5.5863e-06 lr: 2.3260e-06 eta: 22:45:45 time: 1.5137 data_time: 0.0289 memory: 25722 grad_norm: 3.6099 loss: 1.0982 detection_loss_cls: 0.0248 detection_loss_reg: 0.3119 caption_loss_cls: 1.9449 grounding_loss_reg: 2.0226 semantic_segmentation_loss_cls: 0.0066 instance_segmentation_loss_cls: 0.0243 instance_segmentation_loss_reg: 0.3086 instance_segmentation_loss_poly: 0.8170 +2024/01/13 00:38:45 - mmengine - INFO - Iter(train) [585500/640000] base_lr: 5.5218e-06 lr: 2.3202e-06 eta: 22:33:03 time: 1.5126 data_time: 0.0287 memory: 25722 grad_norm: 3.6161 loss: 1.0890 detection_loss_cls: 0.0248 detection_loss_reg: 0.3119 caption_loss_cls: 1.9448 grounding_loss_reg: 2.0235 semantic_segmentation_loss_cls: 0.0066 instance_segmentation_loss_cls: 0.0242 instance_segmentation_loss_reg: 0.3088 instance_segmentation_loss_poly: 0.8176 +2024/01/13 00:51:13 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240112_050200 +2024/01/13 00:51:13 - mmengine - INFO - Iter(train) [586000/640000] base_lr: 5.4578e-06 lr: 2.3143e-06 eta: 22:20:42 time: 1.5144 data_time: 0.0287 memory: 25722 grad_norm: 3.6146 loss: 1.0876 detection_loss_cls: 0.0248 detection_loss_reg: 0.3123 caption_loss_cls: 1.9436 grounding_loss_reg: 2.0233 semantic_segmentation_loss_cls: 0.0066 instance_segmentation_loss_cls: 0.0243 instance_segmentation_loss_reg: 0.3087 instance_segmentation_loss_poly: 0.8177 +2024/01/13 00:51:13 - mmengine - INFO - Saving checkpoint at 586000 iterations +2024/01/13 01:03:32 - mmengine - INFO - Iter(train) [586500/640000] base_lr: 5.3945e-06 lr: 2.3086e-06 eta: 22:08:10 time: 1.5045 data_time: 0.0285 memory: 25722 grad_norm: 3.6505 loss: 1.0939 detection_loss_cls: 0.0249 detection_loss_reg: 0.3126 caption_loss_cls: 1.9418 grounding_loss_reg: 2.0245 semantic_segmentation_loss_cls: 0.0065 instance_segmentation_loss_cls: 0.0242 instance_segmentation_loss_reg: 0.3080 instance_segmentation_loss_poly: 0.8162 +2024/01/13 01:16:17 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240112_050200 +2024/01/13 01:16:17 - mmengine - INFO - Iter(train) [587000/640000] base_lr: 5.3317e-06 lr: 2.3029e-06 eta: 21:56:07 time: 1.5120 data_time: 0.0285 memory: 25722 grad_norm: 3.6241 loss: 1.0797 detection_loss_cls: 0.0248 detection_loss_reg: 0.3117 caption_loss_cls: 1.9436 grounding_loss_reg: 2.0224 semantic_segmentation_loss_cls: 0.0066 instance_segmentation_loss_cls: 0.0242 instance_segmentation_loss_reg: 0.3083 instance_segmentation_loss_poly: 0.8174 +2024/01/13 01:28:07 - mmengine - INFO - Iter(train) [587500/640000] base_lr: 5.2695e-06 lr: 2.2972e-06 eta: 21:43:04 time: 1.5004 data_time: 0.0282 memory: 25722 grad_norm: 3.6608 loss: 1.0807 detection_loss_cls: 0.0248 detection_loss_reg: 0.3109 caption_loss_cls: 1.9478 grounding_loss_reg: 2.0228 semantic_segmentation_loss_cls: 0.0066 instance_segmentation_loss_cls: 0.0242 instance_segmentation_loss_reg: 0.3079 instance_segmentation_loss_poly: 0.8168 +2024/01/13 01:40:11 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240112_050200 +2024/01/13 01:40:11 - mmengine - INFO - Iter(train) [588000/640000] base_lr: 5.2078e-06 lr: 2.2916e-06 eta: 21:30:16 time: 1.5040 data_time: 0.0283 memory: 25722 grad_norm: 3.6099 loss: 1.0716 detection_loss_cls: 0.0249 detection_loss_reg: 0.3113 caption_loss_cls: 1.9410 grounding_loss_reg: 2.0223 semantic_segmentation_loss_cls: 0.0066 instance_segmentation_loss_cls: 0.0242 instance_segmentation_loss_reg: 0.3073 instance_segmentation_loss_poly: 0.8158 +2024/01/13 01:40:11 - mmengine - INFO - Saving checkpoint at 588000 iterations +2024/01/13 01:52:49 - mmengine - INFO - Iter(train) [588500/640000] base_lr: 5.1467e-06 lr: 2.2861e-06 eta: 21:18:05 time: 1.4879 data_time: 0.0281 memory: 25722 grad_norm: 3.6551 loss: 1.0841 detection_loss_cls: 0.0248 detection_loss_reg: 0.3111 caption_loss_cls: 1.9427 grounding_loss_reg: 2.0206 semantic_segmentation_loss_cls: 0.0065 instance_segmentation_loss_cls: 0.0242 instance_segmentation_loss_reg: 0.3087 instance_segmentation_loss_poly: 0.8181 +2024/01/13 02:05:35 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240112_050200 +2024/01/13 02:05:35 - mmengine - INFO - Iter(train) [589000/640000] base_lr: 5.0863e-06 lr: 2.2806e-06 eta: 21:06:02 time: 1.4845 data_time: 0.0282 memory: 25722 grad_norm: 3.6691 loss: 1.0977 detection_loss_cls: 0.0249 detection_loss_reg: 0.3121 caption_loss_cls: 1.9444 grounding_loss_reg: 2.0242 semantic_segmentation_loss_cls: 0.0065 instance_segmentation_loss_cls: 0.0242 instance_segmentation_loss_reg: 0.3084 instance_segmentation_loss_poly: 0.8189 +2024/01/13 02:18:06 - mmengine - INFO - Iter(train) [589500/640000] base_lr: 5.0264e-06 lr: 2.2751e-06 eta: 20:53:43 time: 1.4891 data_time: 0.0283 memory: 25722 grad_norm: 3.6394 loss: 1.0944 detection_loss_cls: 0.0248 detection_loss_reg: 0.3118 caption_loss_cls: 1.9430 grounding_loss_reg: 2.0242 semantic_segmentation_loss_cls: 0.0065 instance_segmentation_loss_cls: 0.0241 instance_segmentation_loss_reg: 0.3082 instance_segmentation_loss_poly: 0.8180 +2024/01/13 02:30:25 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240112_050200 +2024/01/13 02:30:25 - mmengine - INFO - Iter(train) [590000/640000] base_lr: 4.9670e-06 lr: 2.2697e-06 eta: 20:41:13 time: 1.4870 data_time: 0.0283 memory: 25722 grad_norm: 3.6617 loss: 1.0961 detection_loss_cls: 0.0248 detection_loss_reg: 0.3122 caption_loss_cls: 1.9412 grounding_loss_reg: 2.0214 semantic_segmentation_loss_cls: 0.0065 instance_segmentation_loss_cls: 0.0241 instance_segmentation_loss_reg: 0.3086 instance_segmentation_loss_poly: 0.8185 +2024/01/13 02:30:25 - mmengine - INFO - Saving checkpoint at 590000 iterations +2024/01/13 02:43:01 - mmengine - INFO - Iter(train) [590500/640000] base_lr: 4.9083e-06 lr: 2.2644e-06 eta: 20:28:58 time: 1.4913 data_time: 0.0284 memory: 25722 grad_norm: 3.6119 loss: 1.0850 detection_loss_cls: 0.0249 detection_loss_reg: 0.3121 caption_loss_cls: 1.9424 grounding_loss_reg: 2.0223 semantic_segmentation_loss_cls: 0.0065 instance_segmentation_loss_cls: 0.0241 instance_segmentation_loss_reg: 0.3088 instance_segmentation_loss_poly: 0.8187 +2024/01/13 02:55:15 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240112_050200 +2024/01/13 02:55:15 - mmengine - INFO - Iter(train) [591000/640000] base_lr: 4.8501e-06 lr: 2.2591e-06 eta: 20:16:22 time: 1.4835 data_time: 0.0281 memory: 25722 grad_norm: 3.6381 loss: 1.0933 detection_loss_cls: 0.0249 detection_loss_reg: 0.3121 caption_loss_cls: 1.9446 grounding_loss_reg: 2.0209 semantic_segmentation_loss_cls: 0.0065 instance_segmentation_loss_cls: 0.0241 instance_segmentation_loss_reg: 0.3091 instance_segmentation_loss_poly: 0.8193 +2024/01/13 03:07:14 - mmengine - INFO - Iter(train) [591500/640000] base_lr: 4.7925e-06 lr: 2.2539e-06 eta: 20:03:33 time: 1.4855 data_time: 0.0282 memory: 25722 grad_norm: 3.6362 loss: 1.0875 detection_loss_cls: 0.0248 detection_loss_reg: 0.3125 caption_loss_cls: 1.9415 grounding_loss_reg: 2.0185 semantic_segmentation_loss_cls: 0.0065 instance_segmentation_loss_cls: 0.0240 instance_segmentation_loss_reg: 0.3086 instance_segmentation_loss_poly: 0.8177 +2024/01/13 03:19:29 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240112_050200 +2024/01/13 03:19:29 - mmengine - INFO - Iter(train) [592000/640000] base_lr: 4.7355e-06 lr: 2.2487e-06 eta: 19:50:59 time: 1.4882 data_time: 0.0280 memory: 25722 grad_norm: 3.6344 loss: 1.0842 detection_loss_cls: 0.0249 detection_loss_reg: 0.3126 caption_loss_cls: 1.9417 grounding_loss_reg: 2.0179 semantic_segmentation_loss_cls: 0.0065 instance_segmentation_loss_cls: 0.0239 instance_segmentation_loss_reg: 0.3080 instance_segmentation_loss_poly: 0.8161 +2024/01/13 03:19:29 - mmengine - INFO - Saving checkpoint at 592000 iterations +2024/01/13 03:32:21 - mmengine - INFO - Iter(train) [592500/640000] base_lr: 4.6791e-06 lr: 2.2436e-06 eta: 19:38:59 time: 1.4919 data_time: 0.0281 memory: 25722 grad_norm: 3.6388 loss: 1.0794 detection_loss_cls: 0.0249 detection_loss_reg: 0.3134 caption_loss_cls: 1.9425 grounding_loss_reg: 2.0185 semantic_segmentation_loss_cls: 0.0065 instance_segmentation_loss_cls: 0.0240 instance_segmentation_loss_reg: 0.3088 instance_segmentation_loss_poly: 0.8171 +2024/01/13 03:44:49 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240112_050200 +2024/01/13 03:44:49 - mmengine - INFO - Iter(train) [593000/640000] base_lr: 4.6232e-06 lr: 2.2385e-06 eta: 19:26:37 time: 1.4874 data_time: 0.0279 memory: 25722 grad_norm: 3.6626 loss: 1.0664 detection_loss_cls: 0.0249 detection_loss_reg: 0.3136 caption_loss_cls: 1.9349 grounding_loss_reg: 2.0207 semantic_segmentation_loss_cls: 0.0065 instance_segmentation_loss_cls: 0.0241 instance_segmentation_loss_reg: 0.3089 instance_segmentation_loss_poly: 0.8166 +2024/01/13 03:56:45 - mmengine - INFO - Iter(train) [593500/640000] base_lr: 4.5679e-06 lr: 2.2334e-06 eta: 19:13:47 time: 1.4788 data_time: 0.0277 memory: 25722 grad_norm: 3.6628 loss: 1.0648 detection_loss_cls: 0.0250 detection_loss_reg: 0.3147 caption_loss_cls: 1.9370 grounding_loss_reg: 2.0214 semantic_segmentation_loss_cls: 0.0065 instance_segmentation_loss_cls: 0.0242 instance_segmentation_loss_reg: 0.3101 instance_segmentation_loss_poly: 0.8191 +2024/01/13 04:09:14 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240112_050200 +2024/01/13 04:09:14 - mmengine - INFO - Iter(train) [594000/640000] base_lr: 4.5132e-06 lr: 2.2285e-06 eta: 19:01:26 time: 1.4812 data_time: 0.0278 memory: 25722 grad_norm: 3.6490 loss: 1.0649 detection_loss_cls: 0.0250 detection_loss_reg: 0.3142 caption_loss_cls: 1.9351 grounding_loss_reg: 2.0213 semantic_segmentation_loss_cls: 0.0065 instance_segmentation_loss_cls: 0.0242 instance_segmentation_loss_reg: 0.3102 instance_segmentation_loss_poly: 0.8194 +2024/01/13 04:09:14 - mmengine - INFO - Saving checkpoint at 594000 iterations +2024/01/13 04:21:33 - mmengine - INFO - Iter(train) [594500/640000] base_lr: 4.4591e-06 lr: 2.2236e-06 eta: 18:48:57 time: 1.4769 data_time: 0.0278 memory: 25722 grad_norm: 3.6784 loss: 1.0754 detection_loss_cls: 0.0250 detection_loss_reg: 0.3140 caption_loss_cls: 1.9358 grounding_loss_reg: 2.0221 semantic_segmentation_loss_cls: 0.0065 instance_segmentation_loss_cls: 0.0242 instance_segmentation_loss_reg: 0.3094 instance_segmentation_loss_poly: 0.8172 +2024/01/13 04:34:21 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240112_050200 +2024/01/13 04:34:21 - mmengine - INFO - Iter(train) [595000/640000] base_lr: 4.4056e-06 lr: 2.2187e-06 eta: 18:36:51 time: 1.4854 data_time: 0.0278 memory: 25722 grad_norm: 3.6762 loss: 1.0662 detection_loss_cls: 0.0249 detection_loss_reg: 0.3134 caption_loss_cls: 1.9358 grounding_loss_reg: 2.0212 semantic_segmentation_loss_cls: 0.0065 instance_segmentation_loss_cls: 0.0242 instance_segmentation_loss_reg: 0.3094 instance_segmentation_loss_poly: 0.8182 +2024/01/13 04:47:06 - mmengine - INFO - Iter(train) [595500/640000] base_lr: 4.3526e-06 lr: 2.2139e-06 eta: 18:24:43 time: 1.4969 data_time: 0.0281 memory: 25722 grad_norm: 3.6502 loss: 1.0636 detection_loss_cls: 0.0248 detection_loss_reg: 0.3128 caption_loss_cls: 1.9330 grounding_loss_reg: 2.0206 semantic_segmentation_loss_cls: 0.0065 instance_segmentation_loss_cls: 0.0240 instance_segmentation_loss_reg: 0.3074 instance_segmentation_loss_poly: 0.8142 +2024/01/13 04:59:41 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240112_050200 +2024/01/13 04:59:41 - mmengine - INFO - Iter(train) [596000/640000] base_lr: 4.3003e-06 lr: 2.2091e-06 eta: 18:12:25 time: 1.5019 data_time: 0.0282 memory: 25722 grad_norm: 3.6251 loss: 1.0611 detection_loss_cls: 0.0247 detection_loss_reg: 0.3121 caption_loss_cls: 1.9372 grounding_loss_reg: 2.0228 semantic_segmentation_loss_cls: 0.0065 instance_segmentation_loss_cls: 0.0240 instance_segmentation_loss_reg: 0.3071 instance_segmentation_loss_poly: 0.8130 +2024/01/13 04:59:41 - mmengine - INFO - Saving checkpoint at 596000 iterations +2024/01/13 05:19:08 - mmengine - INFO - Iter(train) [596500/640000] base_lr: 4.2485e-06 lr: 2.2044e-06 eta: 17:41:29 time: 1.4920 data_time: 0.0229 memory: 25717 grad_norm: 3.6424 loss: 1.0604 detection_loss_cls: 0.0247 detection_loss_reg: 0.3125 caption_loss_cls: 1.9362 grounding_loss_reg: 2.0245 semantic_segmentation_loss_cls: 0.0065 instance_segmentation_loss_cls: 0.0240 instance_segmentation_loss_reg: 0.3077 instance_segmentation_loss_poly: 0.8140 +2024/01/13 05:31:34 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240113_050346 +2024/01/13 05:31:34 - mmengine - INFO - Iter(train) [597000/640000] base_lr: 4.1973e-06 lr: 2.1998e-06 eta: 17:39:14 time: 1.4916 data_time: 0.0226 memory: 25717 grad_norm: 3.6458 loss: 1.0700 detection_loss_cls: 0.0248 detection_loss_reg: 0.3128 caption_loss_cls: 1.9378 grounding_loss_reg: 2.0223 semantic_segmentation_loss_cls: 0.0065 instance_segmentation_loss_cls: 0.0241 instance_segmentation_loss_reg: 0.3081 instance_segmentation_loss_poly: 0.8143 +2024/01/13 05:43:46 - mmengine - INFO - Iter(train) [597500/640000] base_lr: 4.1467e-06 lr: 2.1952e-06 eta: 17:23:11 time: 1.4955 data_time: 0.0223 memory: 25717 grad_norm: 3.6429 loss: 1.0635 detection_loss_cls: 0.0247 detection_loss_reg: 0.3122 caption_loss_cls: 1.9353 grounding_loss_reg: 2.0215 semantic_segmentation_loss_cls: 0.0065 instance_segmentation_loss_cls: 0.0240 instance_segmentation_loss_reg: 0.3078 instance_segmentation_loss_poly: 0.8137 +2024/01/13 05:55:54 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240113_050346 +2024/01/13 05:55:54 - mmengine - INFO - Iter(train) [598000/640000] base_lr: 4.0966e-06 lr: 2.1906e-06 eta: 17:07:49 time: 1.4902 data_time: 0.0218 memory: 25717 grad_norm: 3.6690 loss: 1.0637 detection_loss_cls: 0.0247 detection_loss_reg: 0.3119 caption_loss_cls: 1.9352 grounding_loss_reg: 2.0181 semantic_segmentation_loss_cls: 0.0065 instance_segmentation_loss_cls: 0.0240 instance_segmentation_loss_reg: 0.3071 instance_segmentation_loss_poly: 0.8129 +2024/01/13 05:55:54 - mmengine - INFO - Saving checkpoint at 598000 iterations +2024/01/13 06:08:32 - mmengine - INFO - Iter(train) [598500/640000] base_lr: 4.0472e-06 lr: 2.1861e-06 eta: 17:02:01 time: 1.4949 data_time: 0.0213 memory: 25717 grad_norm: 3.6459 loss: 1.0621 detection_loss_cls: 0.0246 detection_loss_reg: 0.3104 caption_loss_cls: 1.9392 grounding_loss_reg: 2.0169 semantic_segmentation_loss_cls: 0.0065 instance_segmentation_loss_cls: 0.0240 instance_segmentation_loss_reg: 0.3063 instance_segmentation_loss_poly: 0.8114 +2024/01/13 06:20:40 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240113_050346 +2024/01/13 06:20:40 - mmengine - INFO - Iter(train) [599000/640000] base_lr: 3.9983e-06 lr: 2.1817e-06 eta: 16:47:08 time: 1.4850 data_time: 0.0210 memory: 25717 grad_norm: 3.6576 loss: 1.0715 detection_loss_cls: 0.0246 detection_loss_reg: 0.3109 caption_loss_cls: 1.9395 grounding_loss_reg: 2.0164 semantic_segmentation_loss_cls: 0.0065 instance_segmentation_loss_cls: 0.0240 instance_segmentation_loss_reg: 0.3068 instance_segmentation_loss_poly: 0.8119 +2024/01/13 06:32:38 - mmengine - INFO - Iter(train) [599500/640000] base_lr: 3.9500e-06 lr: 2.1773e-06 eta: 16:31:12 time: 1.4734 data_time: 0.0205 memory: 25717 grad_norm: 3.6889 loss: 1.0762 detection_loss_cls: 0.0246 detection_loss_reg: 0.3112 caption_loss_cls: 1.9357 grounding_loss_reg: 2.0172 semantic_segmentation_loss_cls: 0.0065 instance_segmentation_loss_cls: 0.0240 instance_segmentation_loss_reg: 0.3063 instance_segmentation_loss_poly: 0.8099 +2024/01/13 06:45:14 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240113_050346 +2024/01/13 06:45:14 - mmengine - INFO - Iter(train) [600000/640000] base_lr: 3.9024e-06 lr: 2.1729e-06 eta: 16:22:27 time: 1.4737 data_time: 0.0202 memory: 25717 grad_norm: 3.6940 loss: 1.0746 detection_loss_cls: 0.0246 detection_loss_reg: 0.3102 caption_loss_cls: 1.9359 grounding_loss_reg: 2.0174 semantic_segmentation_loss_cls: 0.0065 instance_segmentation_loss_cls: 0.0240 instance_segmentation_loss_reg: 0.3065 instance_segmentation_loss_poly: 0.8097 +2024/01/13 06:45:14 - mmengine - INFO - Saving checkpoint at 600000 iterations +2024/01/13 06:57:31 - mmengine - INFO - Evaluating bbox... +2024/01/13 06:58:27 - mmengine - INFO - bbox_mAP_copypaste: 0.514 0.694 0.561 0.352 0.563 0.649 +2024/01/13 06:58:27 - mmengine - INFO - Evaluating segm... +2024/01/13 06:59:41 - mmengine - INFO - segm_mAP_copypaste: 0.351 0.617 0.351 0.199 0.397 0.531 +2024/01/13 07:07:38 - mmengine - INFO - per class results: +2024/01/13 07:07:38 - mmengine - INFO - ++---------------------+-------+-------+ +| Class | IoU | Acc | ++---------------------+-------+-------+ +| wall | 78.66 | 89.38 | +| building | 83.51 | 91.59 | +| sky | 93.38 | 97.69 | +| floor | 82.71 | 91.34 | +| tree | 74.23 | 88.07 | +| ceiling | 85.02 | 94.64 | +| road | 83.64 | 89.71 | +| bed | 90.16 | 96.06 | +| windowpane | 63.7 | 79.9 | +| grass | 67.27 | 85.26 | +| cabinet | 65.09 | 76.92 | +| sidewalk | 65.99 | 80.38 | +| person | 81.26 | 91.98 | +| earth | 42.18 | 53.96 | +| door | 54.64 | 71.03 | +| table | 66.45 | 80.87 | +| mountain | 62.58 | 75.69 | +| plant | 51.52 | 61.43 | +| curtain | 75.83 | 87.48 | +| chair | 61.31 | 73.98 | +| car | 85.13 | 92.12 | +| water | 56.0 | 70.75 | +| painting | 72.54 | 87.11 | +| sofa | 70.6 | 82.26 | +| shelf | 46.25 | 63.44 | +| house | 49.77 | 70.47 | +| sea | 54.08 | 72.68 | +| mirror | 70.09 | 78.45 | +| rug | 69.22 | 77.12 | +| field | 31.85 | 49.93 | +| armchair | 49.2 | 69.31 | +| seat | 62.07 | 80.21 | +| fence | 44.58 | 60.32 | +| desk | 47.3 | 67.6 | +| rock | 44.64 | 65.24 | +| wardrobe | 51.18 | 62.32 | +| lamp | 64.21 | 76.22 | +| bathtub | 80.77 | 83.97 | +| railing | 37.68 | 52.66 | +| cushion | 61.74 | 73.67 | +| base | 23.84 | 32.32 | +| box | 29.1 | 38.48 | +| column | 52.68 | 65.86 | +| signboard | 38.76 | 52.6 | +| chest of drawers | 39.42 | 58.13 | +| counter | 25.38 | 35.48 | +| sand | 48.63 | 65.1 | +| sink | 76.37 | 83.48 | +| skyscraper | 64.03 | 80.61 | +| fireplace | 79.06 | 90.24 | +| refrigerator | 74.44 | 79.35 | +| grandstand | 41.48 | 75.93 | +| path | 25.65 | 38.91 | +| stairs | 27.05 | 31.36 | +| runway | 67.42 | 86.86 | +| case | 51.65 | 68.29 | +| pool table | 91.97 | 96.76 | +| pillow | 59.82 | 70.21 | +| screen door | 78.03 | 81.18 | +| stairway | 30.61 | 46.34 | +| river | 13.33 | 27.99 | +| bridge | 56.03 | 74.8 | +| bookcase | 39.41 | 60.76 | +| blind | 40.01 | 44.4 | +| coffee table | 68.21 | 83.51 | +| toilet | 87.17 | 91.97 | +| flower | 41.03 | 56.05 | +| book | 52.88 | 72.3 | +| hill | 13.37 | 23.29 | +| bench | 60.83 | 67.98 | +| countertop | 62.52 | 79.45 | +| stove | 77.02 | 84.87 | +| palm | 44.7 | 59.39 | +| kitchen island | 43.33 | 74.95 | +| computer | 74.29 | 84.51 | +| swivel chair | 44.13 | 62.07 | +| boat | 74.21 | 79.57 | +| bar | 35.59 | 45.39 | +| arcade machine | 51.53 | 56.4 | +| hovel | 18.96 | 22.84 | +| bus | 93.07 | 95.65 | +| towel | 64.83 | 80.47 | +| light | 53.45 | 64.14 | +| truck | 43.65 | 60.05 | +| tower | 24.0 | 41.03 | +| chandelier | 66.3 | 80.18 | +| awning | 37.22 | 43.71 | +| streetlight | 33.18 | 44.6 | +| booth | 34.48 | 39.95 | +| television receiver | 71.43 | 81.64 | +| airplane | 59.51 | 74.86 | +| dirt track | 16.67 | 20.92 | +| apparel | 34.47 | 45.88 | +| pole | 28.67 | 40.2 | +| land | 2.92 | 4.7 | +| bannister | 16.35 | 21.51 | +| escalator | 26.79 | 29.59 | +| ottoman | 49.74 | 69.4 | +| bottle | 23.33 | 29.3 | +| buffet | 41.64 | 50.86 | +| poster | 34.19 | 42.26 | +| stage | 11.5 | 19.28 | +| van | 46.82 | 60.97 | +| ship | 16.61 | 18.74 | +| fountain | 21.18 | 21.71 | +| conveyer belt | 82.45 | 91.45 | +| canopy | 26.45 | 29.38 | +| washer | 70.2 | 70.92 | +| plaything | 28.31 | 33.0 | +| swimming pool | 65.83 | 71.53 | +| stool | 52.24 | 65.14 | +| barrel | 44.55 | 69.47 | +| basket | 30.11 | 45.84 | +| waterfall | 56.02 | 76.64 | +| tent | 92.21 | 96.7 | +| bag | 19.56 | 23.97 | +| minibike | 73.11 | 84.07 | +| cradle | 75.36 | 95.9 | +| oven | 54.86 | 72.91 | +| ball | 53.44 | 69.79 | +| food | 51.68 | 55.93 | +| step | 12.67 | 17.96 | +| tank | 37.24 | 44.32 | +| trade name | 27.13 | 31.62 | +| microwave | 85.75 | 91.19 | +| pot | 52.89 | 61.16 | +| animal | 58.68 | 62.15 | +| bicycle | 57.33 | 75.11 | +| lake | 56.31 | 63.47 | +| dishwasher | 59.52 | 68.9 | +| screen | 52.1 | 71.98 | +| blanket | 16.43 | 18.66 | +| sculpture | 56.62 | 66.88 | +| hood | 58.63 | 69.42 | +| sconce | 45.58 | 56.26 | +| vase | 46.21 | 60.79 | +| traffic light | 41.25 | 59.57 | +| tray | 8.58 | 15.64 | +| ashcan | 50.15 | 63.52 | +| fan | 60.0 | 71.51 | +| pier | 31.04 | 52.03 | +| crt screen | 7.62 | 19.08 | +| plate | 56.9 | 76.14 | +| monitor | 29.28 | 36.21 | +| bulletin board | 52.67 | 65.59 | +| shower | 2.78 | 4.89 | +| radiator | 58.8 | 65.04 | +| glass | 21.03 | 23.0 | +| clock | 26.89 | 33.5 | +| flag | 33.73 | 39.17 | ++---------------------+-------+-------+ +2024/01/13 07:07:56 - mmengine - INFO - Iter(val) [209/209] coco/bbox_mAP: 0.5140 coco/bbox_mAP_50: 0.6940 coco/bbox_mAP_75: 0.5610 coco/bbox_mAP_s: 0.3520 coco/bbox_mAP_m: 0.5630 coco/bbox_mAP_l: 0.6490 coco/segm_mAP: 0.3510 coco/segm_mAP_50: 0.6170 coco/segm_mAP_75: 0.3510 coco/segm_mAP_s: 0.1990 coco/segm_mAP_m: 0.3970 coco/segm_mAP_l: 0.5310 Bleu_1: 0.7673 Bleu_2: 0.6062 Bleu_3: 0.4662 Bleu_4: 0.3555 METEOR: 0.2778 ROUGE_L: 0.5667 CIDEr: 1.1491 SPICE: 0.2066 aAcc: 84.0400 mIoU: 50.8900 mAcc: 62.2800 visual-grounding/miou: 0.8300 visual-grounding/acc: 0.8886 data_time: 0.0107 time: 1.3591 +2024/01/13 07:19:17 - mmengine - INFO - Iter(train) [600500/640000] base_lr: 3.8552e-06 lr: 2.1687e-06 eta: 16:02:15 time: 1.4613 data_time: 0.0210 memory: 25719 grad_norm: 3.7472 loss: 1.0853 detection_loss_cls: 0.0246 detection_loss_reg: 0.3106 caption_loss_cls: 1.9340 grounding_loss_reg: 2.0160 semantic_segmentation_loss_cls: 0.0065 instance_segmentation_loss_cls: 0.0239 instance_segmentation_loss_reg: 0.3068 instance_segmentation_loss_poly: 0.8098 +2024/01/13 07:31:57 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240113_050346 +2024/01/13 07:31:57 - mmengine - INFO - Iter(train) [601000/640000] base_lr: 3.8087e-06 lr: 2.1644e-06 eta: 15:53:49 time: 1.4648 data_time: 0.0211 memory: 25719 grad_norm: 3.6930 loss: 1.0745 detection_loss_cls: 0.0245 detection_loss_reg: 0.3093 caption_loss_cls: 1.9350 grounding_loss_reg: 2.0133 semantic_segmentation_loss_cls: 0.0065 instance_segmentation_loss_cls: 0.0239 instance_segmentation_loss_reg: 0.3061 instance_segmentation_loss_poly: 0.8080 +2024/01/13 07:44:09 - mmengine - INFO - Iter(train) [601500/640000] base_lr: 3.7628e-06 lr: 2.1603e-06 eta: 15:41:22 time: 1.4650 data_time: 0.0215 memory: 25719 grad_norm: 3.7194 loss: 1.0871 detection_loss_cls: 0.0245 detection_loss_reg: 0.3098 caption_loss_cls: 1.9339 grounding_loss_reg: 2.0130 semantic_segmentation_loss_cls: 0.0065 instance_segmentation_loss_cls: 0.0238 instance_segmentation_loss_reg: 0.3057 instance_segmentation_loss_poly: 0.8078 +2024/01/13 07:56:19 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240113_050346 +2024/01/13 07:56:19 - mmengine - INFO - Iter(train) [602000/640000] base_lr: 3.7174e-06 lr: 2.1561e-06 eta: 15:28:39 time: 1.4653 data_time: 0.0218 memory: 25719 grad_norm: 3.7372 loss: 1.0924 detection_loss_cls: 0.0243 detection_loss_reg: 0.3094 caption_loss_cls: 1.9318 grounding_loss_reg: 2.0106 semantic_segmentation_loss_cls: 0.0065 instance_segmentation_loss_cls: 0.0238 instance_segmentation_loss_reg: 0.3063 instance_segmentation_loss_poly: 0.8086 +2024/01/13 07:56:19 - mmengine - INFO - Saving checkpoint at 602000 iterations +2024/01/13 08:08:15 - mmengine - INFO - Iter(train) [602500/640000] base_lr: 3.6726e-06 lr: 2.1521e-06 eta: 15:14:44 time: 1.4548 data_time: 0.0223 memory: 25719 grad_norm: 3.7769 loss: 1.0908 detection_loss_cls: 0.0242 detection_loss_reg: 0.3084 caption_loss_cls: 1.9364 grounding_loss_reg: 2.0099 semantic_segmentation_loss_cls: 0.0065 instance_segmentation_loss_cls: 0.0238 instance_segmentation_loss_reg: 0.3058 instance_segmentation_loss_poly: 0.8071 +2024/01/13 08:20:18 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240113_050346 +2024/01/13 08:20:18 - mmengine - INFO - Iter(train) [603000/640000] base_lr: 3.6285e-06 lr: 2.1480e-06 eta: 15:01:45 time: 1.4536 data_time: 0.0223 memory: 25719 grad_norm: 3.7995 loss: 1.0828 detection_loss_cls: 0.0241 detection_loss_reg: 0.3068 caption_loss_cls: 1.9334 grounding_loss_reg: 2.0115 semantic_segmentation_loss_cls: 0.0065 instance_segmentation_loss_cls: 0.0235 instance_segmentation_loss_reg: 0.3031 instance_segmentation_loss_poly: 0.8021 +2024/01/13 08:32:36 - mmengine - INFO - Iter(train) [603500/640000] base_lr: 3.5849e-06 lr: 2.1441e-06 eta: 14:50:02 time: 1.4584 data_time: 0.0226 memory: 25719 grad_norm: 3.7753 loss: 1.0799 detection_loss_cls: 0.0240 detection_loss_reg: 0.3063 caption_loss_cls: 1.9275 grounding_loss_reg: 2.0092 semantic_segmentation_loss_cls: 0.0065 instance_segmentation_loss_cls: 0.0235 instance_segmentation_loss_reg: 0.3023 instance_segmentation_loss_poly: 0.8007 +2024/01/13 08:44:45 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240113_050346 +2024/01/13 08:44:45 - mmengine - INFO - Iter(train) [604000/640000] base_lr: 3.5419e-06 lr: 2.1402e-06 eta: 14:37:38 time: 1.4518 data_time: 0.0229 memory: 25719 grad_norm: 3.8201 loss: 1.0911 detection_loss_cls: 0.0240 detection_loss_reg: 0.3061 caption_loss_cls: 1.9264 grounding_loss_reg: 2.0077 semantic_segmentation_loss_cls: 0.0065 instance_segmentation_loss_cls: 0.0235 instance_segmentation_loss_reg: 0.3032 instance_segmentation_loss_poly: 0.8022 +2024/01/13 08:44:45 - mmengine - INFO - Saving checkpoint at 604000 iterations +2024/01/13 08:57:05 - mmengine - INFO - Iter(train) [604500/640000] base_lr: 3.4994e-06 lr: 2.1363e-06 eta: 14:26:00 time: 1.4659 data_time: 0.0272 memory: 25719 grad_norm: 3.7551 loss: 1.0798 detection_loss_cls: 0.0241 detection_loss_reg: 0.3065 caption_loss_cls: 1.9249 grounding_loss_reg: 2.0054 semantic_segmentation_loss_cls: 0.0065 instance_segmentation_loss_cls: 0.0236 instance_segmentation_loss_reg: 0.3045 instance_segmentation_loss_poly: 0.8037 +2024/01/13 09:09:10 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240113_050346 +2024/01/13 09:09:10 - mmengine - INFO - Iter(train) [605000/640000] base_lr: 3.4576e-06 lr: 2.1325e-06 eta: 14:13:22 time: 1.4573 data_time: 0.0271 memory: 25719 grad_norm: 3.7910 loss: 1.0858 detection_loss_cls: 0.0242 detection_loss_reg: 0.3085 caption_loss_cls: 1.9237 grounding_loss_reg: 2.0062 semantic_segmentation_loss_cls: 0.0065 instance_segmentation_loss_cls: 0.0236 instance_segmentation_loss_reg: 0.3046 instance_segmentation_loss_poly: 0.8043 +2024/01/13 09:22:13 - mmengine - INFO - Iter(train) [605500/640000] base_lr: 3.4163e-06 lr: 2.1288e-06 eta: 14:04:15 time: 1.4699 data_time: 0.0273 memory: 25719 grad_norm: 3.7287 loss: 1.0691 detection_loss_cls: 0.0241 detection_loss_reg: 0.3078 caption_loss_cls: 1.9222 grounding_loss_reg: 2.0039 semantic_segmentation_loss_cls: 0.0065 instance_segmentation_loss_cls: 0.0236 instance_segmentation_loss_reg: 0.3054 instance_segmentation_loss_poly: 0.8056 +2024/01/13 09:34:22 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240113_050346 +2024/01/13 09:34:22 - mmengine - INFO - Iter(train) [606000/640000] base_lr: 3.3757e-06 lr: 2.1251e-06 eta: 13:51:42 time: 1.4698 data_time: 0.0273 memory: 25719 grad_norm: 3.7275 loss: 1.0744 detection_loss_cls: 0.0241 detection_loss_reg: 0.3082 caption_loss_cls: 1.9269 grounding_loss_reg: 2.0072 semantic_segmentation_loss_cls: 0.0065 instance_segmentation_loss_cls: 0.0236 instance_segmentation_loss_reg: 0.3065 instance_segmentation_loss_poly: 0.8073 +2024/01/13 09:34:22 - mmengine - INFO - Saving checkpoint at 606000 iterations +2024/01/13 09:47:23 - mmengine - INFO - Iter(train) [606500/640000] base_lr: 3.3356e-06 lr: 2.1214e-06 eta: 13:41:55 time: 1.4859 data_time: 0.0273 memory: 25719 grad_norm: 3.6519 loss: 1.0569 detection_loss_cls: 0.0240 detection_loss_reg: 0.3085 caption_loss_cls: 1.9247 grounding_loss_reg: 2.0045 semantic_segmentation_loss_cls: 0.0065 instance_segmentation_loss_cls: 0.0236 instance_segmentation_loss_reg: 0.3065 instance_segmentation_loss_poly: 0.8074 +2024/01/13 10:00:03 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240113_050346 +2024/01/13 10:00:03 - mmengine - INFO - Iter(train) [607000/640000] base_lr: 3.2961e-06 lr: 2.1178e-06 eta: 13:30:50 time: 1.4952 data_time: 0.0276 memory: 25719 grad_norm: 3.5808 loss: 1.0542 detection_loss_cls: 0.0241 detection_loss_reg: 0.3091 caption_loss_cls: 1.9197 grounding_loss_reg: 2.0048 semantic_segmentation_loss_cls: 0.0065 instance_segmentation_loss_cls: 0.0236 instance_segmentation_loss_reg: 0.3060 instance_segmentation_loss_poly: 0.8071 +2024/01/13 10:12:15 - mmengine - INFO - Iter(train) [607500/640000] base_lr: 3.2572e-06 lr: 2.1143e-06 eta: 13:18:16 time: 1.4937 data_time: 0.0277 memory: 25719 grad_norm: 3.6023 loss: 1.0628 detection_loss_cls: 0.0242 detection_loss_reg: 0.3106 caption_loss_cls: 1.9184 grounding_loss_reg: 2.0036 semantic_segmentation_loss_cls: 0.0065 instance_segmentation_loss_cls: 0.0238 instance_segmentation_loss_reg: 0.3081 instance_segmentation_loss_poly: 0.8111 +2024/01/13 10:23:30 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240113_050346 +2024/01/13 10:23:30 - mmengine - INFO - Iter(train) [608000/640000] base_lr: 3.2189e-06 lr: 2.1108e-06 eta: 13:03:13 time: 1.4802 data_time: 0.0275 memory: 25719 grad_norm: 3.6123 loss: 1.0593 detection_loss_cls: 0.0241 detection_loss_reg: 0.3102 caption_loss_cls: 1.9200 grounding_loss_reg: 1.9992 semantic_segmentation_loss_cls: 0.0065 instance_segmentation_loss_cls: 0.0238 instance_segmentation_loss_reg: 0.3081 instance_segmentation_loss_poly: 0.8107 +2024/01/13 10:23:30 - mmengine - INFO - Saving checkpoint at 608000 iterations +2024/01/13 10:36:03 - mmengine - INFO - Iter(train) [608500/640000] base_lr: 3.1812e-06 lr: 2.1074e-06 eta: 12:51:46 time: 1.4836 data_time: 0.0276 memory: 25719 grad_norm: 3.6483 loss: 1.0595 detection_loss_cls: 0.0240 detection_loss_reg: 0.3091 caption_loss_cls: 1.9136 grounding_loss_reg: 2.0003 semantic_segmentation_loss_cls: 0.0065 instance_segmentation_loss_cls: 0.0236 instance_segmentation_loss_reg: 0.3067 instance_segmentation_loss_poly: 0.8076 +2024/01/13 10:47:33 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240113_050346 +2024/01/13 10:47:33 - mmengine - INFO - Iter(train) [609000/640000] base_lr: 3.1441e-06 lr: 2.1040e-06 eta: 12:37:42 time: 1.4746 data_time: 0.0274 memory: 25719 grad_norm: 3.6898 loss: 1.0599 detection_loss_cls: 0.0240 detection_loss_reg: 0.3089 caption_loss_cls: 1.9153 grounding_loss_reg: 1.9986 semantic_segmentation_loss_cls: 0.0065 instance_segmentation_loss_cls: 0.0236 instance_segmentation_loss_reg: 0.3062 instance_segmentation_loss_poly: 0.8052 +2024/01/13 10:59:37 - mmengine - INFO - Iter(train) [609500/640000] base_lr: 3.1075e-06 lr: 2.1007e-06 eta: 12:25:06 time: 1.4598 data_time: 0.0273 memory: 25719 grad_norm: 3.7471 loss: 1.0751 detection_loss_cls: 0.0239 detection_loss_reg: 0.3085 caption_loss_cls: 1.9144 grounding_loss_reg: 1.9957 semantic_segmentation_loss_cls: 0.0065 instance_segmentation_loss_cls: 0.0235 instance_segmentation_loss_reg: 0.3063 instance_segmentation_loss_poly: 0.8052 +2024/01/13 11:12:04 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240113_050346 +2024/01/13 11:12:04 - mmengine - INFO - Iter(train) [610000/640000] base_lr: 3.0716e-06 lr: 2.0974e-06 eta: 12:13:22 time: 1.4643 data_time: 0.0273 memory: 25719 grad_norm: 3.7187 loss: 1.0648 detection_loss_cls: 0.0238 detection_loss_reg: 0.3070 caption_loss_cls: 1.9133 grounding_loss_reg: 1.9952 semantic_segmentation_loss_cls: 0.0065 instance_segmentation_loss_cls: 0.0235 instance_segmentation_loss_reg: 0.3051 instance_segmentation_loss_poly: 0.8035 +2024/01/13 11:12:04 - mmengine - INFO - Saving checkpoint at 610000 iterations +2024/01/13 11:24:15 - mmengine - INFO - Iter(train) [610500/640000] base_lr: 3.0362e-06 lr: 2.0942e-06 eta: 12:01:03 time: 1.4521 data_time: 0.0272 memory: 25719 grad_norm: 3.7922 loss: 1.0830 detection_loss_cls: 0.0238 detection_loss_reg: 0.3070 caption_loss_cls: 1.9095 grounding_loss_reg: 1.9934 semantic_segmentation_loss_cls: 0.0065 instance_segmentation_loss_cls: 0.0235 instance_segmentation_loss_reg: 0.3039 instance_segmentation_loss_poly: 0.8009 +2024/01/13 11:36:17 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240113_050346 +2024/01/13 11:36:17 - mmengine - INFO - Iter(train) [611000/640000] base_lr: 3.0015e-06 lr: 2.0910e-06 eta: 11:48:28 time: 1.4425 data_time: 0.0271 memory: 25719 grad_norm: 3.8417 loss: 1.0880 detection_loss_cls: 0.0237 detection_loss_reg: 0.3065 caption_loss_cls: 1.9079 grounding_loss_reg: 1.9922 semantic_segmentation_loss_cls: 0.0065 instance_segmentation_loss_cls: 0.0236 instance_segmentation_loss_reg: 0.3041 instance_segmentation_loss_poly: 0.8009 +2024/01/13 11:48:33 - mmengine - INFO - Iter(train) [611500/640000] base_lr: 2.9673e-06 lr: 2.0879e-06 eta: 11:36:19 time: 1.4435 data_time: 0.0270 memory: 25719 grad_norm: 3.8682 loss: 1.0875 detection_loss_cls: 0.0237 detection_loss_reg: 0.3069 caption_loss_cls: 1.9072 grounding_loss_reg: 1.9934 semantic_segmentation_loss_cls: 0.0065 instance_segmentation_loss_cls: 0.0236 instance_segmentation_loss_reg: 0.3050 instance_segmentation_loss_poly: 0.8019 +2024/01/13 12:00:52 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240113_050346 +2024/01/13 12:00:52 - mmengine - INFO - Iter(train) [612000/640000] base_lr: 2.9337e-06 lr: 2.0849e-06 eta: 11:24:16 time: 1.4595 data_time: 0.0272 memory: 25719 grad_norm: 3.8467 loss: 1.0865 detection_loss_cls: 0.0237 detection_loss_reg: 0.3074 caption_loss_cls: 1.9078 grounding_loss_reg: 1.9920 semantic_segmentation_loss_cls: 0.0065 instance_segmentation_loss_cls: 0.0237 instance_segmentation_loss_reg: 0.3057 instance_segmentation_loss_poly: 0.8033 +2024/01/13 12:00:52 - mmengine - INFO - Saving checkpoint at 612000 iterations +2024/01/13 12:13:03 - mmengine - INFO - Iter(train) [612500/640000] base_lr: 2.9007e-06 lr: 2.0819e-06 eta: 11:11:58 time: 1.4540 data_time: 0.0269 memory: 25719 grad_norm: 3.8263 loss: 1.0777 detection_loss_cls: 0.0237 detection_loss_reg: 0.3070 caption_loss_cls: 1.9088 grounding_loss_reg: 1.9927 semantic_segmentation_loss_cls: 0.0065 instance_segmentation_loss_cls: 0.0237 instance_segmentation_loss_reg: 0.3057 instance_segmentation_loss_poly: 0.8034 +2024/01/13 12:26:08 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240113_050346 +2024/01/13 12:26:08 - mmengine - INFO - Iter(train) [613000/640000] base_lr: 2.8683e-06 lr: 2.0789e-06 eta: 11:01:07 time: 1.4777 data_time: 0.0274 memory: 25719 grad_norm: 3.7497 loss: 1.0737 detection_loss_cls: 0.0237 detection_loss_reg: 0.3065 caption_loss_cls: 1.9085 grounding_loss_reg: 1.9925 semantic_segmentation_loss_cls: 0.0065 instance_segmentation_loss_cls: 0.0238 instance_segmentation_loss_reg: 0.3058 instance_segmentation_loss_poly: 0.8038 +2024/01/13 12:38:29 - mmengine - INFO - Iter(train) [613500/640000] base_lr: 2.8365e-06 lr: 2.0760e-06 eta: 10:49:00 time: 1.4819 data_time: 0.0273 memory: 25719 grad_norm: 3.7502 loss: 1.0699 detection_loss_cls: 0.0237 detection_loss_reg: 0.3061 caption_loss_cls: 1.9091 grounding_loss_reg: 1.9921 semantic_segmentation_loss_cls: 0.0065 instance_segmentation_loss_cls: 0.0236 instance_segmentation_loss_reg: 0.3049 instance_segmentation_loss_poly: 0.8025 +2024/01/13 12:50:17 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240113_050346 +2024/01/13 12:50:17 - mmengine - INFO - Iter(train) [614000/640000] base_lr: 2.8053e-06 lr: 2.0732e-06 eta: 10:36:07 time: 1.4724 data_time: 0.0272 memory: 25719 grad_norm: 3.7745 loss: 1.0801 detection_loss_cls: 0.0237 detection_loss_reg: 0.3065 caption_loss_cls: 1.9092 grounding_loss_reg: 1.9930 semantic_segmentation_loss_cls: 0.0065 instance_segmentation_loss_cls: 0.0237 instance_segmentation_loss_reg: 0.3052 instance_segmentation_loss_poly: 0.8025 +2024/01/13 12:50:17 - mmengine - INFO - Saving checkpoint at 614000 iterations +2024/01/13 13:02:20 - mmengine - INFO - Iter(train) [614500/640000] base_lr: 2.7746e-06 lr: 2.0704e-06 eta: 10:23:37 time: 1.4702 data_time: 0.0272 memory: 25719 grad_norm: 3.7995 loss: 1.0886 detection_loss_cls: 0.0237 detection_loss_reg: 0.3067 caption_loss_cls: 1.9093 grounding_loss_reg: 1.9947 semantic_segmentation_loss_cls: 0.0065 instance_segmentation_loss_cls: 0.0236 instance_segmentation_loss_reg: 0.3054 instance_segmentation_loss_poly: 0.8029 +2024/01/13 13:15:07 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240113_050346 +2024/01/13 13:15:07 - mmengine - INFO - Iter(train) [615000/640000] base_lr: 2.7446e-06 lr: 2.0677e-06 eta: 10:12:06 time: 1.4814 data_time: 0.0274 memory: 25719 grad_norm: 3.8075 loss: 1.0836 detection_loss_cls: 0.0237 detection_loss_reg: 0.3059 caption_loss_cls: 1.9080 grounding_loss_reg: 1.9952 semantic_segmentation_loss_cls: 0.0065 instance_segmentation_loss_cls: 0.0236 instance_segmentation_loss_reg: 0.3056 instance_segmentation_loss_poly: 0.8035 +2024/01/13 13:28:20 - mmengine - INFO - Iter(train) [615500/640000] base_lr: 2.7151e-06 lr: 2.0650e-06 eta: 10:01:04 time: 1.4957 data_time: 0.0276 memory: 25719 grad_norm: 3.7378 loss: 1.0661 detection_loss_cls: 0.0238 detection_loss_reg: 0.3060 caption_loss_cls: 1.9023 grounding_loss_reg: 1.9957 semantic_segmentation_loss_cls: 0.0065 instance_segmentation_loss_cls: 0.0235 instance_segmentation_loss_reg: 0.3053 instance_segmentation_loss_poly: 0.8020 +2024/01/13 13:40:41 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240113_050346 +2024/01/13 13:40:41 - mmengine - INFO - Iter(train) [616000/640000] base_lr: 2.6863e-06 lr: 2.0624e-06 eta: 9:48:54 time: 1.4962 data_time: 0.0277 memory: 25719 grad_norm: 3.7525 loss: 1.0676 detection_loss_cls: 0.0237 detection_loss_reg: 0.3057 caption_loss_cls: 1.8994 grounding_loss_reg: 1.9943 semantic_segmentation_loss_cls: 0.0065 instance_segmentation_loss_cls: 0.0235 instance_segmentation_loss_reg: 0.3055 instance_segmentation_loss_poly: 0.8023 +2024/01/13 13:40:41 - mmengine - INFO - Saving checkpoint at 616000 iterations +2024/01/13 13:53:40 - mmengine - INFO - Iter(train) [616500/640000] base_lr: 2.6580e-06 lr: 2.0598e-06 eta: 9:37:26 time: 1.5081 data_time: 0.0280 memory: 25719 grad_norm: 3.7240 loss: 1.0659 detection_loss_cls: 0.0237 detection_loss_reg: 0.3061 caption_loss_cls: 1.8938 grounding_loss_reg: 1.9919 semantic_segmentation_loss_cls: 0.0065 instance_segmentation_loss_cls: 0.0235 instance_segmentation_loss_reg: 0.3052 instance_segmentation_loss_poly: 0.8017 +2024/01/13 14:05:43 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240113_050346 +2024/01/13 14:05:43 - mmengine - INFO - Iter(train) [617000/640000] base_lr: 2.6303e-06 lr: 2.0573e-06 eta: 9:24:53 time: 1.4926 data_time: 0.0277 memory: 25719 grad_norm: 3.7900 loss: 1.0704 detection_loss_cls: 0.0238 detection_loss_reg: 0.3056 caption_loss_cls: 1.8938 grounding_loss_reg: 1.9944 semantic_segmentation_loss_cls: 0.0065 instance_segmentation_loss_cls: 0.0235 instance_segmentation_loss_reg: 0.3057 instance_segmentation_loss_poly: 0.8031 +2024/01/13 14:18:16 - mmengine - INFO - Iter(train) [617500/640000] base_lr: 2.6033e-06 lr: 2.0548e-06 eta: 9:12:52 time: 1.4956 data_time: 0.0279 memory: 25719 grad_norm: 3.8011 loss: 1.0750 detection_loss_cls: 0.0239 detection_loss_reg: 0.3072 caption_loss_cls: 1.8947 grounding_loss_reg: 1.9932 semantic_segmentation_loss_cls: 0.0065 instance_segmentation_loss_cls: 0.0236 instance_segmentation_loss_reg: 0.3059 instance_segmentation_loss_poly: 0.8037 +2024/01/13 14:31:08 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240113_050346 +2024/01/13 14:31:08 - mmengine - INFO - Iter(train) [618000/640000] base_lr: 2.5768e-06 lr: 2.0524e-06 eta: 9:01:09 time: 1.5115 data_time: 0.0280 memory: 25719 grad_norm: 3.7413 loss: 1.0584 detection_loss_cls: 0.0237 detection_loss_reg: 0.3062 caption_loss_cls: 1.8937 grounding_loss_reg: 1.9962 semantic_segmentation_loss_cls: 0.0065 instance_segmentation_loss_cls: 0.0236 instance_segmentation_loss_reg: 0.3059 instance_segmentation_loss_poly: 0.8030 +2024/01/13 14:31:08 - mmengine - INFO - Saving checkpoint at 618000 iterations +2024/01/13 14:43:45 - mmengine - INFO - Iter(train) [618500/640000] base_lr: 2.5509e-06 lr: 2.0501e-06 eta: 8:49:09 time: 1.5201 data_time: 0.0280 memory: 25719 grad_norm: 3.7172 loss: 1.0433 detection_loss_cls: 0.0238 detection_loss_reg: 0.3062 caption_loss_cls: 1.8919 grounding_loss_reg: 1.9959 semantic_segmentation_loss_cls: 0.0065 instance_segmentation_loss_cls: 0.0235 instance_segmentation_loss_reg: 0.3056 instance_segmentation_loss_poly: 0.8018 +2024/01/13 14:55:41 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240113_050346 +2024/01/13 14:55:41 - mmengine - INFO - Iter(train) [619000/640000] base_lr: 2.5256e-06 lr: 2.0478e-06 eta: 8:36:30 time: 1.5073 data_time: 0.0277 memory: 25719 grad_norm: 3.7308 loss: 1.0464 detection_loss_cls: 0.0237 detection_loss_reg: 0.3053 caption_loss_cls: 1.8930 grounding_loss_reg: 1.9953 semantic_segmentation_loss_cls: 0.0065 instance_segmentation_loss_cls: 0.0234 instance_segmentation_loss_reg: 0.3049 instance_segmentation_loss_poly: 0.8004 +2024/01/13 15:07:34 - mmengine - INFO - Iter(train) [619500/640000] base_lr: 2.5009e-06 lr: 2.0455e-06 eta: 8:23:50 time: 1.4874 data_time: 0.0273 memory: 25719 grad_norm: 3.7819 loss: 1.0563 detection_loss_cls: 0.0236 detection_loss_reg: 0.3046 caption_loss_cls: 1.8946 grounding_loss_reg: 1.9957 semantic_segmentation_loss_cls: 0.0065 instance_segmentation_loss_cls: 0.0233 instance_segmentation_loss_reg: 0.3039 instance_segmentation_loss_poly: 0.7978 +2024/01/13 15:19:05 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240113_050346 +2024/01/13 15:19:05 - mmengine - INFO - Iter(train) [620000/640000] base_lr: 2.4768e-06 lr: 2.0433e-06 eta: 8:10:54 time: 1.4749 data_time: 0.0271 memory: 25719 grad_norm: 3.7989 loss: 1.0595 detection_loss_cls: 0.0236 detection_loss_reg: 0.3048 caption_loss_cls: 1.8958 grounding_loss_reg: 1.9976 semantic_segmentation_loss_cls: 0.0065 instance_segmentation_loss_cls: 0.0233 instance_segmentation_loss_reg: 0.3041 instance_segmentation_loss_poly: 0.7981 +2024/01/13 15:19:05 - mmengine - INFO - Saving checkpoint at 620000 iterations +2024/01/13 15:31:32 - mmengine - INFO - Evaluating bbox... +2024/01/13 15:32:28 - mmengine - INFO - bbox_mAP_copypaste: 0.513 0.694 0.560 0.355 0.562 0.653 +2024/01/13 15:32:28 - mmengine - INFO - Evaluating segm... +2024/01/13 15:33:40 - mmengine - INFO - segm_mAP_copypaste: 0.349 0.614 0.345 0.198 0.394 0.532 +2024/01/13 15:41:21 - mmengine - INFO - per class results: +2024/01/13 15:41:21 - mmengine - INFO - ++---------------------+-------+-------+ +| Class | IoU | Acc | ++---------------------+-------+-------+ +| wall | 78.57 | 89.68 | +| building | 83.08 | 91.62 | +| sky | 93.36 | 97.66 | +| floor | 83.12 | 90.84 | +| tree | 73.99 | 87.99 | +| ceiling | 85.42 | 93.54 | +| road | 83.52 | 89.88 | +| bed | 90.09 | 96.2 | +| windowpane | 64.68 | 80.09 | +| grass | 66.56 | 84.62 | +| cabinet | 63.43 | 74.64 | +| sidewalk | 66.99 | 81.48 | +| person | 81.45 | 91.8 | +| earth | 40.56 | 50.89 | +| door | 54.65 | 68.1 | +| table | 67.05 | 80.5 | +| mountain | 61.1 | 72.15 | +| plant | 50.98 | 61.03 | +| curtain | 74.88 | 87.38 | +| chair | 60.52 | 73.56 | +| car | 85.25 | 92.15 | +| water | 52.38 | 64.76 | +| painting | 72.15 | 87.27 | +| sofa | 71.28 | 84.18 | +| shelf | 47.15 | 68.62 | +| house | 48.84 | 70.43 | +| sea | 52.83 | 73.19 | +| mirror | 68.81 | 76.52 | +| rug | 69.6 | 76.9 | +| field | 31.13 | 49.37 | +| armchair | 47.67 | 66.39 | +| seat | 63.47 | 82.17 | +| fence | 46.56 | 64.89 | +| desk | 49.08 | 70.85 | +| rock | 48.02 | 73.08 | +| wardrobe | 44.95 | 61.21 | +| lamp | 63.84 | 75.84 | +| bathtub | 81.14 | 84.86 | +| railing | 38.1 | 52.88 | +| cushion | 62.17 | 73.68 | +| base | 23.46 | 31.59 | +| box | 27.84 | 36.83 | +| column | 53.31 | 65.07 | +| signboard | 37.74 | 51.35 | +| chest of drawers | 39.3 | 62.0 | +| counter | 28.62 | 40.24 | +| sand | 46.34 | 68.48 | +| sink | 76.49 | 83.87 | +| skyscraper | 64.38 | 81.69 | +| fireplace | 79.31 | 90.26 | +| refrigerator | 75.76 | 82.05 | +| grandstand | 40.37 | 76.5 | +| path | 25.11 | 40.48 | +| stairs | 29.52 | 37.4 | +| runway | 66.04 | 86.46 | +| case | 50.96 | 65.08 | +| pool table | 91.86 | 96.79 | +| pillow | 59.63 | 71.25 | +| screen door | 78.61 | 82.0 | +| stairway | 34.09 | 45.65 | +| river | 14.44 | 36.54 | +| bridge | 55.08 | 77.56 | +| bookcase | 39.76 | 61.39 | +| blind | 39.54 | 44.29 | +| coffee table | 69.78 | 83.12 | +| toilet | 87.51 | 91.8 | +| flower | 41.29 | 54.56 | +| book | 52.98 | 70.76 | +| hill | 13.72 | 22.82 | +| bench | 59.44 | 67.54 | +| countertop | 62.05 | 76.25 | +| stove | 77.03 | 85.22 | +| palm | 46.03 | 63.36 | +| kitchen island | 46.07 | 78.13 | +| computer | 76.85 | 87.44 | +| swivel chair | 42.09 | 57.39 | +| boat | 75.4 | 82.49 | +| bar | 32.4 | 44.27 | +| arcade machine | 53.72 | 56.92 | +| hovel | 12.77 | 14.58 | +| bus | 93.02 | 95.81 | +| towel | 64.37 | 79.67 | +| light | 52.74 | 62.58 | +| truck | 42.53 | 59.01 | +| tower | 22.23 | 38.06 | +| chandelier | 64.15 | 77.8 | +| awning | 36.16 | 42.28 | +| streetlight | 33.57 | 44.87 | +| booth | 33.9 | 38.85 | +| television receiver | 71.06 | 83.89 | +| airplane | 66.49 | 76.9 | +| dirt track | 16.7 | 19.65 | +| apparel | 32.46 | 43.31 | +| pole | 27.88 | 41.99 | +| land | 2.91 | 4.64 | +| bannister | 17.13 | 23.02 | +| escalator | 20.75 | 21.14 | +| ottoman | 47.85 | 64.9 | +| bottle | 22.48 | 28.1 | +| buffet | 38.28 | 48.36 | +| poster | 33.76 | 43.18 | +| stage | 11.09 | 19.18 | +| van | 50.3 | 67.18 | +| ship | 20.35 | 22.51 | +| fountain | 22.54 | 23.25 | +| conveyer belt | 69.4 | 91.41 | +| canopy | 22.59 | 27.2 | +| washer | 70.34 | 71.75 | +| plaything | 26.17 | 29.96 | +| swimming pool | 69.19 | 71.84 | +| stool | 50.95 | 64.86 | +| barrel | 13.88 | 33.97 | +| basket | 30.47 | 47.5 | +| waterfall | 56.07 | 79.56 | +| tent | 79.7 | 96.95 | +| bag | 22.71 | 28.57 | +| minibike | 73.07 | 83.24 | +| cradle | 74.9 | 96.54 | +| oven | 54.48 | 73.05 | +| ball | 54.16 | 69.45 | +| food | 54.53 | 60.01 | +| step | 15.48 | 22.74 | +| tank | 38.63 | 50.77 | +| trade name | 29.74 | 35.89 | +| microwave | 85.95 | 91.67 | +| pot | 50.87 | 59.48 | +| animal | 57.52 | 60.8 | +| bicycle | 57.52 | 74.47 | +| lake | 56.25 | 63.78 | +| dishwasher | 64.32 | 75.5 | +| screen | 52.18 | 72.28 | +| blanket | 17.23 | 19.39 | +| sculpture | 59.79 | 71.25 | +| hood | 61.31 | 68.44 | +| sconce | 45.54 | 55.09 | +| vase | 47.38 | 61.86 | +| traffic light | 38.08 | 53.58 | +| tray | 9.95 | 19.59 | +| ashcan | 44.26 | 55.0 | +| fan | 60.1 | 72.58 | +| pier | 32.69 | 53.89 | +| crt screen | 10.19 | 19.37 | +| plate | 56.79 | 74.14 | +| monitor | 30.98 | 34.53 | +| bulletin board | 42.62 | 52.81 | +| shower | 3.34 | 6.58 | +| radiator | 57.56 | 64.48 | +| glass | 20.31 | 22.28 | +| clock | 27.7 | 35.55 | +| flag | 33.23 | 39.0 | ++---------------------+-------+-------+ +2024/01/13 15:41:38 - mmengine - INFO - Iter(val) [209/209] coco/bbox_mAP: 0.5130 coco/bbox_mAP_50: 0.6940 coco/bbox_mAP_75: 0.5600 coco/bbox_mAP_s: 0.3550 coco/bbox_mAP_m: 0.5620 coco/bbox_mAP_l: 0.6530 coco/segm_mAP: 0.3490 coco/segm_mAP_50: 0.6140 coco/segm_mAP_75: 0.3450 coco/segm_mAP_s: 0.1980 coco/segm_mAP_m: 0.3940 coco/segm_mAP_l: 0.5320 Bleu_1: 0.7708 Bleu_2: 0.6094 Bleu_3: 0.4691 Bleu_4: 0.3581 METEOR: 0.2790 ROUGE_L: 0.5680 CIDEr: 1.1564 SPICE: 0.2081 aAcc: 83.8900 mIoU: 50.4700 mAcc: 62.1800 visual-grounding/miou: 0.8288 visual-grounding/acc: 0.8858 data_time: 0.0054 time: 1.3543 +2024/01/13 15:53:42 - mmengine - INFO - Iter(train) [620500/640000] base_lr: 2.4532e-06 lr: 2.0412e-06 eta: 7:58:29 time: 1.4619 data_time: 0.0228 memory: 25719 grad_norm: 3.8649 loss: 1.0753 detection_loss_cls: 0.0236 detection_loss_reg: 0.3044 caption_loss_cls: 1.8925 grounding_loss_reg: 1.9991 semantic_segmentation_loss_cls: 0.0064 instance_segmentation_loss_cls: 0.0234 instance_segmentation_loss_reg: 0.3044 instance_segmentation_loss_poly: 0.7991 +2024/01/13 16:06:20 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240113_050346 +2024/01/13 16:06:20 - mmengine - INFO - Iter(train) [621000/640000] base_lr: 2.4303e-06 lr: 2.0391e-06 eta: 7:46:29 time: 1.4706 data_time: 0.0230 memory: 25719 grad_norm: 3.8210 loss: 1.0688 detection_loss_cls: 0.0236 detection_loss_reg: 0.3043 caption_loss_cls: 1.8921 grounding_loss_reg: 2.0016 semantic_segmentation_loss_cls: 0.0064 instance_segmentation_loss_cls: 0.0234 instance_segmentation_loss_reg: 0.3033 instance_segmentation_loss_poly: 0.7967 +2024/01/13 16:19:03 - mmengine - INFO - Iter(train) [621500/640000] base_lr: 2.4080e-06 lr: 2.0371e-06 eta: 7:34:31 time: 1.4730 data_time: 0.0231 memory: 25719 grad_norm: 3.7677 loss: 1.0634 detection_loss_cls: 0.0235 detection_loss_reg: 0.3044 caption_loss_cls: 1.8941 grounding_loss_reg: 1.9990 semantic_segmentation_loss_cls: 0.0065 instance_segmentation_loss_cls: 0.0234 instance_segmentation_loss_reg: 0.3043 instance_segmentation_loss_poly: 0.7983 +2024/01/13 16:31:41 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240113_050346 +2024/01/13 16:31:42 - mmengine - INFO - Iter(train) [622000/640000] base_lr: 2.3862e-06 lr: 2.0351e-06 eta: 7:22:29 time: 1.4697 data_time: 0.0231 memory: 25719 grad_norm: 3.8149 loss: 1.0700 detection_loss_cls: 0.0235 detection_loss_reg: 0.3042 caption_loss_cls: 1.8923 grounding_loss_reg: 2.0000 semantic_segmentation_loss_cls: 0.0064 instance_segmentation_loss_cls: 0.0234 instance_segmentation_loss_reg: 0.3041 instance_segmentation_loss_poly: 0.7976 +2024/01/13 16:31:42 - mmengine - INFO - Saving checkpoint at 622000 iterations +2024/01/13 16:44:41 - mmengine - INFO - Iter(train) [622500/640000] base_lr: 2.3651e-06 lr: 2.0332e-06 eta: 7:10:39 time: 1.4754 data_time: 0.0234 memory: 25719 grad_norm: 3.7683 loss: 1.0733 detection_loss_cls: 0.0236 detection_loss_reg: 0.3054 caption_loss_cls: 1.8914 grounding_loss_reg: 2.0016 semantic_segmentation_loss_cls: 0.0064 instance_segmentation_loss_cls: 0.0234 instance_segmentation_loss_reg: 0.3040 instance_segmentation_loss_poly: 0.7979 +2024/01/13 16:57:31 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240113_050346 +2024/01/13 16:57:31 - mmengine - INFO - Iter(train) [623000/640000] base_lr: 2.3445e-06 lr: 2.0313e-06 eta: 6:58:40 time: 1.4888 data_time: 0.0237 memory: 25719 grad_norm: 3.7135 loss: 1.0778 detection_loss_cls: 0.0237 detection_loss_reg: 0.3070 caption_loss_cls: 1.8956 grounding_loss_reg: 1.9998 semantic_segmentation_loss_cls: 0.0064 instance_segmentation_loss_cls: 0.0236 instance_segmentation_loss_reg: 0.3063 instance_segmentation_loss_poly: 0.8022 +2024/01/13 17:10:56 - mmengine - INFO - Iter(train) [623500/640000] base_lr: 2.3246e-06 lr: 2.0295e-06 eta: 6:47:00 time: 1.5119 data_time: 0.0243 memory: 25719 grad_norm: 3.6625 loss: 1.0759 detection_loss_cls: 0.0238 detection_loss_reg: 0.3083 caption_loss_cls: 1.8992 grounding_loss_reg: 1.9989 semantic_segmentation_loss_cls: 0.0064 instance_segmentation_loss_cls: 0.0236 instance_segmentation_loss_reg: 0.3073 instance_segmentation_loss_poly: 0.8045 +2024/01/13 17:22:53 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240113_050346 +2024/01/13 17:22:53 - mmengine - INFO - Iter(train) [624000/640000] base_lr: 2.3052e-06 lr: 2.0277e-06 eta: 6:34:27 time: 1.5183 data_time: 0.0244 memory: 25719 grad_norm: 3.6244 loss: 1.0762 detection_loss_cls: 0.0238 detection_loss_reg: 0.3078 caption_loss_cls: 1.9001 grounding_loss_reg: 1.9990 semantic_segmentation_loss_cls: 0.0064 instance_segmentation_loss_cls: 0.0236 instance_segmentation_loss_reg: 0.3069 instance_segmentation_loss_poly: 0.8035 +2024/01/13 17:22:53 - mmengine - INFO - Saving checkpoint at 624000 iterations +2024/01/13 17:35:22 - mmengine - INFO - Iter(train) [624500/640000] base_lr: 2.2865e-06 lr: 2.0260e-06 eta: 6:22:12 time: 1.5238 data_time: 0.0288 memory: 25719 grad_norm: 3.5978 loss: 1.0787 detection_loss_cls: 0.0238 detection_loss_reg: 0.3079 caption_loss_cls: 1.9020 grounding_loss_reg: 2.0015 semantic_segmentation_loss_cls: 0.0064 instance_segmentation_loss_cls: 0.0235 instance_segmentation_loss_reg: 0.3069 instance_segmentation_loss_poly: 0.8035 +2024/01/13 17:47:52 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240113_050346 +2024/01/13 17:47:52 - mmengine - INFO - Iter(train) [625000/640000] base_lr: 2.2683e-06 lr: 2.0244e-06 eta: 6:09:57 time: 1.5219 data_time: 0.0288 memory: 25719 grad_norm: 3.6127 loss: 1.0822 detection_loss_cls: 0.0237 detection_loss_reg: 0.3076 caption_loss_cls: 1.9034 grounding_loss_reg: 2.0037 semantic_segmentation_loss_cls: 0.0064 instance_segmentation_loss_cls: 0.0235 instance_segmentation_loss_reg: 0.3064 instance_segmentation_loss_poly: 0.8019 +2024/01/13 17:59:56 - mmengine - INFO - Iter(train) [625500/640000] base_lr: 2.2507e-06 lr: 2.0228e-06 eta: 5:57:29 time: 1.5123 data_time: 0.0287 memory: 25719 grad_norm: 3.6738 loss: 1.0950 detection_loss_cls: 0.0238 detection_loss_reg: 0.3089 caption_loss_cls: 1.9065 grounding_loss_reg: 2.0063 semantic_segmentation_loss_cls: 0.0064 instance_segmentation_loss_cls: 0.0236 instance_segmentation_loss_reg: 0.3070 instance_segmentation_loss_poly: 0.8033 +2024/01/13 18:11:54 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240113_050346 +2024/01/13 18:11:54 - mmengine - INFO - Iter(train) [626000/640000] base_lr: 2.2337e-06 lr: 2.0212e-06 eta: 5:44:59 time: 1.5020 data_time: 0.0285 memory: 25719 grad_norm: 3.6797 loss: 1.0975 detection_loss_cls: 0.0237 detection_loss_reg: 0.3090 caption_loss_cls: 1.9058 grounding_loss_reg: 2.0040 semantic_segmentation_loss_cls: 0.0065 instance_segmentation_loss_cls: 0.0236 instance_segmentation_loss_reg: 0.3070 instance_segmentation_loss_poly: 0.8034 +2024/01/13 18:11:54 - mmengine - INFO - Saving checkpoint at 626000 iterations +2024/01/13 18:24:54 - mmengine - INFO - Iter(train) [626500/640000] base_lr: 2.2173e-06 lr: 2.0198e-06 eta: 5:32:58 time: 1.5019 data_time: 0.0285 memory: 25719 grad_norm: 3.7126 loss: 1.0945 detection_loss_cls: 0.0238 detection_loss_reg: 0.3097 caption_loss_cls: 1.9037 grounding_loss_reg: 2.0038 semantic_segmentation_loss_cls: 0.0064 instance_segmentation_loss_cls: 0.0236 instance_segmentation_loss_reg: 0.3067 instance_segmentation_loss_poly: 0.8029 +2024/01/13 18:36:29 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240113_050346 +2024/01/13 18:36:29 - mmengine - INFO - Iter(train) [627000/640000] base_lr: 2.2015e-06 lr: 2.0183e-06 eta: 5:20:19 time: 1.4833 data_time: 0.0282 memory: 25719 grad_norm: 3.7922 loss: 1.1038 detection_loss_cls: 0.0238 detection_loss_reg: 0.3095 caption_loss_cls: 1.9082 grounding_loss_reg: 2.0057 semantic_segmentation_loss_cls: 0.0065 instance_segmentation_loss_cls: 0.0236 instance_segmentation_loss_reg: 0.3070 instance_segmentation_loss_poly: 0.8034 +2024/01/13 18:48:30 - mmengine - INFO - Iter(train) [627500/640000] base_lr: 2.1863e-06 lr: 2.0169e-06 eta: 5:07:52 time: 1.4624 data_time: 0.0278 memory: 25719 grad_norm: 3.8280 loss: 1.1084 detection_loss_cls: 0.0235 detection_loss_reg: 0.3071 caption_loss_cls: 1.9119 grounding_loss_reg: 2.0069 semantic_segmentation_loss_cls: 0.0065 instance_segmentation_loss_cls: 0.0234 instance_segmentation_loss_reg: 0.3055 instance_segmentation_loss_poly: 0.8000 +2024/01/13 19:00:14 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240113_050346 +2024/01/13 19:00:14 - mmengine - INFO - Iter(train) [628000/640000] base_lr: 2.1717e-06 lr: 2.0156e-06 eta: 4:55:20 time: 1.4590 data_time: 0.0278 memory: 25719 grad_norm: 3.8759 loss: 1.1062 detection_loss_cls: 0.0237 detection_loss_reg: 0.3078 caption_loss_cls: 1.9106 grounding_loss_reg: 2.0074 semantic_segmentation_loss_cls: 0.0064 instance_segmentation_loss_cls: 0.0234 instance_segmentation_loss_reg: 0.3052 instance_segmentation_loss_poly: 0.7995 +2024/01/13 19:00:14 - mmengine - INFO - Saving checkpoint at 628000 iterations +2024/01/13 19:12:10 - mmengine - INFO - Iter(train) [628500/640000] base_lr: 2.1577e-06 lr: 2.0143e-06 eta: 4:42:54 time: 1.4510 data_time: 0.0275 memory: 25719 grad_norm: 3.9149 loss: 1.1001 detection_loss_cls: 0.0238 detection_loss_reg: 0.3091 caption_loss_cls: 1.9143 grounding_loss_reg: 2.0056 semantic_segmentation_loss_cls: 0.0065 instance_segmentation_loss_cls: 0.0235 instance_segmentation_loss_reg: 0.3067 instance_segmentation_loss_poly: 0.8030 +2024/01/13 19:24:06 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240113_050346 +2024/01/13 19:24:06 - mmengine - INFO - Iter(train) [629000/640000] base_lr: 2.1443e-06 lr: 2.0131e-06 eta: 4:30:28 time: 1.4424 data_time: 0.0273 memory: 25719 grad_norm: 4.0448 loss: 1.1029 detection_loss_cls: 0.0239 detection_loss_reg: 0.3090 caption_loss_cls: 1.9099 grounding_loss_reg: 2.0050 semantic_segmentation_loss_cls: 0.0065 instance_segmentation_loss_cls: 0.0235 instance_segmentation_loss_reg: 0.3064 instance_segmentation_loss_poly: 0.8026 +2024/01/13 19:36:09 - mmengine - INFO - Iter(train) [629500/640000] base_lr: 2.1315e-06 lr: 2.0120e-06 eta: 4:18:05 time: 1.4420 data_time: 0.0273 memory: 25719 grad_norm: 4.0747 loss: 1.0928 detection_loss_cls: 0.0238 detection_loss_reg: 0.3092 caption_loss_cls: 1.9100 grounding_loss_reg: 2.0041 semantic_segmentation_loss_cls: 0.0065 instance_segmentation_loss_cls: 0.0236 instance_segmentation_loss_reg: 0.3067 instance_segmentation_loss_poly: 0.8035 +2024/01/13 19:48:31 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240113_050346 +2024/01/13 19:48:31 - mmengine - INFO - Iter(train) [630000/640000] base_lr: 2.1193e-06 lr: 2.0108e-06 eta: 4:05:49 time: 1.4482 data_time: 0.0272 memory: 25719 grad_norm: 4.0308 loss: 1.0848 detection_loss_cls: 0.0239 detection_loss_reg: 0.3096 caption_loss_cls: 1.9097 grounding_loss_reg: 2.0047 semantic_segmentation_loss_cls: 0.0065 instance_segmentation_loss_cls: 0.0236 instance_segmentation_loss_reg: 0.3072 instance_segmentation_loss_poly: 0.8039 +2024/01/13 19:48:31 - mmengine - INFO - Saving checkpoint at 630000 iterations +2024/01/13 20:01:02 - mmengine - INFO - Iter(train) [630500/640000] base_lr: 2.1076e-06 lr: 2.0098e-06 eta: 3:53:35 time: 1.4410 data_time: 0.0271 memory: 25719 grad_norm: 4.0135 loss: 1.0887 detection_loss_cls: 0.0239 detection_loss_reg: 0.3093 caption_loss_cls: 1.9069 grounding_loss_reg: 2.0060 semantic_segmentation_loss_cls: 0.0065 instance_segmentation_loss_cls: 0.0236 instance_segmentation_loss_reg: 0.3077 instance_segmentation_loss_poly: 0.8051 +2024/01/13 20:13:28 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240113_050346 +2024/01/13 20:13:28 - mmengine - INFO - Iter(train) [631000/640000] base_lr: 2.0966e-06 lr: 2.0088e-06 eta: 3:41:20 time: 1.4538 data_time: 0.0273 memory: 25719 grad_norm: 3.9915 loss: 1.0736 detection_loss_cls: 0.0240 detection_loss_reg: 0.3100 caption_loss_cls: 1.9108 grounding_loss_reg: 2.0032 semantic_segmentation_loss_cls: 0.0065 instance_segmentation_loss_cls: 0.0235 instance_segmentation_loss_reg: 0.3069 instance_segmentation_loss_poly: 0.8047 +2024/01/13 20:26:50 - mmengine - INFO - Iter(train) [631500/640000] base_lr: 2.0862e-06 lr: 2.0078e-06 eta: 3:29:17 time: 1.4738 data_time: 0.0276 memory: 25719 grad_norm: 3.9437 loss: 1.0674 detection_loss_cls: 0.0240 detection_loss_reg: 0.3097 caption_loss_cls: 1.9103 grounding_loss_reg: 2.0026 semantic_segmentation_loss_cls: 0.0065 instance_segmentation_loss_cls: 0.0234 instance_segmentation_loss_reg: 0.3054 instance_segmentation_loss_poly: 0.8025 +2024/01/13 20:39:38 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240113_050346 +2024/01/13 20:39:38 - mmengine - INFO - Iter(train) [632000/640000] base_lr: 2.0763e-06 lr: 2.0069e-06 eta: 3:17:05 time: 1.4900 data_time: 0.0278 memory: 25719 grad_norm: 3.8654 loss: 1.0557 detection_loss_cls: 0.0239 detection_loss_reg: 0.3093 caption_loss_cls: 1.9097 grounding_loss_reg: 2.0001 semantic_segmentation_loss_cls: 0.0065 instance_segmentation_loss_cls: 0.0235 instance_segmentation_loss_reg: 0.3055 instance_segmentation_loss_poly: 0.8024 +2024/01/13 20:39:38 - mmengine - INFO - Saving checkpoint at 632000 iterations +2024/01/13 20:51:42 - mmengine - INFO - Iter(train) [632500/640000] base_lr: 2.0671e-06 lr: 2.0061e-06 eta: 3:04:43 time: 1.4917 data_time: 0.0278 memory: 25719 grad_norm: 3.8525 loss: 1.0532 detection_loss_cls: 0.0240 detection_loss_reg: 0.3105 caption_loss_cls: 1.9074 grounding_loss_reg: 1.9998 semantic_segmentation_loss_cls: 0.0065 instance_segmentation_loss_cls: 0.0234 instance_segmentation_loss_reg: 0.3061 instance_segmentation_loss_poly: 0.8031 +2024/01/13 21:03:43 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240113_050346 +2024/01/13 21:03:43 - mmengine - INFO - Iter(train) [633000/640000] base_lr: 2.0585e-06 lr: 2.0053e-06 eta: 2:52:20 time: 1.4931 data_time: 0.0278 memory: 25719 grad_norm: 3.7811 loss: 1.0539 detection_loss_cls: 0.0241 detection_loss_reg: 0.3105 caption_loss_cls: 1.9045 grounding_loss_reg: 1.9977 semantic_segmentation_loss_cls: 0.0065 instance_segmentation_loss_cls: 0.0236 instance_segmentation_loss_reg: 0.3069 instance_segmentation_loss_poly: 0.8051 +2024/01/13 21:16:12 - mmengine - INFO - Iter(train) [633500/640000] base_lr: 2.0504e-06 lr: 2.0046e-06 eta: 2:40:03 time: 1.4998 data_time: 0.0279 memory: 25719 grad_norm: 3.7336 loss: 1.0527 detection_loss_cls: 0.0241 detection_loss_reg: 0.3108 caption_loss_cls: 1.9052 grounding_loss_reg: 1.9976 semantic_segmentation_loss_cls: 0.0064 instance_segmentation_loss_cls: 0.0236 instance_segmentation_loss_reg: 0.3072 instance_segmentation_loss_poly: 0.8056 +2024/01/13 21:28:14 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240113_050346 +2024/01/13 21:28:14 - mmengine - INFO - Iter(train) [634000/640000] base_lr: 2.0429e-06 lr: 2.0039e-06 eta: 2:27:42 time: 1.4947 data_time: 0.0280 memory: 25719 grad_norm: 3.7881 loss: 1.0657 detection_loss_cls: 0.0241 detection_loss_reg: 0.3104 caption_loss_cls: 1.9064 grounding_loss_reg: 1.9964 semantic_segmentation_loss_cls: 0.0064 instance_segmentation_loss_cls: 0.0236 instance_segmentation_loss_reg: 0.3070 instance_segmentation_loss_poly: 0.8052 +2024/01/13 21:28:14 - mmengine - INFO - Saving checkpoint at 634000 iterations +2024/01/13 21:41:24 - mmengine - INFO - Iter(train) [634500/640000] base_lr: 2.0361e-06 lr: 2.0033e-06 eta: 2:15:30 time: 1.5043 data_time: 0.0282 memory: 25719 grad_norm: 3.7616 loss: 1.0629 detection_loss_cls: 0.0241 detection_loss_reg: 0.3111 caption_loss_cls: 1.9022 grounding_loss_reg: 1.9961 semantic_segmentation_loss_cls: 0.0064 instance_segmentation_loss_cls: 0.0237 instance_segmentation_loss_reg: 0.3076 instance_segmentation_loss_poly: 0.8069 +2024/01/13 21:53:40 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240113_050346 +2024/01/13 21:53:40 - mmengine - INFO - Iter(train) [635000/640000] base_lr: 2.0298e-06 lr: 2.0027e-06 eta: 2:03:11 time: 1.5017 data_time: 0.0282 memory: 25719 grad_norm: 3.7522 loss: 1.0684 detection_loss_cls: 0.0240 detection_loss_reg: 0.3103 caption_loss_cls: 1.9035 grounding_loss_reg: 1.9942 semantic_segmentation_loss_cls: 0.0064 instance_segmentation_loss_cls: 0.0237 instance_segmentation_loss_reg: 0.3075 instance_segmentation_loss_poly: 0.8069 +2024/01/13 22:06:00 - mmengine - INFO - Iter(train) [635500/640000] base_lr: 2.0242e-06 lr: 2.0022e-06 eta: 1:50:52 time: 1.4865 data_time: 0.0279 memory: 25719 grad_norm: 3.7791 loss: 1.0704 detection_loss_cls: 0.0241 detection_loss_reg: 0.3115 caption_loss_cls: 1.9052 grounding_loss_reg: 1.9939 semantic_segmentation_loss_cls: 0.0064 instance_segmentation_loss_cls: 0.0239 instance_segmentation_loss_reg: 0.3086 instance_segmentation_loss_poly: 0.8095 +2024/01/13 22:18:42 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240113_050346 +2024/01/13 22:18:42 - mmengine - INFO - Iter(train) [636000/640000] base_lr: 2.0191e-06 lr: 2.0017e-06 eta: 1:38:35 time: 1.4848 data_time: 0.0278 memory: 25719 grad_norm: 3.7537 loss: 1.0735 detection_loss_cls: 0.0241 detection_loss_reg: 0.3109 caption_loss_cls: 1.9100 grounding_loss_reg: 1.9942 semantic_segmentation_loss_cls: 0.0064 instance_segmentation_loss_cls: 0.0239 instance_segmentation_loss_reg: 0.3086 instance_segmentation_loss_poly: 0.8095 +2024/01/13 22:18:42 - mmengine - INFO - Saving checkpoint at 636000 iterations +2024/01/13 22:31:41 - mmengine - INFO - Iter(train) [636500/640000] base_lr: 2.0146e-06 lr: 2.0013e-06 eta: 1:26:19 time: 1.4987 data_time: 0.0281 memory: 25719 grad_norm: 3.7012 loss: 1.0694 detection_loss_cls: 0.0240 detection_loss_reg: 0.3110 caption_loss_cls: 1.9138 grounding_loss_reg: 1.9945 semantic_segmentation_loss_cls: 0.0064 instance_segmentation_loss_cls: 0.0239 instance_segmentation_loss_reg: 0.3079 instance_segmentation_loss_poly: 0.8082 +2024/01/13 22:44:25 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240113_050346 +2024/01/13 22:44:25 - mmengine - INFO - Iter(train) [637000/640000] base_lr: 2.0107e-06 lr: 2.0010e-06 eta: 1:14:01 time: 1.5093 data_time: 0.0281 memory: 25719 grad_norm: 3.6085 loss: 1.0594 detection_loss_cls: 0.0240 detection_loss_reg: 0.3112 caption_loss_cls: 1.9133 grounding_loss_reg: 1.9967 semantic_segmentation_loss_cls: 0.0064 instance_segmentation_loss_cls: 0.0239 instance_segmentation_loss_reg: 0.3079 instance_segmentation_loss_poly: 0.8083 +2024/01/13 22:56:39 - mmengine - INFO - Iter(train) [637500/640000] base_lr: 2.0075e-06 lr: 2.0007e-06 eta: 1:01:40 time: 1.5056 data_time: 0.0281 memory: 25719 grad_norm: 3.6377 loss: 1.0635 detection_loss_cls: 0.0240 detection_loss_reg: 0.3105 caption_loss_cls: 1.9165 grounding_loss_reg: 1.9925 semantic_segmentation_loss_cls: 0.0064 instance_segmentation_loss_cls: 0.0237 instance_segmentation_loss_reg: 0.3065 instance_segmentation_loss_poly: 0.8048 +2024/01/13 23:08:59 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240113_050346 +2024/01/13 23:08:59 - mmengine - INFO - Iter(train) [638000/640000] base_lr: 2.0048e-06 lr: 2.0004e-06 eta: 0:49:20 time: 1.5102 data_time: 0.0281 memory: 25719 grad_norm: 3.6159 loss: 1.0516 detection_loss_cls: 0.0240 detection_loss_reg: 0.3100 caption_loss_cls: 1.9175 grounding_loss_reg: 1.9915 semantic_segmentation_loss_cls: 0.0064 instance_segmentation_loss_cls: 0.0238 instance_segmentation_loss_reg: 0.3063 instance_segmentation_loss_poly: 0.8036 +2024/01/13 23:08:59 - mmengine - INFO - Saving checkpoint at 638000 iterations +2024/01/13 23:21:53 - mmengine - INFO - Iter(train) [638500/640000] base_lr: 2.0027e-06 lr: 2.0002e-06 eta: 0:37:01 time: 1.5062 data_time: 0.0280 memory: 25719 grad_norm: 3.6541 loss: 1.0493 detection_loss_cls: 0.0240 detection_loss_reg: 0.3103 caption_loss_cls: 1.9158 grounding_loss_reg: 1.9891 semantic_segmentation_loss_cls: 0.0065 instance_segmentation_loss_cls: 0.0239 instance_segmentation_loss_reg: 0.3080 instance_segmentation_loss_poly: 0.8073 +2024/01/13 23:34:08 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240113_050346 +2024/01/13 23:34:08 - mmengine - INFO - Iter(train) [639000/640000] base_lr: 2.0012e-06 lr: 2.0001e-06 eta: 0:24:40 time: 1.5059 data_time: 0.0280 memory: 25719 grad_norm: 3.6770 loss: 1.0433 detection_loss_cls: 0.0240 detection_loss_reg: 0.3110 caption_loss_cls: 1.9123 grounding_loss_reg: 1.9893 semantic_segmentation_loss_cls: 0.0065 instance_segmentation_loss_cls: 0.0239 instance_segmentation_loss_reg: 0.3079 instance_segmentation_loss_poly: 0.8072 +2024/01/13 23:46:43 - mmengine - INFO - Iter(train) [639500/640000] base_lr: 2.0003e-06 lr: 2.0000e-06 eta: 0:12:20 time: 1.5095 data_time: 0.0281 memory: 25719 grad_norm: 3.6955 loss: 1.0439 detection_loss_cls: 0.0240 detection_loss_reg: 0.3113 caption_loss_cls: 1.9134 grounding_loss_reg: 1.9868 semantic_segmentation_loss_cls: 0.0064 instance_segmentation_loss_cls: 0.0239 instance_segmentation_loss_reg: 0.3081 instance_segmentation_loss_poly: 0.8076 +2024/01/13 23:58:30 - mmengine - INFO - Exp name: univision_joint_5_cosine_filteranno_64witer_1120_text_fixbug_final_large_dpr0p4_20240113_050346 +2024/01/13 23:58:30 - mmengine - INFO - Iter(train) [640000/640000] base_lr: 2.0000e-06 lr: 2.0000e-06 eta: 0:00:00 time: 1.4961 data_time: 0.0280 memory: 25719 grad_norm: 3.8123 loss: 1.0586 detection_loss_cls: 0.0241 detection_loss_reg: 0.3119 caption_loss_cls: 1.9131 grounding_loss_reg: 1.9838 semantic_segmentation_loss_cls: 0.0064 instance_segmentation_loss_cls: 0.0239 instance_segmentation_loss_reg: 0.3082 instance_segmentation_loss_poly: 0.8075 +2024/01/13 23:58:30 - mmengine - INFO - Saving checkpoint at 640000 iterations +2024/01/14 00:11:26 - mmengine - INFO - Evaluating bbox... +2024/01/14 00:12:23 - mmengine - INFO - bbox_mAP_copypaste: 0.513 0.692 0.559 0.351 0.561 0.652 +2024/01/14 00:12:23 - mmengine - INFO - Evaluating segm... +2024/01/14 00:13:34 - mmengine - INFO - segm_mAP_copypaste: 0.351 0.614 0.347 0.200 0.395 0.533 +2024/01/14 00:21:18 - mmengine - INFO - per class results: +2024/01/14 00:21:18 - mmengine - INFO - ++---------------------+-------+-------+ +| Class | IoU | Acc | ++---------------------+-------+-------+ +| wall | 78.72 | 89.72 | +| building | 83.27 | 92.1 | +| sky | 93.33 | 97.74 | +| floor | 83.05 | 91.15 | +| tree | 73.84 | 86.85 | +| ceiling | 85.28 | 93.99 | +| road | 83.58 | 88.94 | +| bed | 90.7 | 95.85 | +| windowpane | 64.51 | 80.4 | +| grass | 65.59 | 83.23 | +| cabinet | 64.49 | 77.08 | +| sidewalk | 66.87 | 82.37 | +| person | 81.64 | 91.73 | +| earth | 40.91 | 52.89 | +| door | 55.12 | 68.33 | +| table | 67.4 | 80.26 | +| mountain | 61.5 | 72.45 | +| plant | 51.37 | 62.45 | +| curtain | 75.16 | 86.98 | +| chair | 61.12 | 74.34 | +| car | 84.91 | 92.12 | +| water | 56.89 | 71.75 | +| painting | 72.47 | 86.82 | +| sofa | 70.91 | 83.97 | +| shelf | 46.47 | 64.51 | +| house | 49.31 | 67.87 | +| sea | 57.2 | 72.92 | +| mirror | 70.16 | 78.4 | +| rug | 67.8 | 78.1 | +| field | 30.47 | 48.08 | +| armchair | 48.32 | 65.86 | +| seat | 63.26 | 82.12 | +| fence | 47.23 | 68.37 | +| desk | 50.4 | 70.39 | +| rock | 47.43 | 70.92 | +| wardrobe | 53.82 | 66.55 | +| lamp | 64.3 | 75.95 | +| bathtub | 80.49 | 84.29 | +| railing | 37.9 | 52.79 | +| cushion | 63.2 | 74.31 | +| base | 23.6 | 31.55 | +| box | 27.79 | 36.43 | +| column | 53.54 | 64.4 | +| signboard | 37.71 | 52.66 | +| chest of drawers | 39.54 | 60.48 | +| counter | 26.2 | 36.62 | +| sand | 49.69 | 69.57 | +| sink | 76.48 | 83.05 | +| skyscraper | 60.93 | 76.13 | +| fireplace | 79.63 | 90.1 | +| refrigerator | 73.71 | 81.24 | +| grandstand | 38.63 | 77.82 | +| path | 24.66 | 39.0 | +| stairs | 27.08 | 32.32 | +| runway | 67.93 | 86.84 | +| case | 52.06 | 69.73 | +| pool table | 88.5 | 97.01 | +| pillow | 60.29 | 72.26 | +| screen door | 75.92 | 83.96 | +| stairway | 31.74 | 45.93 | +| river | 13.79 | 31.22 | +| bridge | 57.45 | 73.78 | +| bookcase | 39.38 | 61.9 | +| blind | 41.06 | 45.79 | +| coffee table | 68.73 | 84.2 | +| toilet | 87.54 | 91.51 | +| flower | 39.58 | 51.83 | +| book | 52.58 | 69.59 | +| hill | 12.56 | 21.32 | +| bench | 59.03 | 67.45 | +| countertop | 62.72 | 76.51 | +| stove | 77.57 | 85.45 | +| palm | 46.94 | 63.29 | +| kitchen island | 46.59 | 80.55 | +| computer | 76.5 | 86.87 | +| swivel chair | 40.64 | 55.15 | +| boat | 67.16 | 72.04 | +| bar | 32.94 | 43.62 | +| arcade machine | 58.42 | 63.73 | +| hovel | 20.88 | 23.78 | +| bus | 92.89 | 95.76 | +| towel | 64.58 | 79.3 | +| light | 53.1 | 62.75 | +| truck | 42.11 | 58.67 | +| tower | 20.28 | 32.49 | +| chandelier | 64.67 | 77.77 | +| awning | 36.14 | 42.16 | +| streetlight | 34.04 | 45.33 | +| booth | 36.21 | 42.18 | +| television receiver | 71.01 | 83.46 | +| airplane | 62.16 | 79.61 | +| dirt track | 17.14 | 20.84 | +| apparel | 32.09 | 43.48 | +| pole | 28.32 | 41.31 | +| land | 2.54 | 4.09 | +| bannister | 17.63 | 22.84 | +| escalator | 21.37 | 22.33 | +| ottoman | 48.4 | 61.53 | +| bottle | 22.94 | 28.17 | +| buffet | 39.35 | 48.53 | +| poster | 33.9 | 41.73 | +| stage | 11.44 | 20.34 | +| van | 45.93 | 59.24 | +| ship | 36.5 | 44.84 | +| fountain | 22.21 | 22.57 | +| conveyer belt | 76.35 | 91.13 | +| canopy | 23.73 | 27.23 | +| washer | 71.63 | 72.3 | +| plaything | 27.36 | 31.09 | +| swimming pool | 69.01 | 72.91 | +| stool | 49.58 | 63.68 | +| barrel | 21.06 | 68.01 | +| basket | 29.4 | 46.97 | +| waterfall | 54.17 | 72.68 | +| tent | 62.92 | 96.83 | +| bag | 23.83 | 30.33 | +| minibike | 73.64 | 83.81 | +| cradle | 74.13 | 96.07 | +| oven | 57.67 | 75.57 | +| ball | 52.94 | 68.94 | +| food | 53.64 | 59.23 | +| step | 14.69 | 20.04 | +| tank | 35.85 | 47.39 | +| trade name | 26.59 | 31.28 | +| microwave | 84.8 | 92.0 | +| pot | 50.48 | 58.38 | +| animal | 58.05 | 61.65 | +| bicycle | 58.47 | 74.66 | +| lake | 57.61 | 63.69 | +| dishwasher | 59.28 | 70.51 | +| screen | 51.57 | 72.11 | +| blanket | 17.46 | 20.33 | +| sculpture | 59.33 | 70.28 | +| hood | 61.04 | 69.06 | +| sconce | 44.03 | 52.81 | +| vase | 47.69 | 60.95 | +| traffic light | 40.57 | 59.48 | +| tray | 8.13 | 14.02 | +| ashcan | 43.91 | 55.8 | +| fan | 60.23 | 70.67 | +| pier | 32.34 | 68.19 | +| crt screen | 10.2 | 18.14 | +| plate | 56.34 | 74.18 | +| monitor | 40.79 | 46.39 | +| bulletin board | 45.53 | 57.45 | +| shower | 2.48 | 3.6 | +| radiator | 56.74 | 63.16 | +| glass | 20.33 | 22.22 | +| clock | 27.02 | 32.15 | +| flag | 34.04 | 39.52 | ++---------------------+-------+-------+ +2024/01/14 00:21:35 - mmengine - INFO - Iter(val) [209/209] coco/bbox_mAP: 0.5130 coco/bbox_mAP_50: 0.6920 coco/bbox_mAP_75: 0.5590 coco/bbox_mAP_s: 0.3510 coco/bbox_mAP_m: 0.5610 coco/bbox_mAP_l: 0.6520 coco/segm_mAP: 0.3510 coco/segm_mAP_50: 0.6140 coco/segm_mAP_75: 0.3470 coco/segm_mAP_s: 0.2000 coco/segm_mAP_m: 0.3950 coco/segm_mAP_l: 0.5330 Bleu_1: 0.7709 Bleu_2: 0.6105 Bleu_3: 0.4702 Bleu_4: 0.3587 METEOR: 0.2798 ROUGE_L: 0.5696 CIDEr: 1.1598 SPICE: 0.2087 aAcc: 84.0300 mIoU: 50.6100 mAcc: 62.4700 visual-grounding/miou: 0.8276 visual-grounding/acc: 0.8844 data_time: 0.0042 time: 1.3604