diff --git "a/training.log" "b/training.log" new file mode 100644--- /dev/null +++ "b/training.log" @@ -0,0 +1,2187 @@ +2023-04-05 11:55:52,514 ---------------------------------------------------------------------------------------------------- +2023-04-05 11:55:52,514 Model: "SequenceTagger( + (embeddings): StackedEmbeddings( + (list_embedding_0): WordEmbeddings( + 'en-crawl' + (embedding): Embedding(1000001, 300) + ) + (list_embedding_1): FlairEmbeddings( + (lm): LanguageModel( + (drop): Dropout(p=0.25, inplace=False) + (encoder): Embedding(275, 100) + (rnn): LSTM(100, 1024) + ) + ) + (list_embedding_2): FlairEmbeddings( + (lm): LanguageModel( + (drop): Dropout(p=0.25, inplace=False) + (encoder): Embedding(275, 100) + (rnn): LSTM(100, 1024) + ) + ) + ) + (word_dropout): WordDropout(p=0.05) + (locked_dropout): LockedDropout(p=0.5) + (embedding2nn): Linear(in_features=2348, out_features=2348, bias=True) + (rnn): LSTM(2348, 256, batch_first=True, bidirectional=True) + (linear): Linear(in_features=512, out_features=75, bias=True) + (loss_function): ViterbiLoss() + (crf): CRF() +)" +2023-04-05 11:55:52,514 ---------------------------------------------------------------------------------------------------- +2023-04-05 11:55:52,514 Corpus: "Corpus: 75187 train + 9603 dev + 9479 test sentences" +2023-04-05 11:55:52,514 ---------------------------------------------------------------------------------------------------- +2023-04-05 11:55:52,514 Parameters: +2023-04-05 11:55:52,514 - learning_rate: "0.100000" +2023-04-05 11:55:52,514 - mini_batch_size: "32" +2023-04-05 11:55:52,514 - patience: "3" +2023-04-05 11:55:52,514 - anneal_factor: "0.5" +2023-04-05 11:55:52,514 - max_epochs: "150" +2023-04-05 11:55:52,514 - shuffle: "True" +2023-04-05 11:55:52,514 - train_with_dev: "True" +2023-04-05 11:55:52,514 - batch_growth_annealing: "False" +2023-04-05 11:55:52,514 ---------------------------------------------------------------------------------------------------- +2023-04-05 11:55:52,514 Model training base path: "resources/taggers/release-ner-ontonotes-fast-0" +2023-04-05 11:55:52,514 ---------------------------------------------------------------------------------------------------- +2023-04-05 11:55:52,514 Device: cuda:1 +2023-04-05 11:55:52,514 ---------------------------------------------------------------------------------------------------- +2023-04-05 11:55:52,514 Embeddings storage mode: cpu +2023-04-05 11:55:52,514 ---------------------------------------------------------------------------------------------------- +2023-04-05 11:56:04,727 epoch 1 - iter 265/2650 - loss 0.23382084 - time (sec): 12.21 - samples/sec: 4964.59 - lr: 0.100000 +2023-04-05 11:56:29,457 epoch 1 - iter 530/2650 - loss 0.25783822 - time (sec): 36.94 - samples/sec: 5871.52 - lr: 0.100000 +2023-04-05 11:57:01,478 epoch 1 - iter 795/2650 - loss 0.23239070 - time (sec): 68.96 - samples/sec: 5698.31 - lr: 0.100000 +2023-04-05 11:57:28,868 epoch 1 - iter 1060/2650 - loss 0.21704976 - time (sec): 96.35 - samples/sec: 5713.75 - lr: 0.100000 +2023-04-05 11:57:47,016 epoch 1 - iter 1325/2650 - loss 0.17966939 - time (sec): 114.50 - samples/sec: 5855.33 - lr: 0.100000 +2023-04-05 11:58:08,819 epoch 1 - iter 1590/2650 - loss 0.16237454 - time (sec): 136.30 - samples/sec: 5945.77 - lr: 0.100000 +2023-04-05 11:58:53,164 epoch 1 - iter 1855/2650 - loss 0.16467915 - time (sec): 180.65 - samples/sec: 5675.19 - lr: 0.100000 +2023-04-05 11:59:18,620 epoch 1 - iter 2120/2650 - loss 0.16005373 - time (sec): 206.11 - samples/sec: 5807.58 - lr: 0.100000 +2023-04-05 11:59:38,716 epoch 1 - iter 2385/2650 - loss 0.15574297 - time (sec): 226.20 - samples/sec: 5776.53 - lr: 0.100000 +2023-04-05 12:00:03,859 epoch 1 - iter 2650/2650 - loss 0.15274049 - time (sec): 251.34 - samples/sec: 5818.17 - lr: 0.100000 +2023-04-05 12:00:03,859 ---------------------------------------------------------------------------------------------------- +2023-04-05 12:00:03,859 EPOCH 1 done: loss 0.1527 - lr 0.100000 +2023-04-05 12:00:03,859 BAD EPOCHS (no improvement): 0 +2023-04-05 12:00:03,862 ---------------------------------------------------------------------------------------------------- +2023-04-05 12:00:22,302 epoch 2 - iter 265/2650 - loss 0.11230987 - time (sec): 18.44 - samples/sec: 7930.04 - lr: 0.100000 +2023-04-05 12:00:40,755 epoch 2 - iter 530/2650 - loss 0.11000664 - time (sec): 36.89 - samples/sec: 7928.22 - lr: 0.100000 +2023-04-05 12:00:58,953 epoch 2 - iter 795/2650 - loss 0.10590899 - time (sec): 55.09 - samples/sec: 7962.22 - lr: 0.100000 +2023-04-05 12:01:17,011 epoch 2 - iter 1060/2650 - loss 0.10456016 - time (sec): 73.15 - samples/sec: 8006.86 - lr: 0.100000 +2023-04-05 12:01:35,307 epoch 2 - iter 1325/2650 - loss 0.10299613 - time (sec): 91.45 - samples/sec: 7998.49 - lr: 0.100000 +2023-04-05 12:01:53,010 epoch 2 - iter 1590/2650 - loss 0.10234779 - time (sec): 109.15 - samples/sec: 8036.01 - lr: 0.100000 +2023-04-05 12:02:11,169 epoch 2 - iter 1855/2650 - loss 0.10092398 - time (sec): 127.31 - samples/sec: 8033.53 - lr: 0.100000 +2023-04-05 12:02:29,735 epoch 2 - iter 2120/2650 - loss 0.09967544 - time (sec): 145.87 - samples/sec: 8017.43 - lr: 0.100000 +2023-04-05 12:02:47,627 epoch 2 - iter 2385/2650 - loss 0.09833540 - time (sec): 163.76 - samples/sec: 8034.08 - lr: 0.100000 +2023-04-05 12:03:06,117 epoch 2 - iter 2650/2650 - loss 0.09679572 - time (sec): 182.26 - samples/sec: 8023.70 - lr: 0.100000 +2023-04-05 12:03:06,118 ---------------------------------------------------------------------------------------------------- +2023-04-05 12:03:06,118 EPOCH 2 done: loss 0.0968 - lr 0.100000 +2023-04-05 12:03:06,118 BAD EPOCHS (no improvement): 0 +2023-04-05 12:03:06,122 ---------------------------------------------------------------------------------------------------- +2023-04-05 12:03:24,046 epoch 3 - iter 265/2650 - loss 0.08025058 - time (sec): 17.92 - samples/sec: 8120.22 - lr: 0.100000 +2023-04-05 12:03:42,172 epoch 3 - iter 530/2650 - loss 0.08058853 - time (sec): 36.05 - samples/sec: 8103.13 - lr: 0.100000 +2023-04-05 12:04:00,169 epoch 3 - iter 795/2650 - loss 0.08007842 - time (sec): 54.05 - samples/sec: 8111.93 - lr: 0.100000 +2023-04-05 12:04:18,593 epoch 3 - iter 1060/2650 - loss 0.07989288 - time (sec): 72.47 - samples/sec: 8098.01 - lr: 0.100000 +2023-04-05 12:04:37,220 epoch 3 - iter 1325/2650 - loss 0.07930660 - time (sec): 91.10 - samples/sec: 8065.14 - lr: 0.100000 +2023-04-05 12:04:54,804 epoch 3 - iter 1590/2650 - loss 0.07944105 - time (sec): 108.68 - samples/sec: 8093.83 - lr: 0.100000 +2023-04-05 12:05:12,398 epoch 3 - iter 1855/2650 - loss 0.07925325 - time (sec): 126.28 - samples/sec: 8107.21 - lr: 0.100000 +2023-04-05 12:05:31,140 epoch 3 - iter 2120/2650 - loss 0.07934683 - time (sec): 145.02 - samples/sec: 8073.32 - lr: 0.100000 +2023-04-05 12:05:49,207 epoch 3 - iter 2385/2650 - loss 0.07877380 - time (sec): 163.09 - samples/sec: 8074.20 - lr: 0.100000 +2023-04-05 12:06:07,574 epoch 3 - iter 2650/2650 - loss 0.07837080 - time (sec): 181.45 - samples/sec: 8059.19 - lr: 0.100000 +2023-04-05 12:06:07,575 ---------------------------------------------------------------------------------------------------- +2023-04-05 12:06:07,575 EPOCH 3 done: loss 0.0784 - lr 0.100000 +2023-04-05 12:06:07,575 BAD EPOCHS (no improvement): 0 +2023-04-05 12:06:07,578 ---------------------------------------------------------------------------------------------------- +2023-04-05 12:06:25,795 epoch 4 - iter 265/2650 - loss 0.07049225 - time (sec): 18.22 - samples/sec: 8071.06 - lr: 0.100000 +2023-04-05 12:06:44,220 epoch 4 - iter 530/2650 - loss 0.06976328 - time (sec): 36.64 - samples/sec: 8003.98 - lr: 0.100000 +2023-04-05 12:07:02,807 epoch 4 - iter 795/2650 - loss 0.06991982 - time (sec): 55.23 - samples/sec: 7989.04 - lr: 0.100000 +2023-04-05 12:07:20,854 epoch 4 - iter 1060/2650 - loss 0.06998252 - time (sec): 73.28 - samples/sec: 8014.19 - lr: 0.100000 +2023-04-05 12:07:39,283 epoch 4 - iter 1325/2650 - loss 0.07016229 - time (sec): 91.70 - samples/sec: 7986.90 - lr: 0.100000 +2023-04-05 12:07:57,510 epoch 4 - iter 1590/2650 - loss 0.06961714 - time (sec): 109.93 - samples/sec: 7986.38 - lr: 0.100000 +2023-04-05 12:08:15,480 epoch 4 - iter 1855/2650 - loss 0.06951484 - time (sec): 127.90 - samples/sec: 7998.26 - lr: 0.100000 +2023-04-05 12:08:34,087 epoch 4 - iter 2120/2650 - loss 0.06941234 - time (sec): 146.51 - samples/sec: 7983.38 - lr: 0.100000 +2023-04-05 12:08:52,262 epoch 4 - iter 2385/2650 - loss 0.06942456 - time (sec): 164.68 - samples/sec: 7995.34 - lr: 0.100000 +2023-04-05 12:09:10,119 epoch 4 - iter 2650/2650 - loss 0.06943630 - time (sec): 182.54 - samples/sec: 8011.16 - lr: 0.100000 +2023-04-05 12:09:10,119 ---------------------------------------------------------------------------------------------------- +2023-04-05 12:09:10,119 EPOCH 4 done: loss 0.0694 - lr 0.100000 +2023-04-05 12:09:10,119 BAD EPOCHS (no improvement): 0 +2023-04-05 12:09:10,122 ---------------------------------------------------------------------------------------------------- +2023-04-05 12:09:27,818 epoch 5 - iter 265/2650 - loss 0.06246776 - time (sec): 17.70 - samples/sec: 8255.90 - lr: 0.100000 +2023-04-05 12:09:46,253 epoch 5 - iter 530/2650 - loss 0.06366999 - time (sec): 36.13 - samples/sec: 8060.63 - lr: 0.100000 +2023-04-05 12:10:04,365 epoch 5 - iter 795/2650 - loss 0.06442438 - time (sec): 54.24 - samples/sec: 8087.10 - lr: 0.100000 +2023-04-05 12:10:22,432 epoch 5 - iter 1060/2650 - loss 0.06458944 - time (sec): 72.31 - samples/sec: 8113.16 - lr: 0.100000 +2023-04-05 12:10:40,248 epoch 5 - iter 1325/2650 - loss 0.06473427 - time (sec): 90.13 - samples/sec: 8136.97 - lr: 0.100000 +2023-04-05 12:10:58,458 epoch 5 - iter 1590/2650 - loss 0.06467943 - time (sec): 108.34 - samples/sec: 8128.61 - lr: 0.100000 +2023-04-05 12:11:16,416 epoch 5 - iter 1855/2650 - loss 0.06452677 - time (sec): 126.29 - samples/sec: 8127.53 - lr: 0.100000 +2023-04-05 12:11:34,473 epoch 5 - iter 2120/2650 - loss 0.06426157 - time (sec): 144.35 - samples/sec: 8118.67 - lr: 0.100000 +2023-04-05 12:11:53,009 epoch 5 - iter 2385/2650 - loss 0.06427012 - time (sec): 162.89 - samples/sec: 8093.25 - lr: 0.100000 +2023-04-05 12:12:10,966 epoch 5 - iter 2650/2650 - loss 0.06439649 - time (sec): 180.84 - samples/sec: 8086.29 - lr: 0.100000 +2023-04-05 12:12:10,967 ---------------------------------------------------------------------------------------------------- +2023-04-05 12:12:10,967 EPOCH 5 done: loss 0.0644 - lr 0.100000 +2023-04-05 12:12:10,967 BAD EPOCHS (no improvement): 0 +2023-04-05 12:12:10,969 ---------------------------------------------------------------------------------------------------- +2023-04-05 12:12:29,066 epoch 6 - iter 265/2650 - loss 0.05790724 - time (sec): 18.10 - samples/sec: 8050.64 - lr: 0.100000 +2023-04-05 12:12:47,566 epoch 6 - iter 530/2650 - loss 0.05843085 - time (sec): 36.60 - samples/sec: 8010.58 - lr: 0.100000 +2023-04-05 12:13:06,225 epoch 6 - iter 795/2650 - loss 0.05981691 - time (sec): 55.26 - samples/sec: 7991.76 - lr: 0.100000 +2023-04-05 12:13:24,311 epoch 6 - iter 1060/2650 - loss 0.06062779 - time (sec): 73.34 - samples/sec: 8022.23 - lr: 0.100000 +2023-04-05 12:13:42,282 epoch 6 - iter 1325/2650 - loss 0.06042401 - time (sec): 91.31 - samples/sec: 8028.02 - lr: 0.100000 +2023-04-05 12:14:00,756 epoch 6 - iter 1590/2650 - loss 0.06056236 - time (sec): 109.79 - samples/sec: 8005.10 - lr: 0.100000 +2023-04-05 12:14:18,492 epoch 6 - iter 1855/2650 - loss 0.06054906 - time (sec): 127.52 - samples/sec: 8027.15 - lr: 0.100000 +2023-04-05 12:14:37,090 epoch 6 - iter 2120/2650 - loss 0.06036658 - time (sec): 146.12 - samples/sec: 8007.85 - lr: 0.100000 +2023-04-05 12:14:55,412 epoch 6 - iter 2385/2650 - loss 0.06016822 - time (sec): 164.44 - samples/sec: 8003.95 - lr: 0.100000 +2023-04-05 12:15:13,513 epoch 6 - iter 2650/2650 - loss 0.06042134 - time (sec): 182.54 - samples/sec: 8011.05 - lr: 0.100000 +2023-04-05 12:15:13,513 ---------------------------------------------------------------------------------------------------- +2023-04-05 12:15:13,513 EPOCH 6 done: loss 0.0604 - lr 0.100000 +2023-04-05 12:15:13,513 BAD EPOCHS (no improvement): 0 +2023-04-05 12:15:13,515 ---------------------------------------------------------------------------------------------------- +2023-04-05 12:15:31,592 epoch 7 - iter 265/2650 - loss 0.05944745 - time (sec): 18.08 - samples/sec: 8097.30 - lr: 0.100000 +2023-04-05 12:15:49,822 epoch 7 - iter 530/2650 - loss 0.05811368 - time (sec): 36.31 - samples/sec: 8047.47 - lr: 0.100000 +2023-04-05 12:16:08,325 epoch 7 - iter 795/2650 - loss 0.05774613 - time (sec): 54.81 - samples/sec: 8025.25 - lr: 0.100000 +2023-04-05 12:16:26,579 epoch 7 - iter 1060/2650 - loss 0.05767583 - time (sec): 73.06 - samples/sec: 8008.10 - lr: 0.100000 +2023-04-05 12:16:44,456 epoch 7 - iter 1325/2650 - loss 0.05787860 - time (sec): 90.94 - samples/sec: 8040.02 - lr: 0.100000 +2023-04-05 12:17:02,622 epoch 7 - iter 1590/2650 - loss 0.05804474 - time (sec): 109.11 - samples/sec: 8026.11 - lr: 0.100000 +2023-04-05 12:17:20,506 epoch 7 - iter 1855/2650 - loss 0.05790756 - time (sec): 126.99 - samples/sec: 8051.17 - lr: 0.100000 +2023-04-05 12:17:38,941 epoch 7 - iter 2120/2650 - loss 0.05810694 - time (sec): 145.43 - samples/sec: 8037.42 - lr: 0.100000 +2023-04-05 12:17:57,167 epoch 7 - iter 2385/2650 - loss 0.05819172 - time (sec): 163.65 - samples/sec: 8045.04 - lr: 0.100000 +2023-04-05 12:18:14,918 epoch 7 - iter 2650/2650 - loss 0.05784669 - time (sec): 181.40 - samples/sec: 8061.42 - lr: 0.100000 +2023-04-05 12:18:14,919 ---------------------------------------------------------------------------------------------------- +2023-04-05 12:18:14,919 EPOCH 7 done: loss 0.0578 - lr 0.100000 +2023-04-05 12:18:14,919 BAD EPOCHS (no improvement): 0 +2023-04-05 12:18:14,921 ---------------------------------------------------------------------------------------------------- +2023-04-05 12:18:33,369 epoch 8 - iter 265/2650 - loss 0.05657238 - time (sec): 18.45 - samples/sec: 7919.80 - lr: 0.100000 +2023-04-05 12:18:51,141 epoch 8 - iter 530/2650 - loss 0.05533394 - time (sec): 36.22 - samples/sec: 8040.86 - lr: 0.100000 +2023-04-05 12:19:09,218 epoch 8 - iter 795/2650 - loss 0.05534134 - time (sec): 54.30 - samples/sec: 8050.31 - lr: 0.100000 +2023-04-05 12:19:27,044 epoch 8 - iter 1060/2650 - loss 0.05547612 - time (sec): 72.12 - samples/sec: 8068.69 - lr: 0.100000 +2023-04-05 12:19:45,283 epoch 8 - iter 1325/2650 - loss 0.05536765 - time (sec): 90.36 - samples/sec: 8059.63 - lr: 0.100000 +2023-04-05 12:20:03,707 epoch 8 - iter 1590/2650 - loss 0.05538248 - time (sec): 108.79 - samples/sec: 8034.49 - lr: 0.100000 +2023-04-05 12:20:22,645 epoch 8 - iter 1855/2650 - loss 0.05521424 - time (sec): 127.72 - samples/sec: 7999.41 - lr: 0.100000 +2023-04-05 12:20:40,899 epoch 8 - iter 2120/2650 - loss 0.05529887 - time (sec): 145.98 - samples/sec: 8007.73 - lr: 0.100000 +2023-04-05 12:20:58,846 epoch 8 - iter 2385/2650 - loss 0.05558498 - time (sec): 163.92 - samples/sec: 8025.52 - lr: 0.100000 +2023-04-05 12:21:16,768 epoch 8 - iter 2650/2650 - loss 0.05546903 - time (sec): 181.85 - samples/sec: 8041.77 - lr: 0.100000 +2023-04-05 12:21:16,768 ---------------------------------------------------------------------------------------------------- +2023-04-05 12:21:16,768 EPOCH 8 done: loss 0.0555 - lr 0.100000 +2023-04-05 12:21:16,768 BAD EPOCHS (no improvement): 0 +2023-04-05 12:21:16,771 ---------------------------------------------------------------------------------------------------- +2023-04-05 12:21:34,413 epoch 9 - iter 265/2650 - loss 0.05514030 - time (sec): 17.64 - samples/sec: 8221.34 - lr: 0.100000 +2023-04-05 12:21:52,244 epoch 9 - iter 530/2650 - loss 0.05470129 - time (sec): 35.47 - samples/sec: 8189.50 - lr: 0.100000 +2023-04-05 12:22:10,242 epoch 9 - iter 795/2650 - loss 0.05466464 - time (sec): 53.47 - samples/sec: 8139.94 - lr: 0.100000 +2023-04-05 12:22:28,701 epoch 9 - iter 1060/2650 - loss 0.05434786 - time (sec): 71.93 - samples/sec: 8127.46 - lr: 0.100000 +2023-04-05 12:22:46,936 epoch 9 - iter 1325/2650 - loss 0.05380690 - time (sec): 90.16 - samples/sec: 8112.07 - lr: 0.100000 +2023-04-05 12:23:05,477 epoch 9 - iter 1590/2650 - loss 0.05370828 - time (sec): 108.71 - samples/sec: 8074.25 - lr: 0.100000 +2023-04-05 12:23:23,573 epoch 9 - iter 1855/2650 - loss 0.05411363 - time (sec): 126.80 - samples/sec: 8077.94 - lr: 0.100000 +2023-04-05 12:23:41,702 epoch 9 - iter 2120/2650 - loss 0.05427407 - time (sec): 144.93 - samples/sec: 8075.19 - lr: 0.100000 +2023-04-05 12:24:00,336 epoch 9 - iter 2385/2650 - loss 0.05438808 - time (sec): 163.56 - samples/sec: 8058.71 - lr: 0.100000 +2023-04-05 12:24:18,428 epoch 9 - iter 2650/2650 - loss 0.05453123 - time (sec): 181.66 - samples/sec: 8050.13 - lr: 0.100000 +2023-04-05 12:24:18,429 ---------------------------------------------------------------------------------------------------- +2023-04-05 12:24:18,429 EPOCH 9 done: loss 0.0545 - lr 0.100000 +2023-04-05 12:24:18,429 BAD EPOCHS (no improvement): 0 +2023-04-05 12:24:18,432 ---------------------------------------------------------------------------------------------------- +2023-04-05 12:24:36,778 epoch 10 - iter 265/2650 - loss 0.05202438 - time (sec): 18.35 - samples/sec: 7990.81 - lr: 0.100000 +2023-04-05 12:24:55,101 epoch 10 - iter 530/2650 - loss 0.05354283 - time (sec): 36.67 - samples/sec: 8013.87 - lr: 0.100000 +2023-04-05 12:25:13,287 epoch 10 - iter 795/2650 - loss 0.05225011 - time (sec): 54.86 - samples/sec: 8030.12 - lr: 0.100000 +2023-04-05 12:25:31,826 epoch 10 - iter 1060/2650 - loss 0.05231810 - time (sec): 73.39 - samples/sec: 7987.56 - lr: 0.100000 +2023-04-05 12:25:49,712 epoch 10 - iter 1325/2650 - loss 0.05187882 - time (sec): 91.28 - samples/sec: 8022.72 - lr: 0.100000 +2023-04-05 12:26:08,235 epoch 10 - iter 1590/2650 - loss 0.05216325 - time (sec): 109.80 - samples/sec: 7984.32 - lr: 0.100000 +2023-04-05 12:26:26,736 epoch 10 - iter 1855/2650 - loss 0.05190296 - time (sec): 128.30 - samples/sec: 7960.04 - lr: 0.100000 +2023-04-05 12:26:46,199 epoch 10 - iter 2120/2650 - loss 0.05223343 - time (sec): 147.77 - samples/sec: 7913.12 - lr: 0.100000 +2023-04-05 12:27:05,152 epoch 10 - iter 2385/2650 - loss 0.05226226 - time (sec): 166.72 - samples/sec: 7893.19 - lr: 0.100000 +2023-04-05 12:27:24,673 epoch 10 - iter 2650/2650 - loss 0.05210672 - time (sec): 186.24 - samples/sec: 7851.98 - lr: 0.100000 +2023-04-05 12:27:24,673 ---------------------------------------------------------------------------------------------------- +2023-04-05 12:27:24,673 EPOCH 10 done: loss 0.0521 - lr 0.100000 +2023-04-05 12:27:24,673 BAD EPOCHS (no improvement): 0 +2023-04-05 12:27:24,677 ---------------------------------------------------------------------------------------------------- +2023-04-05 12:27:43,724 epoch 11 - iter 265/2650 - loss 0.05035804 - time (sec): 19.05 - samples/sec: 7672.63 - lr: 0.100000 +2023-04-05 12:28:02,544 epoch 11 - iter 530/2650 - loss 0.05068606 - time (sec): 37.87 - samples/sec: 7657.07 - lr: 0.100000 +2023-04-05 12:28:21,770 epoch 11 - iter 795/2650 - loss 0.05076615 - time (sec): 57.09 - samples/sec: 7656.84 - lr: 0.100000 +2023-04-05 12:28:40,457 epoch 11 - iter 1060/2650 - loss 0.05043864 - time (sec): 75.78 - samples/sec: 7692.52 - lr: 0.100000 +2023-04-05 12:28:59,705 epoch 11 - iter 1325/2650 - loss 0.05087034 - time (sec): 95.03 - samples/sec: 7666.45 - lr: 0.100000 +2023-04-05 12:29:19,595 epoch 11 - iter 1590/2650 - loss 0.05075048 - time (sec): 114.92 - samples/sec: 7622.88 - lr: 0.100000 +2023-04-05 12:29:39,059 epoch 11 - iter 1855/2650 - loss 0.05092614 - time (sec): 134.38 - samples/sec: 7610.38 - lr: 0.100000 +2023-04-05 12:29:58,822 epoch 11 - iter 2120/2650 - loss 0.05130763 - time (sec): 154.15 - samples/sec: 7577.38 - lr: 0.100000 +2023-04-05 12:30:17,970 epoch 11 - iter 2385/2650 - loss 0.05140729 - time (sec): 173.29 - samples/sec: 7586.29 - lr: 0.100000 +2023-04-05 12:30:37,494 epoch 11 - iter 2650/2650 - loss 0.05140431 - time (sec): 192.82 - samples/sec: 7584.21 - lr: 0.100000 +2023-04-05 12:30:37,494 ---------------------------------------------------------------------------------------------------- +2023-04-05 12:30:37,494 EPOCH 11 done: loss 0.0514 - lr 0.100000 +2023-04-05 12:30:37,494 BAD EPOCHS (no improvement): 0 +2023-04-05 12:30:37,497 ---------------------------------------------------------------------------------------------------- +2023-04-05 12:30:55,792 epoch 12 - iter 265/2650 - loss 0.05142969 - time (sec): 18.30 - samples/sec: 7938.95 - lr: 0.100000 +2023-04-05 12:31:14,931 epoch 12 - iter 530/2650 - loss 0.05101526 - time (sec): 37.43 - samples/sec: 7786.51 - lr: 0.100000 +2023-04-05 12:31:33,434 epoch 12 - iter 795/2650 - loss 0.05042159 - time (sec): 55.94 - samples/sec: 7827.24 - lr: 0.100000 +2023-04-05 12:32:02,198 epoch 12 - iter 1060/2650 - loss 0.05017825 - time (sec): 84.70 - samples/sec: 6917.33 - lr: 0.100000 +2023-04-05 12:32:20,821 epoch 12 - iter 1325/2650 - loss 0.05015871 - time (sec): 103.32 - samples/sec: 7091.76 - lr: 0.100000 +2023-04-05 12:32:38,930 epoch 12 - iter 1590/2650 - loss 0.04990136 - time (sec): 121.43 - samples/sec: 7238.21 - lr: 0.100000 +2023-04-05 12:32:57,262 epoch 12 - iter 1855/2650 - loss 0.04999932 - time (sec): 139.77 - samples/sec: 7333.36 - lr: 0.100000 +2023-04-05 12:33:15,257 epoch 12 - iter 2120/2650 - loss 0.05029461 - time (sec): 157.76 - samples/sec: 7419.87 - lr: 0.100000 +2023-04-05 12:33:33,647 epoch 12 - iter 2385/2650 - loss 0.05044099 - time (sec): 176.15 - samples/sec: 7475.19 - lr: 0.100000 +2023-04-05 12:33:52,373 epoch 12 - iter 2650/2650 - loss 0.05025042 - time (sec): 194.88 - samples/sec: 7504.05 - lr: 0.100000 +2023-04-05 12:33:52,374 ---------------------------------------------------------------------------------------------------- +2023-04-05 12:33:52,374 EPOCH 12 done: loss 0.0503 - lr 0.100000 +2023-04-05 12:33:52,374 BAD EPOCHS (no improvement): 0 +2023-04-05 12:33:52,377 ---------------------------------------------------------------------------------------------------- +2023-04-05 12:34:10,141 epoch 13 - iter 265/2650 - loss 0.04869784 - time (sec): 17.76 - samples/sec: 8147.50 - lr: 0.100000 +2023-04-05 12:34:27,656 epoch 13 - iter 530/2650 - loss 0.04833886 - time (sec): 35.28 - samples/sec: 8159.86 - lr: 0.100000 +2023-04-05 12:34:46,174 epoch 13 - iter 795/2650 - loss 0.04896568 - time (sec): 53.80 - samples/sec: 8094.52 - lr: 0.100000 +2023-04-05 12:35:04,386 epoch 13 - iter 1060/2650 - loss 0.04934329 - time (sec): 72.01 - samples/sec: 8073.63 - lr: 0.100000 +2023-04-05 12:35:22,560 epoch 13 - iter 1325/2650 - loss 0.04947801 - time (sec): 90.18 - samples/sec: 8056.63 - lr: 0.100000 +2023-04-05 12:35:41,217 epoch 13 - iter 1590/2650 - loss 0.04976344 - time (sec): 108.84 - samples/sec: 8049.25 - lr: 0.100000 +2023-04-05 12:36:00,059 epoch 13 - iter 1855/2650 - loss 0.04957149 - time (sec): 127.68 - samples/sec: 8005.30 - lr: 0.100000 +2023-04-05 12:36:18,102 epoch 13 - iter 2120/2650 - loss 0.04917012 - time (sec): 145.73 - samples/sec: 8022.10 - lr: 0.100000 +2023-04-05 12:36:36,131 epoch 13 - iter 2385/2650 - loss 0.04929011 - time (sec): 163.75 - samples/sec: 8034.14 - lr: 0.100000 +2023-04-05 12:36:53,884 epoch 13 - iter 2650/2650 - loss 0.04929423 - time (sec): 181.51 - samples/sec: 8056.77 - lr: 0.100000 +2023-04-05 12:36:53,885 ---------------------------------------------------------------------------------------------------- +2023-04-05 12:36:53,885 EPOCH 13 done: loss 0.0493 - lr 0.100000 +2023-04-05 12:36:53,885 BAD EPOCHS (no improvement): 0 +2023-04-05 12:36:53,887 ---------------------------------------------------------------------------------------------------- +2023-04-05 12:37:11,558 epoch 14 - iter 265/2650 - loss 0.05070119 - time (sec): 17.67 - samples/sec: 8249.23 - lr: 0.100000 +2023-04-05 12:37:29,406 epoch 14 - iter 530/2650 - loss 0.04894219 - time (sec): 35.52 - samples/sec: 8190.81 - lr: 0.100000 +2023-04-05 12:37:47,594 epoch 14 - iter 795/2650 - loss 0.04830202 - time (sec): 53.71 - samples/sec: 8125.62 - lr: 0.100000 +2023-04-05 12:38:06,375 epoch 14 - iter 1060/2650 - loss 0.04896686 - time (sec): 72.49 - samples/sec: 8083.61 - lr: 0.100000 +2023-04-05 12:38:25,103 epoch 14 - iter 1325/2650 - loss 0.04885832 - time (sec): 91.22 - samples/sec: 8050.97 - lr: 0.100000 +2023-04-05 12:38:42,814 epoch 14 - iter 1590/2650 - loss 0.04900945 - time (sec): 108.93 - samples/sec: 8069.28 - lr: 0.100000 +2023-04-05 12:39:00,686 epoch 14 - iter 1855/2650 - loss 0.04879396 - time (sec): 126.80 - samples/sec: 8086.54 - lr: 0.100000 +2023-04-05 12:39:19,624 epoch 14 - iter 2120/2650 - loss 0.04914099 - time (sec): 145.74 - samples/sec: 8052.80 - lr: 0.100000 +2023-04-05 12:39:37,651 epoch 14 - iter 2385/2650 - loss 0.04917636 - time (sec): 163.76 - samples/sec: 8051.35 - lr: 0.100000 +2023-04-05 12:39:55,112 epoch 14 - iter 2650/2650 - loss 0.04912956 - time (sec): 181.22 - samples/sec: 8069.36 - lr: 0.100000 +2023-04-05 12:39:55,112 ---------------------------------------------------------------------------------------------------- +2023-04-05 12:39:55,112 EPOCH 14 done: loss 0.0491 - lr 0.100000 +2023-04-05 12:39:55,112 BAD EPOCHS (no improvement): 0 +2023-04-05 12:39:55,114 ---------------------------------------------------------------------------------------------------- +2023-04-05 12:40:13,562 epoch 15 - iter 265/2650 - loss 0.04770681 - time (sec): 18.45 - samples/sec: 8048.53 - lr: 0.100000 +2023-04-05 12:40:31,328 epoch 15 - iter 530/2650 - loss 0.04720848 - time (sec): 36.21 - samples/sec: 8146.94 - lr: 0.100000 +2023-04-05 12:40:49,363 epoch 15 - iter 795/2650 - loss 0.04785518 - time (sec): 54.25 - samples/sec: 8146.11 - lr: 0.100000 +2023-04-05 12:41:07,786 epoch 15 - iter 1060/2650 - loss 0.04800242 - time (sec): 72.67 - samples/sec: 8077.61 - lr: 0.100000 +2023-04-05 12:41:25,997 epoch 15 - iter 1325/2650 - loss 0.04822847 - time (sec): 90.88 - samples/sec: 8073.97 - lr: 0.100000 +2023-04-05 12:41:44,124 epoch 15 - iter 1590/2650 - loss 0.04824853 - time (sec): 109.01 - samples/sec: 8075.87 - lr: 0.100000 +2023-04-05 12:42:02,573 epoch 15 - iter 1855/2650 - loss 0.04802729 - time (sec): 127.46 - samples/sec: 8058.30 - lr: 0.100000 +2023-04-05 12:42:20,962 epoch 15 - iter 2120/2650 - loss 0.04827911 - time (sec): 145.85 - samples/sec: 8040.04 - lr: 0.100000 +2023-04-05 12:42:38,237 epoch 15 - iter 2385/2650 - loss 0.04837887 - time (sec): 163.12 - samples/sec: 8065.94 - lr: 0.100000 +2023-04-05 12:42:56,431 epoch 15 - iter 2650/2650 - loss 0.04811435 - time (sec): 181.32 - samples/sec: 8065.24 - lr: 0.100000 +2023-04-05 12:42:56,431 ---------------------------------------------------------------------------------------------------- +2023-04-05 12:42:56,431 EPOCH 15 done: loss 0.0481 - lr 0.100000 +2023-04-05 12:42:56,432 BAD EPOCHS (no improvement): 0 +2023-04-05 12:42:56,434 ---------------------------------------------------------------------------------------------------- +2023-04-05 12:43:14,635 epoch 16 - iter 265/2650 - loss 0.04630785 - time (sec): 18.20 - samples/sec: 8009.11 - lr: 0.100000 +2023-04-05 12:43:32,318 epoch 16 - iter 530/2650 - loss 0.04618502 - time (sec): 35.88 - samples/sec: 8104.27 - lr: 0.100000 +2023-04-05 12:43:50,542 epoch 16 - iter 795/2650 - loss 0.04635297 - time (sec): 54.11 - samples/sec: 8095.55 - lr: 0.100000 +2023-04-05 12:44:08,855 epoch 16 - iter 1060/2650 - loss 0.04636492 - time (sec): 72.42 - samples/sec: 8066.14 - lr: 0.100000 +2023-04-05 12:44:27,258 epoch 16 - iter 1325/2650 - loss 0.04690913 - time (sec): 90.82 - samples/sec: 8045.54 - lr: 0.100000 +2023-04-05 12:44:45,564 epoch 16 - iter 1590/2650 - loss 0.04724407 - time (sec): 109.13 - samples/sec: 8032.83 - lr: 0.100000 +2023-04-05 12:45:03,846 epoch 16 - iter 1855/2650 - loss 0.04734092 - time (sec): 127.41 - samples/sec: 8035.39 - lr: 0.100000 +2023-04-05 12:45:21,556 epoch 16 - iter 2120/2650 - loss 0.04739831 - time (sec): 145.12 - samples/sec: 8051.10 - lr: 0.100000 +2023-04-05 12:45:39,934 epoch 16 - iter 2385/2650 - loss 0.04710078 - time (sec): 163.50 - samples/sec: 8043.60 - lr: 0.100000 +2023-04-05 12:45:58,148 epoch 16 - iter 2650/2650 - loss 0.04717087 - time (sec): 181.71 - samples/sec: 8047.64 - lr: 0.100000 +2023-04-05 12:45:58,148 ---------------------------------------------------------------------------------------------------- +2023-04-05 12:45:58,148 EPOCH 16 done: loss 0.0472 - lr 0.100000 +2023-04-05 12:45:58,148 BAD EPOCHS (no improvement): 0 +2023-04-05 12:45:58,151 ---------------------------------------------------------------------------------------------------- +2023-04-05 12:46:15,780 epoch 17 - iter 265/2650 - loss 0.04447271 - time (sec): 17.63 - samples/sec: 8296.63 - lr: 0.100000 +2023-04-05 12:46:33,987 epoch 17 - iter 530/2650 - loss 0.04585046 - time (sec): 35.84 - samples/sec: 8211.57 - lr: 0.100000 +2023-04-05 12:46:52,536 epoch 17 - iter 795/2650 - loss 0.04658852 - time (sec): 54.38 - samples/sec: 8111.57 - lr: 0.100000 +2023-04-05 12:47:10,623 epoch 17 - iter 1060/2650 - loss 0.04711308 - time (sec): 72.47 - samples/sec: 8110.04 - lr: 0.100000 +2023-04-05 12:47:29,006 epoch 17 - iter 1325/2650 - loss 0.04699361 - time (sec): 90.86 - samples/sec: 8090.16 - lr: 0.100000 +2023-04-05 12:47:46,870 epoch 17 - iter 1590/2650 - loss 0.04695491 - time (sec): 108.72 - samples/sec: 8077.02 - lr: 0.100000 +2023-04-05 12:48:05,515 epoch 17 - iter 1855/2650 - loss 0.04724098 - time (sec): 127.36 - samples/sec: 8044.65 - lr: 0.100000 +2023-04-05 12:48:23,969 epoch 17 - iter 2120/2650 - loss 0.04700970 - time (sec): 145.82 - samples/sec: 8032.33 - lr: 0.100000 +2023-04-05 12:48:42,057 epoch 17 - iter 2385/2650 - loss 0.04706724 - time (sec): 163.91 - samples/sec: 8046.61 - lr: 0.100000 +2023-04-05 12:48:59,697 epoch 17 - iter 2650/2650 - loss 0.04712588 - time (sec): 181.55 - samples/sec: 8055.04 - lr: 0.100000 +2023-04-05 12:48:59,698 ---------------------------------------------------------------------------------------------------- +2023-04-05 12:48:59,698 EPOCH 17 done: loss 0.0471 - lr 0.100000 +2023-04-05 12:48:59,698 BAD EPOCHS (no improvement): 0 +2023-04-05 12:48:59,700 ---------------------------------------------------------------------------------------------------- +2023-04-05 12:49:17,779 epoch 18 - iter 265/2650 - loss 0.04534113 - time (sec): 18.08 - samples/sec: 8105.65 - lr: 0.100000 +2023-04-05 12:49:36,247 epoch 18 - iter 530/2650 - loss 0.04500882 - time (sec): 36.55 - samples/sec: 8037.67 - lr: 0.100000 +2023-04-05 12:49:54,903 epoch 18 - iter 795/2650 - loss 0.04562249 - time (sec): 55.20 - samples/sec: 7966.61 - lr: 0.100000 +2023-04-05 12:50:12,466 epoch 18 - iter 1060/2650 - loss 0.04584471 - time (sec): 72.77 - samples/sec: 8031.68 - lr: 0.100000 +2023-04-05 12:50:30,446 epoch 18 - iter 1325/2650 - loss 0.04577433 - time (sec): 90.75 - samples/sec: 8050.38 - lr: 0.100000 +2023-04-05 12:50:48,330 epoch 18 - iter 1590/2650 - loss 0.04584530 - time (sec): 108.63 - samples/sec: 8066.93 - lr: 0.100000 +2023-04-05 12:51:06,888 epoch 18 - iter 1855/2650 - loss 0.04614281 - time (sec): 127.19 - samples/sec: 8049.02 - lr: 0.100000 +2023-04-05 12:51:25,822 epoch 18 - iter 2120/2650 - loss 0.04605253 - time (sec): 146.12 - samples/sec: 8012.92 - lr: 0.100000 +2023-04-05 12:51:43,924 epoch 18 - iter 2385/2650 - loss 0.04626635 - time (sec): 164.22 - samples/sec: 8018.25 - lr: 0.100000 +2023-04-05 12:52:01,853 epoch 18 - iter 2650/2650 - loss 0.04661335 - time (sec): 182.15 - samples/sec: 8028.23 - lr: 0.100000 +2023-04-05 12:52:01,853 ---------------------------------------------------------------------------------------------------- +2023-04-05 12:52:01,853 EPOCH 18 done: loss 0.0466 - lr 0.100000 +2023-04-05 12:52:01,853 BAD EPOCHS (no improvement): 0 +2023-04-05 12:52:01,856 ---------------------------------------------------------------------------------------------------- +2023-04-05 12:52:19,663 epoch 19 - iter 265/2650 - loss 0.04505265 - time (sec): 17.81 - samples/sec: 8223.56 - lr: 0.100000 +2023-04-05 12:52:38,041 epoch 19 - iter 530/2650 - loss 0.04439638 - time (sec): 36.19 - samples/sec: 8091.02 - lr: 0.100000 +2023-04-05 12:52:56,615 epoch 19 - iter 795/2650 - loss 0.04423008 - time (sec): 54.76 - samples/sec: 8018.48 - lr: 0.100000 +2023-04-05 12:53:15,321 epoch 19 - iter 1060/2650 - loss 0.04499290 - time (sec): 73.47 - samples/sec: 7975.07 - lr: 0.100000 +2023-04-05 12:53:33,845 epoch 19 - iter 1325/2650 - loss 0.04562271 - time (sec): 91.99 - samples/sec: 7982.62 - lr: 0.100000 +2023-04-05 12:53:51,826 epoch 19 - iter 1590/2650 - loss 0.04546048 - time (sec): 109.97 - samples/sec: 7994.45 - lr: 0.100000 +2023-04-05 12:54:09,327 epoch 19 - iter 1855/2650 - loss 0.04558059 - time (sec): 127.47 - samples/sec: 8030.34 - lr: 0.100000 +2023-04-05 12:54:27,628 epoch 19 - iter 2120/2650 - loss 0.04570780 - time (sec): 145.77 - samples/sec: 8024.29 - lr: 0.100000 +2023-04-05 12:54:46,386 epoch 19 - iter 2385/2650 - loss 0.04587781 - time (sec): 164.53 - samples/sec: 8003.36 - lr: 0.100000 +2023-04-05 12:55:04,505 epoch 19 - iter 2650/2650 - loss 0.04580571 - time (sec): 182.65 - samples/sec: 8006.42 - lr: 0.100000 +2023-04-05 12:55:04,505 ---------------------------------------------------------------------------------------------------- +2023-04-05 12:55:04,505 EPOCH 19 done: loss 0.0458 - lr 0.100000 +2023-04-05 12:55:04,505 BAD EPOCHS (no improvement): 0 +2023-04-05 12:55:04,508 ---------------------------------------------------------------------------------------------------- +2023-04-05 12:55:22,556 epoch 20 - iter 265/2650 - loss 0.04387430 - time (sec): 18.05 - samples/sec: 8116.85 - lr: 0.100000 +2023-04-05 12:55:40,810 epoch 20 - iter 530/2650 - loss 0.04445772 - time (sec): 36.30 - samples/sec: 8050.00 - lr: 0.100000 +2023-04-05 12:55:58,705 epoch 20 - iter 795/2650 - loss 0.04438246 - time (sec): 54.20 - samples/sec: 8073.68 - lr: 0.100000 +2023-04-05 12:56:16,861 epoch 20 - iter 1060/2650 - loss 0.04488826 - time (sec): 72.35 - samples/sec: 8076.96 - lr: 0.100000 +2023-04-05 12:56:35,426 epoch 20 - iter 1325/2650 - loss 0.04515160 - time (sec): 90.92 - samples/sec: 8050.84 - lr: 0.100000 +2023-04-05 12:56:53,780 epoch 20 - iter 1590/2650 - loss 0.04503194 - time (sec): 109.27 - samples/sec: 8033.88 - lr: 0.100000 +2023-04-05 12:57:12,307 epoch 20 - iter 1855/2650 - loss 0.04513114 - time (sec): 127.80 - samples/sec: 8018.82 - lr: 0.100000 +2023-04-05 12:57:30,000 epoch 20 - iter 2120/2650 - loss 0.04504153 - time (sec): 145.49 - samples/sec: 8044.30 - lr: 0.100000 +2023-04-05 12:57:48,103 epoch 20 - iter 2385/2650 - loss 0.04545527 - time (sec): 163.60 - samples/sec: 8053.17 - lr: 0.100000 +2023-04-05 12:58:06,486 epoch 20 - iter 2650/2650 - loss 0.04538527 - time (sec): 181.98 - samples/sec: 8035.91 - lr: 0.100000 +2023-04-05 12:58:06,486 ---------------------------------------------------------------------------------------------------- +2023-04-05 12:58:06,486 EPOCH 20 done: loss 0.0454 - lr 0.100000 +2023-04-05 12:58:06,486 BAD EPOCHS (no improvement): 0 +2023-04-05 12:58:06,489 ---------------------------------------------------------------------------------------------------- +2023-04-05 12:58:24,763 epoch 21 - iter 265/2650 - loss 0.04522860 - time (sec): 18.27 - samples/sec: 8080.58 - lr: 0.100000 +2023-04-05 12:58:43,172 epoch 21 - iter 530/2650 - loss 0.04444685 - time (sec): 36.68 - samples/sec: 8004.57 - lr: 0.100000 +2023-04-05 12:59:01,115 epoch 21 - iter 795/2650 - loss 0.04384121 - time (sec): 54.63 - samples/sec: 8025.63 - lr: 0.100000 +2023-04-05 12:59:19,124 epoch 21 - iter 1060/2650 - loss 0.04426612 - time (sec): 72.63 - samples/sec: 8045.44 - lr: 0.100000 +2023-04-05 12:59:37,427 epoch 21 - iter 1325/2650 - loss 0.04421822 - time (sec): 90.94 - samples/sec: 8020.56 - lr: 0.100000 +2023-04-05 12:59:56,261 epoch 21 - iter 1590/2650 - loss 0.04453069 - time (sec): 109.77 - samples/sec: 7992.37 - lr: 0.100000 +2023-04-05 13:00:14,296 epoch 21 - iter 1855/2650 - loss 0.04465350 - time (sec): 127.81 - samples/sec: 8008.44 - lr: 0.100000 +2023-04-05 13:00:33,220 epoch 21 - iter 2120/2650 - loss 0.04460016 - time (sec): 146.73 - samples/sec: 7972.62 - lr: 0.100000 +2023-04-05 13:00:51,801 epoch 21 - iter 2385/2650 - loss 0.04483597 - time (sec): 165.31 - samples/sec: 7965.23 - lr: 0.100000 +2023-04-05 13:01:10,085 epoch 21 - iter 2650/2650 - loss 0.04493471 - time (sec): 183.60 - samples/sec: 7965.12 - lr: 0.100000 +2023-04-05 13:01:10,085 ---------------------------------------------------------------------------------------------------- +2023-04-05 13:01:10,085 EPOCH 21 done: loss 0.0449 - lr 0.100000 +2023-04-05 13:01:10,085 BAD EPOCHS (no improvement): 0 +2023-04-05 13:01:10,090 ---------------------------------------------------------------------------------------------------- +2023-04-05 13:01:28,506 epoch 22 - iter 265/2650 - loss 0.04511821 - time (sec): 18.42 - samples/sec: 7943.87 - lr: 0.100000 +2023-04-05 13:01:46,489 epoch 22 - iter 530/2650 - loss 0.04502722 - time (sec): 36.40 - samples/sec: 8024.47 - lr: 0.100000 +2023-04-05 13:02:05,121 epoch 22 - iter 795/2650 - loss 0.04494844 - time (sec): 55.03 - samples/sec: 8003.25 - lr: 0.100000 +2023-04-05 13:02:22,948 epoch 22 - iter 1060/2650 - loss 0.04452581 - time (sec): 72.86 - samples/sec: 8043.82 - lr: 0.100000 +2023-04-05 13:02:41,650 epoch 22 - iter 1325/2650 - loss 0.04475034 - time (sec): 91.56 - samples/sec: 7993.55 - lr: 0.100000 +2023-04-05 13:02:59,787 epoch 22 - iter 1590/2650 - loss 0.04504895 - time (sec): 109.70 - samples/sec: 7999.96 - lr: 0.100000 +2023-04-05 13:03:17,907 epoch 22 - iter 1855/2650 - loss 0.04496822 - time (sec): 127.82 - samples/sec: 8005.83 - lr: 0.100000 +2023-04-05 13:03:36,089 epoch 22 - iter 2120/2650 - loss 0.04484396 - time (sec): 146.00 - samples/sec: 8017.54 - lr: 0.100000 +2023-04-05 13:03:54,119 epoch 22 - iter 2385/2650 - loss 0.04474206 - time (sec): 164.03 - samples/sec: 8024.17 - lr: 0.100000 +2023-04-05 13:04:13,239 epoch 22 - iter 2650/2650 - loss 0.04474036 - time (sec): 183.15 - samples/sec: 7984.58 - lr: 0.100000 +2023-04-05 13:04:13,239 ---------------------------------------------------------------------------------------------------- +2023-04-05 13:04:13,239 EPOCH 22 done: loss 0.0447 - lr 0.100000 +2023-04-05 13:04:13,239 BAD EPOCHS (no improvement): 0 +2023-04-05 13:04:13,244 ---------------------------------------------------------------------------------------------------- +2023-04-05 13:04:31,485 epoch 23 - iter 265/2650 - loss 0.04164168 - time (sec): 18.24 - samples/sec: 8010.15 - lr: 0.100000 +2023-04-05 13:04:49,785 epoch 23 - iter 530/2650 - loss 0.04364843 - time (sec): 36.54 - samples/sec: 7985.82 - lr: 0.100000 +2023-04-05 13:05:07,837 epoch 23 - iter 795/2650 - loss 0.04316618 - time (sec): 54.59 - samples/sec: 8019.92 - lr: 0.100000 +2023-04-05 13:05:25,713 epoch 23 - iter 1060/2650 - loss 0.04361513 - time (sec): 72.47 - samples/sec: 8053.57 - lr: 0.100000 +2023-04-05 13:05:44,054 epoch 23 - iter 1325/2650 - loss 0.04343084 - time (sec): 90.81 - samples/sec: 8047.12 - lr: 0.100000 +2023-04-05 13:06:02,262 epoch 23 - iter 1590/2650 - loss 0.04345269 - time (sec): 109.02 - samples/sec: 8044.96 - lr: 0.100000 +2023-04-05 13:06:20,685 epoch 23 - iter 1855/2650 - loss 0.04372976 - time (sec): 127.44 - samples/sec: 8041.28 - lr: 0.100000 +2023-04-05 13:06:38,923 epoch 23 - iter 2120/2650 - loss 0.04398138 - time (sec): 145.68 - samples/sec: 8035.93 - lr: 0.100000 +2023-04-05 13:06:56,837 epoch 23 - iter 2385/2650 - loss 0.04379402 - time (sec): 163.59 - samples/sec: 8041.68 - lr: 0.100000 +2023-04-05 13:07:15,197 epoch 23 - iter 2650/2650 - loss 0.04418538 - time (sec): 181.95 - samples/sec: 8037.04 - lr: 0.100000 +2023-04-05 13:07:15,198 ---------------------------------------------------------------------------------------------------- +2023-04-05 13:07:15,198 EPOCH 23 done: loss 0.0442 - lr 0.100000 +2023-04-05 13:07:15,198 BAD EPOCHS (no improvement): 0 +2023-04-05 13:07:15,201 ---------------------------------------------------------------------------------------------------- +2023-04-05 13:07:33,174 epoch 24 - iter 265/2650 - loss 0.04156197 - time (sec): 17.97 - samples/sec: 8098.87 - lr: 0.100000 +2023-04-05 13:07:51,024 epoch 24 - iter 530/2650 - loss 0.04331153 - time (sec): 35.82 - samples/sec: 8121.57 - lr: 0.100000 +2023-04-05 13:08:09,442 epoch 24 - iter 795/2650 - loss 0.04350761 - time (sec): 54.24 - samples/sec: 8062.68 - lr: 0.100000 +2023-04-05 13:08:27,523 epoch 24 - iter 1060/2650 - loss 0.04390878 - time (sec): 72.32 - samples/sec: 8086.50 - lr: 0.100000 +2023-04-05 13:08:45,934 epoch 24 - iter 1325/2650 - loss 0.04354562 - time (sec): 90.73 - samples/sec: 8048.27 - lr: 0.100000 +2023-04-05 13:09:04,836 epoch 24 - iter 1590/2650 - loss 0.04379741 - time (sec): 109.63 - samples/sec: 8022.50 - lr: 0.100000 +2023-04-05 13:09:22,518 epoch 24 - iter 1855/2650 - loss 0.04377413 - time (sec): 127.32 - samples/sec: 8042.13 - lr: 0.100000 +2023-04-05 13:09:40,840 epoch 24 - iter 2120/2650 - loss 0.04379683 - time (sec): 145.64 - samples/sec: 8029.57 - lr: 0.100000 +2023-04-05 13:09:59,397 epoch 24 - iter 2385/2650 - loss 0.04376487 - time (sec): 164.20 - samples/sec: 8020.88 - lr: 0.100000 +2023-04-05 13:10:17,691 epoch 24 - iter 2650/2650 - loss 0.04388423 - time (sec): 182.49 - samples/sec: 8013.40 - lr: 0.100000 +2023-04-05 13:10:17,691 ---------------------------------------------------------------------------------------------------- +2023-04-05 13:10:17,691 EPOCH 24 done: loss 0.0439 - lr 0.100000 +2023-04-05 13:10:17,691 BAD EPOCHS (no improvement): 0 +2023-04-05 13:10:17,695 ---------------------------------------------------------------------------------------------------- +2023-04-05 13:10:36,202 epoch 25 - iter 265/2650 - loss 0.04323290 - time (sec): 18.51 - samples/sec: 7923.02 - lr: 0.100000 +2023-04-05 13:10:54,315 epoch 25 - iter 530/2650 - loss 0.04310124 - time (sec): 36.62 - samples/sec: 7965.22 - lr: 0.100000 +2023-04-05 13:11:13,064 epoch 25 - iter 795/2650 - loss 0.04346477 - time (sec): 55.37 - samples/sec: 7951.91 - lr: 0.100000 +2023-04-05 13:11:30,965 epoch 25 - iter 1060/2650 - loss 0.04365669 - time (sec): 73.27 - samples/sec: 8003.17 - lr: 0.100000 +2023-04-05 13:11:48,934 epoch 25 - iter 1325/2650 - loss 0.04364555 - time (sec): 91.24 - samples/sec: 8035.12 - lr: 0.100000 +2023-04-05 13:12:07,418 epoch 25 - iter 1590/2650 - loss 0.04344050 - time (sec): 109.72 - samples/sec: 8018.26 - lr: 0.100000 +2023-04-05 13:12:25,485 epoch 25 - iter 1855/2650 - loss 0.04342011 - time (sec): 127.79 - samples/sec: 8022.96 - lr: 0.100000 +2023-04-05 13:12:43,559 epoch 25 - iter 2120/2650 - loss 0.04361445 - time (sec): 145.86 - samples/sec: 8027.99 - lr: 0.100000 +2023-04-05 13:13:02,004 epoch 25 - iter 2385/2650 - loss 0.04374248 - time (sec): 164.31 - samples/sec: 8021.44 - lr: 0.100000 +2023-04-05 13:13:20,063 epoch 25 - iter 2650/2650 - loss 0.04363611 - time (sec): 182.37 - samples/sec: 8018.72 - lr: 0.100000 +2023-04-05 13:13:20,064 ---------------------------------------------------------------------------------------------------- +2023-04-05 13:13:20,064 EPOCH 25 done: loss 0.0436 - lr 0.100000 +2023-04-05 13:13:20,064 BAD EPOCHS (no improvement): 0 +2023-04-05 13:13:20,067 ---------------------------------------------------------------------------------------------------- +2023-04-05 13:13:38,392 epoch 26 - iter 265/2650 - loss 0.04477252 - time (sec): 18.32 - samples/sec: 7968.92 - lr: 0.100000 +2023-04-05 13:13:56,495 epoch 26 - iter 530/2650 - loss 0.04367345 - time (sec): 36.43 - samples/sec: 7969.02 - lr: 0.100000 +2023-04-05 13:14:14,737 epoch 26 - iter 795/2650 - loss 0.04407882 - time (sec): 54.67 - samples/sec: 7998.34 - lr: 0.100000 +2023-04-05 13:14:32,645 epoch 26 - iter 1060/2650 - loss 0.04416501 - time (sec): 72.58 - samples/sec: 8034.64 - lr: 0.100000 +2023-04-05 13:14:51,277 epoch 26 - iter 1325/2650 - loss 0.04376531 - time (sec): 91.21 - samples/sec: 8006.96 - lr: 0.100000 +2023-04-05 13:15:09,363 epoch 26 - iter 1590/2650 - loss 0.04380597 - time (sec): 109.30 - samples/sec: 8018.65 - lr: 0.100000 +2023-04-05 13:15:27,651 epoch 26 - iter 1855/2650 - loss 0.04374117 - time (sec): 127.58 - samples/sec: 8029.18 - lr: 0.100000 +2023-04-05 13:15:45,676 epoch 26 - iter 2120/2650 - loss 0.04389153 - time (sec): 145.61 - samples/sec: 8036.39 - lr: 0.100000 +2023-04-05 13:16:03,889 epoch 26 - iter 2385/2650 - loss 0.04381933 - time (sec): 163.82 - samples/sec: 8032.26 - lr: 0.100000 +2023-04-05 13:16:22,078 epoch 26 - iter 2650/2650 - loss 0.04370044 - time (sec): 182.01 - samples/sec: 8034.50 - lr: 0.100000 +2023-04-05 13:16:22,078 ---------------------------------------------------------------------------------------------------- +2023-04-05 13:16:22,078 EPOCH 26 done: loss 0.0437 - lr 0.100000 +2023-04-05 13:16:22,078 BAD EPOCHS (no improvement): 1 +2023-04-05 13:16:22,082 ---------------------------------------------------------------------------------------------------- +2023-04-05 13:16:40,599 epoch 27 - iter 265/2650 - loss 0.04403857 - time (sec): 18.52 - samples/sec: 7872.04 - lr: 0.100000 +2023-04-05 13:16:59,011 epoch 27 - iter 530/2650 - loss 0.04311112 - time (sec): 36.93 - samples/sec: 7928.55 - lr: 0.100000 +2023-04-05 13:17:17,221 epoch 27 - iter 795/2650 - loss 0.04312914 - time (sec): 55.14 - samples/sec: 7954.66 - lr: 0.100000 +2023-04-05 13:17:35,292 epoch 27 - iter 1060/2650 - loss 0.04346302 - time (sec): 73.21 - samples/sec: 7972.79 - lr: 0.100000 +2023-04-05 13:17:53,453 epoch 27 - iter 1325/2650 - loss 0.04320810 - time (sec): 91.37 - samples/sec: 7988.86 - lr: 0.100000 +2023-04-05 13:18:11,353 epoch 27 - iter 1590/2650 - loss 0.04322007 - time (sec): 109.27 - samples/sec: 8024.30 - lr: 0.100000 +2023-04-05 13:18:29,425 epoch 27 - iter 1855/2650 - loss 0.04326717 - time (sec): 127.34 - samples/sec: 8036.24 - lr: 0.100000 +2023-04-05 13:18:47,808 epoch 27 - iter 2120/2650 - loss 0.04329751 - time (sec): 145.73 - samples/sec: 8033.30 - lr: 0.100000 +2023-04-05 13:19:05,711 epoch 27 - iter 2385/2650 - loss 0.04329392 - time (sec): 163.63 - samples/sec: 8048.31 - lr: 0.100000 +2023-04-05 13:19:33,416 epoch 27 - iter 2650/2650 - loss 0.04321950 - time (sec): 191.33 - samples/sec: 7642.96 - lr: 0.100000 +2023-04-05 13:19:33,417 ---------------------------------------------------------------------------------------------------- +2023-04-05 13:19:33,417 EPOCH 27 done: loss 0.0432 - lr 0.100000 +2023-04-05 13:19:33,417 BAD EPOCHS (no improvement): 0 +2023-04-05 13:19:33,419 ---------------------------------------------------------------------------------------------------- +2023-04-05 13:19:51,483 epoch 28 - iter 265/2650 - loss 0.04074091 - time (sec): 18.06 - samples/sec: 8063.48 - lr: 0.100000 +2023-04-05 13:20:09,382 epoch 28 - iter 530/2650 - loss 0.04096435 - time (sec): 35.96 - samples/sec: 8130.18 - lr: 0.100000 +2023-04-05 13:20:27,302 epoch 28 - iter 795/2650 - loss 0.04174707 - time (sec): 53.88 - samples/sec: 8134.68 - lr: 0.100000 +2023-04-05 13:20:45,630 epoch 28 - iter 1060/2650 - loss 0.04178587 - time (sec): 72.21 - samples/sec: 8104.29 - lr: 0.100000 +2023-04-05 13:21:03,244 epoch 28 - iter 1325/2650 - loss 0.04190726 - time (sec): 89.82 - samples/sec: 8126.26 - lr: 0.100000 +2023-04-05 13:21:21,365 epoch 28 - iter 1590/2650 - loss 0.04200885 - time (sec): 107.95 - samples/sec: 8107.54 - lr: 0.100000 +2023-04-05 13:21:39,657 epoch 28 - iter 1855/2650 - loss 0.04210387 - time (sec): 126.24 - samples/sec: 8095.57 - lr: 0.100000 +2023-04-05 13:21:58,459 epoch 28 - iter 2120/2650 - loss 0.04225489 - time (sec): 145.04 - samples/sec: 8064.57 - lr: 0.100000 +2023-04-05 13:22:16,148 epoch 28 - iter 2385/2650 - loss 0.04275993 - time (sec): 162.73 - samples/sec: 8083.56 - lr: 0.100000 +2023-04-05 13:22:34,737 epoch 28 - iter 2650/2650 - loss 0.04290212 - time (sec): 181.32 - samples/sec: 8065.20 - lr: 0.100000 +2023-04-05 13:22:34,738 ---------------------------------------------------------------------------------------------------- +2023-04-05 13:22:34,738 EPOCH 28 done: loss 0.0429 - lr 0.100000 +2023-04-05 13:22:34,738 BAD EPOCHS (no improvement): 0 +2023-04-05 13:22:34,740 ---------------------------------------------------------------------------------------------------- +2023-04-05 13:22:52,768 epoch 29 - iter 265/2650 - loss 0.04376124 - time (sec): 18.03 - samples/sec: 8084.80 - lr: 0.100000 +2023-04-05 13:23:10,719 epoch 29 - iter 530/2650 - loss 0.04263117 - time (sec): 35.98 - samples/sec: 8133.67 - lr: 0.100000 +2023-04-05 13:23:29,475 epoch 29 - iter 795/2650 - loss 0.04264667 - time (sec): 54.73 - samples/sec: 8052.02 - lr: 0.100000 +2023-04-05 13:23:47,549 epoch 29 - iter 1060/2650 - loss 0.04260931 - time (sec): 72.81 - samples/sec: 8058.13 - lr: 0.100000 +2023-04-05 13:24:05,636 epoch 29 - iter 1325/2650 - loss 0.04231919 - time (sec): 90.90 - samples/sec: 8057.40 - lr: 0.100000 +2023-04-05 13:24:23,448 epoch 29 - iter 1590/2650 - loss 0.04242064 - time (sec): 108.71 - samples/sec: 8079.12 - lr: 0.100000 +2023-04-05 13:24:42,780 epoch 29 - iter 1855/2650 - loss 0.04259660 - time (sec): 128.04 - samples/sec: 8010.49 - lr: 0.100000 +2023-04-05 13:25:00,948 epoch 29 - iter 2120/2650 - loss 0.04236871 - time (sec): 146.21 - samples/sec: 8003.30 - lr: 0.100000 +2023-04-05 13:25:19,634 epoch 29 - iter 2385/2650 - loss 0.04241459 - time (sec): 164.89 - samples/sec: 7979.20 - lr: 0.100000 +2023-04-05 13:25:38,473 epoch 29 - iter 2650/2650 - loss 0.04279556 - time (sec): 183.73 - samples/sec: 7959.19 - lr: 0.100000 +2023-04-05 13:25:38,473 ---------------------------------------------------------------------------------------------------- +2023-04-05 13:25:38,473 EPOCH 29 done: loss 0.0428 - lr 0.100000 +2023-04-05 13:25:38,473 BAD EPOCHS (no improvement): 0 +2023-04-05 13:25:38,476 ---------------------------------------------------------------------------------------------------- +2023-04-05 13:25:57,144 epoch 30 - iter 265/2650 - loss 0.04278590 - time (sec): 18.67 - samples/sec: 7813.60 - lr: 0.100000 +2023-04-05 13:26:16,476 epoch 30 - iter 530/2650 - loss 0.04287335 - time (sec): 38.00 - samples/sec: 7710.33 - lr: 0.100000 +2023-04-05 13:26:35,938 epoch 30 - iter 795/2650 - loss 0.04271567 - time (sec): 57.46 - samples/sec: 7659.00 - lr: 0.100000 +2023-04-05 13:26:54,342 epoch 30 - iter 1060/2650 - loss 0.04278500 - time (sec): 75.87 - samples/sec: 7685.83 - lr: 0.100000 +2023-04-05 13:27:13,343 epoch 30 - iter 1325/2650 - loss 0.04283643 - time (sec): 94.87 - samples/sec: 7695.19 - lr: 0.100000 +2023-04-05 13:27:31,356 epoch 30 - iter 1590/2650 - loss 0.04278760 - time (sec): 112.88 - samples/sec: 7755.23 - lr: 0.100000 +2023-04-05 13:27:51,356 epoch 30 - iter 1855/2650 - loss 0.04262510 - time (sec): 132.88 - samples/sec: 7700.43 - lr: 0.100000 +2023-04-05 13:28:10,329 epoch 30 - iter 2120/2650 - loss 0.04273573 - time (sec): 151.85 - samples/sec: 7710.19 - lr: 0.100000 +2023-04-05 13:28:28,789 epoch 30 - iter 2385/2650 - loss 0.04256292 - time (sec): 170.31 - samples/sec: 7722.37 - lr: 0.100000 +2023-04-05 13:28:47,838 epoch 30 - iter 2650/2650 - loss 0.04250649 - time (sec): 189.36 - samples/sec: 7722.60 - lr: 0.100000 +2023-04-05 13:28:47,838 ---------------------------------------------------------------------------------------------------- +2023-04-05 13:28:47,838 EPOCH 30 done: loss 0.0425 - lr 0.100000 +2023-04-05 13:28:47,838 BAD EPOCHS (no improvement): 0 +2023-04-05 13:28:47,841 ---------------------------------------------------------------------------------------------------- +2023-04-05 13:29:06,510 epoch 31 - iter 265/2650 - loss 0.04048803 - time (sec): 18.67 - samples/sec: 7818.74 - lr: 0.100000 +2023-04-05 13:29:25,075 epoch 31 - iter 530/2650 - loss 0.04102968 - time (sec): 37.23 - samples/sec: 7878.84 - lr: 0.100000 +2023-04-05 13:29:43,938 epoch 31 - iter 795/2650 - loss 0.04190570 - time (sec): 56.10 - samples/sec: 7822.37 - lr: 0.100000 +2023-04-05 13:30:03,275 epoch 31 - iter 1060/2650 - loss 0.04211806 - time (sec): 75.43 - samples/sec: 7763.41 - lr: 0.100000 +2023-04-05 13:30:22,762 epoch 31 - iter 1325/2650 - loss 0.04224230 - time (sec): 94.92 - samples/sec: 7711.48 - lr: 0.100000 +2023-04-05 13:30:40,948 epoch 31 - iter 1590/2650 - loss 0.04203982 - time (sec): 113.11 - samples/sec: 7748.69 - lr: 0.100000 +2023-04-05 13:30:59,417 epoch 31 - iter 1855/2650 - loss 0.04228135 - time (sec): 131.58 - samples/sec: 7764.32 - lr: 0.100000 +2023-04-05 13:31:18,796 epoch 31 - iter 2120/2650 - loss 0.04266091 - time (sec): 150.96 - samples/sec: 7751.92 - lr: 0.100000 +2023-04-05 13:31:36,894 epoch 31 - iter 2385/2650 - loss 0.04269306 - time (sec): 169.05 - samples/sec: 7784.98 - lr: 0.100000 +2023-04-05 13:31:55,812 epoch 31 - iter 2650/2650 - loss 0.04277351 - time (sec): 187.97 - samples/sec: 7779.70 - lr: 0.100000 +2023-04-05 13:31:55,813 ---------------------------------------------------------------------------------------------------- +2023-04-05 13:31:55,813 EPOCH 31 done: loss 0.0428 - lr 0.100000 +2023-04-05 13:31:55,813 BAD EPOCHS (no improvement): 1 +2023-04-05 13:31:55,815 ---------------------------------------------------------------------------------------------------- +2023-04-05 13:32:14,247 epoch 32 - iter 265/2650 - loss 0.04114136 - time (sec): 18.43 - samples/sec: 7953.85 - lr: 0.100000 +2023-04-05 13:32:32,555 epoch 32 - iter 530/2650 - loss 0.04240506 - time (sec): 36.74 - samples/sec: 7987.19 - lr: 0.100000 +2023-04-05 13:32:50,934 epoch 32 - iter 795/2650 - loss 0.04217008 - time (sec): 55.12 - samples/sec: 7975.19 - lr: 0.100000 +2023-04-05 13:33:09,389 epoch 32 - iter 1060/2650 - loss 0.04241276 - time (sec): 73.57 - samples/sec: 7964.56 - lr: 0.100000 +2023-04-05 13:33:27,322 epoch 32 - iter 1325/2650 - loss 0.04250188 - time (sec): 91.51 - samples/sec: 7988.69 - lr: 0.100000 +2023-04-05 13:33:45,376 epoch 32 - iter 1590/2650 - loss 0.04214098 - time (sec): 109.56 - samples/sec: 8007.39 - lr: 0.100000 +2023-04-05 13:34:04,018 epoch 32 - iter 1855/2650 - loss 0.04217149 - time (sec): 128.20 - samples/sec: 7988.00 - lr: 0.100000 +2023-04-05 13:34:21,842 epoch 32 - iter 2120/2650 - loss 0.04232391 - time (sec): 146.03 - samples/sec: 8010.16 - lr: 0.100000 +2023-04-05 13:34:40,289 epoch 32 - iter 2385/2650 - loss 0.04220592 - time (sec): 164.47 - samples/sec: 8009.59 - lr: 0.100000 +2023-04-05 13:34:58,078 epoch 32 - iter 2650/2650 - loss 0.04211352 - time (sec): 182.26 - samples/sec: 8023.40 - lr: 0.100000 +2023-04-05 13:34:58,078 ---------------------------------------------------------------------------------------------------- +2023-04-05 13:34:58,078 EPOCH 32 done: loss 0.0421 - lr 0.100000 +2023-04-05 13:34:58,078 BAD EPOCHS (no improvement): 0 +2023-04-05 13:34:58,081 ---------------------------------------------------------------------------------------------------- +2023-04-05 13:35:16,103 epoch 33 - iter 265/2650 - loss 0.04113740 - time (sec): 18.02 - samples/sec: 7973.63 - lr: 0.100000 +2023-04-05 13:35:34,332 epoch 33 - iter 530/2650 - loss 0.04118676 - time (sec): 36.25 - samples/sec: 8018.59 - lr: 0.100000 +2023-04-05 13:35:52,516 epoch 33 - iter 795/2650 - loss 0.04086561 - time (sec): 54.43 - samples/sec: 8025.98 - lr: 0.100000 +2023-04-05 13:36:10,668 epoch 33 - iter 1060/2650 - loss 0.04127195 - time (sec): 72.59 - samples/sec: 8039.81 - lr: 0.100000 +2023-04-05 13:36:28,677 epoch 33 - iter 1325/2650 - loss 0.04126109 - time (sec): 90.60 - samples/sec: 8054.78 - lr: 0.100000 +2023-04-05 13:36:47,103 epoch 33 - iter 1590/2650 - loss 0.04123808 - time (sec): 109.02 - samples/sec: 8057.19 - lr: 0.100000 +2023-04-05 13:37:04,970 epoch 33 - iter 1855/2650 - loss 0.04145521 - time (sec): 126.89 - samples/sec: 8075.86 - lr: 0.100000 +2023-04-05 13:37:23,316 epoch 33 - iter 2120/2650 - loss 0.04140714 - time (sec): 145.24 - samples/sec: 8051.64 - lr: 0.100000 +2023-04-05 13:37:41,218 epoch 33 - iter 2385/2650 - loss 0.04159778 - time (sec): 163.14 - samples/sec: 8069.73 - lr: 0.100000 +2023-04-05 13:37:59,325 epoch 33 - iter 2650/2650 - loss 0.04164667 - time (sec): 181.24 - samples/sec: 8068.47 - lr: 0.100000 +2023-04-05 13:37:59,326 ---------------------------------------------------------------------------------------------------- +2023-04-05 13:37:59,326 EPOCH 33 done: loss 0.0416 - lr 0.100000 +2023-04-05 13:37:59,326 BAD EPOCHS (no improvement): 0 +2023-04-05 13:37:59,328 ---------------------------------------------------------------------------------------------------- +2023-04-05 13:38:17,152 epoch 34 - iter 265/2650 - loss 0.04032775 - time (sec): 17.82 - samples/sec: 8238.13 - lr: 0.100000 +2023-04-05 13:38:35,244 epoch 34 - iter 530/2650 - loss 0.04028572 - time (sec): 35.92 - samples/sec: 8133.77 - lr: 0.100000 +2023-04-05 13:38:53,010 epoch 34 - iter 795/2650 - loss 0.04087833 - time (sec): 53.68 - samples/sec: 8155.45 - lr: 0.100000 +2023-04-05 13:39:11,323 epoch 34 - iter 1060/2650 - loss 0.04105161 - time (sec): 71.99 - samples/sec: 8122.58 - lr: 0.100000 +2023-04-05 13:39:29,324 epoch 34 - iter 1325/2650 - loss 0.04118121 - time (sec): 90.00 - samples/sec: 8117.99 - lr: 0.100000 +2023-04-05 13:39:47,210 epoch 34 - iter 1590/2650 - loss 0.04152319 - time (sec): 107.88 - samples/sec: 8122.63 - lr: 0.100000 +2023-04-05 13:40:06,042 epoch 34 - iter 1855/2650 - loss 0.04173528 - time (sec): 126.71 - samples/sec: 8078.34 - lr: 0.100000 +2023-04-05 13:40:24,312 epoch 34 - iter 2120/2650 - loss 0.04174055 - time (sec): 144.98 - samples/sec: 8066.62 - lr: 0.100000 +2023-04-05 13:40:42,718 epoch 34 - iter 2385/2650 - loss 0.04186464 - time (sec): 163.39 - samples/sec: 8061.17 - lr: 0.100000 +2023-04-05 13:41:00,935 epoch 34 - iter 2650/2650 - loss 0.04196162 - time (sec): 181.61 - samples/sec: 8052.38 - lr: 0.100000 +2023-04-05 13:41:00,935 ---------------------------------------------------------------------------------------------------- +2023-04-05 13:41:00,935 EPOCH 34 done: loss 0.0420 - lr 0.100000 +2023-04-05 13:41:00,935 BAD EPOCHS (no improvement): 1 +2023-04-05 13:41:00,938 ---------------------------------------------------------------------------------------------------- +2023-04-05 13:41:18,891 epoch 35 - iter 265/2650 - loss 0.03902007 - time (sec): 17.95 - samples/sec: 8092.51 - lr: 0.100000 +2023-04-05 13:41:37,648 epoch 35 - iter 530/2650 - loss 0.03998737 - time (sec): 36.71 - samples/sec: 7956.01 - lr: 0.100000 +2023-04-05 13:41:55,964 epoch 35 - iter 795/2650 - loss 0.04052774 - time (sec): 55.03 - samples/sec: 7963.42 - lr: 0.100000 +2023-04-05 13:42:13,812 epoch 35 - iter 1060/2650 - loss 0.04073243 - time (sec): 72.87 - samples/sec: 8016.36 - lr: 0.100000 +2023-04-05 13:42:31,891 epoch 35 - iter 1325/2650 - loss 0.04130334 - time (sec): 90.95 - samples/sec: 8017.61 - lr: 0.100000 +2023-04-05 13:42:50,349 epoch 35 - iter 1590/2650 - loss 0.04130015 - time (sec): 109.41 - samples/sec: 7998.97 - lr: 0.100000 +2023-04-05 13:43:08,087 epoch 35 - iter 1855/2650 - loss 0.04155846 - time (sec): 127.15 - samples/sec: 8036.61 - lr: 0.100000 +2023-04-05 13:43:26,524 epoch 35 - iter 2120/2650 - loss 0.04151170 - time (sec): 145.59 - samples/sec: 8023.82 - lr: 0.100000 +2023-04-05 13:43:44,727 epoch 35 - iter 2385/2650 - loss 0.04165088 - time (sec): 163.79 - samples/sec: 8033.92 - lr: 0.100000 +2023-04-05 13:44:02,812 epoch 35 - iter 2650/2650 - loss 0.04172819 - time (sec): 181.87 - samples/sec: 8040.54 - lr: 0.100000 +2023-04-05 13:44:02,813 ---------------------------------------------------------------------------------------------------- +2023-04-05 13:44:02,813 EPOCH 35 done: loss 0.0417 - lr 0.100000 +2023-04-05 13:44:02,813 BAD EPOCHS (no improvement): 2 +2023-04-05 13:44:02,816 ---------------------------------------------------------------------------------------------------- +2023-04-05 13:44:20,787 epoch 36 - iter 265/2650 - loss 0.03989163 - time (sec): 17.97 - samples/sec: 8093.05 - lr: 0.100000 +2023-04-05 13:44:38,668 epoch 36 - iter 530/2650 - loss 0.04074671 - time (sec): 35.85 - samples/sec: 8145.16 - lr: 0.100000 +2023-04-05 13:44:56,943 epoch 36 - iter 795/2650 - loss 0.04063702 - time (sec): 54.13 - samples/sec: 8121.42 - lr: 0.100000 +2023-04-05 13:45:14,906 epoch 36 - iter 1060/2650 - loss 0.04123224 - time (sec): 72.09 - samples/sec: 8118.47 - lr: 0.100000 +2023-04-05 13:45:32,688 epoch 36 - iter 1325/2650 - loss 0.04144036 - time (sec): 89.87 - samples/sec: 8149.95 - lr: 0.100000 +2023-04-05 13:45:50,960 epoch 36 - iter 1590/2650 - loss 0.04126246 - time (sec): 108.14 - samples/sec: 8122.52 - lr: 0.100000 +2023-04-05 13:46:09,170 epoch 36 - iter 1855/2650 - loss 0.04113635 - time (sec): 126.35 - samples/sec: 8099.97 - lr: 0.100000 +2023-04-05 13:46:27,653 epoch 36 - iter 2120/2650 - loss 0.04139249 - time (sec): 144.84 - samples/sec: 8069.40 - lr: 0.100000 +2023-04-05 13:46:45,687 epoch 36 - iter 2385/2650 - loss 0.04164580 - time (sec): 162.87 - samples/sec: 8075.69 - lr: 0.100000 +2023-04-05 13:47:03,949 epoch 36 - iter 2650/2650 - loss 0.04177306 - time (sec): 181.13 - samples/sec: 8073.45 - lr: 0.100000 +2023-04-05 13:47:03,949 ---------------------------------------------------------------------------------------------------- +2023-04-05 13:47:03,949 EPOCH 36 done: loss 0.0418 - lr 0.100000 +2023-04-05 13:47:03,949 BAD EPOCHS (no improvement): 3 +2023-04-05 13:47:03,953 ---------------------------------------------------------------------------------------------------- +2023-04-05 13:47:22,548 epoch 37 - iter 265/2650 - loss 0.03937739 - time (sec): 18.60 - samples/sec: 7957.34 - lr: 0.100000 +2023-04-05 13:47:40,772 epoch 37 - iter 530/2650 - loss 0.03992319 - time (sec): 36.82 - samples/sec: 7996.47 - lr: 0.100000 +2023-04-05 13:47:58,599 epoch 37 - iter 795/2650 - loss 0.04038594 - time (sec): 54.65 - samples/sec: 8044.45 - lr: 0.100000 +2023-04-05 13:48:16,970 epoch 37 - iter 1060/2650 - loss 0.04056998 - time (sec): 73.02 - samples/sec: 8042.29 - lr: 0.100000 +2023-04-05 13:48:34,962 epoch 37 - iter 1325/2650 - loss 0.04079154 - time (sec): 91.01 - samples/sec: 8047.38 - lr: 0.100000 +2023-04-05 13:48:53,157 epoch 37 - iter 1590/2650 - loss 0.04065697 - time (sec): 109.20 - samples/sec: 8051.67 - lr: 0.100000 +2023-04-05 13:49:11,205 epoch 37 - iter 1855/2650 - loss 0.04088717 - time (sec): 127.25 - samples/sec: 8062.08 - lr: 0.100000 +2023-04-05 13:49:29,407 epoch 37 - iter 2120/2650 - loss 0.04096640 - time (sec): 145.45 - samples/sec: 8061.20 - lr: 0.100000 +2023-04-05 13:49:47,702 epoch 37 - iter 2385/2650 - loss 0.04125203 - time (sec): 163.75 - samples/sec: 8056.82 - lr: 0.100000 +2023-04-05 13:50:05,171 epoch 37 - iter 2650/2650 - loss 0.04132906 - time (sec): 181.22 - samples/sec: 8069.62 - lr: 0.100000 +2023-04-05 13:50:05,171 ---------------------------------------------------------------------------------------------------- +2023-04-05 13:50:05,171 EPOCH 37 done: loss 0.0413 - lr 0.100000 +2023-04-05 13:50:05,171 BAD EPOCHS (no improvement): 0 +2023-04-05 13:50:05,175 ---------------------------------------------------------------------------------------------------- +2023-04-05 13:50:23,928 epoch 38 - iter 265/2650 - loss 0.04383270 - time (sec): 18.75 - samples/sec: 7768.47 - lr: 0.100000 +2023-04-05 13:50:42,306 epoch 38 - iter 530/2650 - loss 0.04188365 - time (sec): 37.13 - samples/sec: 7851.35 - lr: 0.100000 +2023-04-05 13:51:00,731 epoch 38 - iter 795/2650 - loss 0.04194723 - time (sec): 55.56 - samples/sec: 7863.44 - lr: 0.100000 +2023-04-05 13:51:18,795 epoch 38 - iter 1060/2650 - loss 0.04151871 - time (sec): 73.62 - samples/sec: 7919.66 - lr: 0.100000 +2023-04-05 13:51:36,969 epoch 38 - iter 1325/2650 - loss 0.04133663 - time (sec): 91.79 - samples/sec: 7960.20 - lr: 0.100000 +2023-04-05 13:51:55,380 epoch 38 - iter 1590/2650 - loss 0.04135589 - time (sec): 110.20 - samples/sec: 7966.23 - lr: 0.100000 +2023-04-05 13:52:13,560 epoch 38 - iter 1855/2650 - loss 0.04119698 - time (sec): 128.39 - samples/sec: 7976.98 - lr: 0.100000 +2023-04-05 13:52:31,229 epoch 38 - iter 2120/2650 - loss 0.04159502 - time (sec): 146.05 - samples/sec: 8007.37 - lr: 0.100000 +2023-04-05 13:52:49,863 epoch 38 - iter 2385/2650 - loss 0.04160270 - time (sec): 164.69 - samples/sec: 7995.04 - lr: 0.100000 +2023-04-05 13:53:08,574 epoch 38 - iter 2650/2650 - loss 0.04163645 - time (sec): 183.40 - samples/sec: 7973.67 - lr: 0.100000 +2023-04-05 13:53:08,574 ---------------------------------------------------------------------------------------------------- +2023-04-05 13:53:08,575 EPOCH 38 done: loss 0.0416 - lr 0.100000 +2023-04-05 13:53:08,575 BAD EPOCHS (no improvement): 1 +2023-04-05 13:53:08,578 ---------------------------------------------------------------------------------------------------- +2023-04-05 13:53:26,022 epoch 39 - iter 265/2650 - loss 0.04087264 - time (sec): 17.44 - samples/sec: 8261.25 - lr: 0.100000 +2023-04-05 13:53:44,365 epoch 39 - iter 530/2650 - loss 0.04076545 - time (sec): 35.79 - samples/sec: 8063.32 - lr: 0.100000 +2023-04-05 13:54:03,189 epoch 39 - iter 795/2650 - loss 0.04057494 - time (sec): 54.61 - samples/sec: 7984.57 - lr: 0.100000 +2023-04-05 13:54:21,288 epoch 39 - iter 1060/2650 - loss 0.04079472 - time (sec): 72.71 - samples/sec: 8003.31 - lr: 0.100000 +2023-04-05 13:54:41,297 epoch 39 - iter 1325/2650 - loss 0.04079675 - time (sec): 92.72 - samples/sec: 7860.41 - lr: 0.100000 +2023-04-05 13:55:00,720 epoch 39 - iter 1590/2650 - loss 0.04082025 - time (sec): 112.14 - samples/sec: 7807.71 - lr: 0.100000 +2023-04-05 13:55:19,344 epoch 39 - iter 1855/2650 - loss 0.04083543 - time (sec): 130.77 - samples/sec: 7822.99 - lr: 0.100000 +2023-04-05 13:55:37,962 epoch 39 - iter 2120/2650 - loss 0.04110629 - time (sec): 149.38 - samples/sec: 7826.17 - lr: 0.100000 +2023-04-05 13:55:56,460 epoch 39 - iter 2385/2650 - loss 0.04124247 - time (sec): 167.88 - samples/sec: 7833.14 - lr: 0.100000 +2023-04-05 13:56:14,585 epoch 39 - iter 2650/2650 - loss 0.04118173 - time (sec): 186.01 - samples/sec: 7861.87 - lr: 0.100000 +2023-04-05 13:56:14,585 ---------------------------------------------------------------------------------------------------- +2023-04-05 13:56:14,585 EPOCH 39 done: loss 0.0412 - lr 0.100000 +2023-04-05 13:56:14,586 BAD EPOCHS (no improvement): 0 +2023-04-05 13:56:14,588 ---------------------------------------------------------------------------------------------------- +2023-04-05 13:56:32,742 epoch 40 - iter 265/2650 - loss 0.03876713 - time (sec): 18.15 - samples/sec: 8139.52 - lr: 0.100000 +2023-04-05 13:56:50,675 epoch 40 - iter 530/2650 - loss 0.03907344 - time (sec): 36.09 - samples/sec: 8129.75 - lr: 0.100000 +2023-04-05 13:57:08,793 epoch 40 - iter 795/2650 - loss 0.03958288 - time (sec): 54.20 - samples/sec: 8091.39 - lr: 0.100000 +2023-04-05 13:57:27,293 epoch 40 - iter 1060/2650 - loss 0.04017258 - time (sec): 72.70 - samples/sec: 8037.80 - lr: 0.100000 +2023-04-05 13:57:46,110 epoch 40 - iter 1325/2650 - loss 0.04036219 - time (sec): 91.52 - samples/sec: 7993.13 - lr: 0.100000 +2023-04-05 13:58:04,438 epoch 40 - iter 1590/2650 - loss 0.04024071 - time (sec): 109.85 - samples/sec: 7983.30 - lr: 0.100000 +2023-04-05 13:58:22,971 epoch 40 - iter 1855/2650 - loss 0.04031818 - time (sec): 128.38 - samples/sec: 7974.43 - lr: 0.100000 +2023-04-05 13:58:41,134 epoch 40 - iter 2120/2650 - loss 0.04045693 - time (sec): 146.55 - samples/sec: 7986.97 - lr: 0.100000 +2023-04-05 13:58:59,177 epoch 40 - iter 2385/2650 - loss 0.04070948 - time (sec): 164.59 - samples/sec: 8002.63 - lr: 0.100000 +2023-04-05 13:59:16,937 epoch 40 - iter 2650/2650 - loss 0.04090536 - time (sec): 182.35 - samples/sec: 8019.60 - lr: 0.100000 +2023-04-05 13:59:16,937 ---------------------------------------------------------------------------------------------------- +2023-04-05 13:59:16,937 EPOCH 40 done: loss 0.0409 - lr 0.100000 +2023-04-05 13:59:16,938 BAD EPOCHS (no improvement): 0 +2023-04-05 13:59:16,941 ---------------------------------------------------------------------------------------------------- +2023-04-05 13:59:35,574 epoch 41 - iter 265/2650 - loss 0.04110906 - time (sec): 18.63 - samples/sec: 7794.26 - lr: 0.100000 +2023-04-05 13:59:54,105 epoch 41 - iter 530/2650 - loss 0.03991654 - time (sec): 37.16 - samples/sec: 7851.71 - lr: 0.100000 +2023-04-05 14:00:11,955 epoch 41 - iter 795/2650 - loss 0.04015277 - time (sec): 55.01 - samples/sec: 7953.94 - lr: 0.100000 +2023-04-05 14:00:30,102 epoch 41 - iter 1060/2650 - loss 0.04025711 - time (sec): 73.16 - samples/sec: 7974.91 - lr: 0.100000 +2023-04-05 14:00:48,255 epoch 41 - iter 1325/2650 - loss 0.04093862 - time (sec): 91.31 - samples/sec: 8004.37 - lr: 0.100000 +2023-04-05 14:01:06,770 epoch 41 - iter 1590/2650 - loss 0.04115403 - time (sec): 109.83 - samples/sec: 8017.84 - lr: 0.100000 +2023-04-05 14:01:24,717 epoch 41 - iter 1855/2650 - loss 0.04092722 - time (sec): 127.78 - samples/sec: 8035.12 - lr: 0.100000 +2023-04-05 14:01:42,808 epoch 41 - iter 2120/2650 - loss 0.04087952 - time (sec): 145.87 - samples/sec: 8032.41 - lr: 0.100000 +2023-04-05 14:02:00,694 epoch 41 - iter 2385/2650 - loss 0.04097686 - time (sec): 163.75 - samples/sec: 8041.19 - lr: 0.100000 +2023-04-05 14:02:18,474 epoch 41 - iter 2650/2650 - loss 0.04108247 - time (sec): 181.53 - samples/sec: 8055.63 - lr: 0.100000 +2023-04-05 14:02:18,474 ---------------------------------------------------------------------------------------------------- +2023-04-05 14:02:18,474 EPOCH 41 done: loss 0.0411 - lr 0.100000 +2023-04-05 14:02:18,475 BAD EPOCHS (no improvement): 1 +2023-04-05 14:02:18,478 ---------------------------------------------------------------------------------------------------- +2023-04-05 14:02:36,748 epoch 42 - iter 265/2650 - loss 0.03884482 - time (sec): 18.27 - samples/sec: 7957.35 - lr: 0.100000 +2023-04-05 14:02:54,675 epoch 42 - iter 530/2650 - loss 0.03966526 - time (sec): 36.20 - samples/sec: 8051.20 - lr: 0.100000 +2023-04-05 14:03:12,380 epoch 42 - iter 795/2650 - loss 0.04064784 - time (sec): 53.90 - samples/sec: 8082.66 - lr: 0.100000 +2023-04-05 14:03:30,494 epoch 42 - iter 1060/2650 - loss 0.04042028 - time (sec): 72.02 - samples/sec: 8100.35 - lr: 0.100000 +2023-04-05 14:03:48,404 epoch 42 - iter 1325/2650 - loss 0.04078388 - time (sec): 89.93 - samples/sec: 8106.27 - lr: 0.100000 +2023-04-05 14:04:07,710 epoch 42 - iter 1590/2650 - loss 0.04081253 - time (sec): 109.23 - samples/sec: 8039.81 - lr: 0.100000 +2023-04-05 14:04:25,522 epoch 42 - iter 1855/2650 - loss 0.04083092 - time (sec): 127.04 - samples/sec: 8061.94 - lr: 0.100000 +2023-04-05 14:04:43,875 epoch 42 - iter 2120/2650 - loss 0.04087742 - time (sec): 145.40 - samples/sec: 8059.79 - lr: 0.100000 +2023-04-05 14:05:02,174 epoch 42 - iter 2385/2650 - loss 0.04109521 - time (sec): 163.70 - samples/sec: 8043.70 - lr: 0.100000 +2023-04-05 14:05:20,221 epoch 42 - iter 2650/2650 - loss 0.04124523 - time (sec): 181.74 - samples/sec: 8046.34 - lr: 0.100000 +2023-04-05 14:05:20,221 ---------------------------------------------------------------------------------------------------- +2023-04-05 14:05:20,221 EPOCH 42 done: loss 0.0412 - lr 0.100000 +2023-04-05 14:05:20,221 BAD EPOCHS (no improvement): 2 +2023-04-05 14:05:20,224 ---------------------------------------------------------------------------------------------------- +2023-04-05 14:05:38,918 epoch 43 - iter 265/2650 - loss 0.03914060 - time (sec): 18.69 - samples/sec: 7854.03 - lr: 0.100000 +2023-04-05 14:05:57,098 epoch 43 - iter 530/2650 - loss 0.03897795 - time (sec): 36.87 - samples/sec: 7908.67 - lr: 0.100000 +2023-04-05 14:06:16,108 epoch 43 - iter 795/2650 - loss 0.03987165 - time (sec): 55.88 - samples/sec: 7871.89 - lr: 0.100000 +2023-04-05 14:06:34,505 epoch 43 - iter 1060/2650 - loss 0.04058359 - time (sec): 74.28 - samples/sec: 7897.61 - lr: 0.100000 +2023-04-05 14:06:52,733 epoch 43 - iter 1325/2650 - loss 0.04030989 - time (sec): 92.51 - samples/sec: 7942.58 - lr: 0.100000 +2023-04-05 14:07:10,926 epoch 43 - iter 1590/2650 - loss 0.04036084 - time (sec): 110.70 - samples/sec: 7966.59 - lr: 0.100000 +2023-04-05 14:07:28,763 epoch 43 - iter 1855/2650 - loss 0.04070626 - time (sec): 128.54 - samples/sec: 7988.79 - lr: 0.100000 +2023-04-05 14:07:55,812 epoch 43 - iter 2120/2650 - loss 0.04058306 - time (sec): 155.59 - samples/sec: 7531.35 - lr: 0.100000 +2023-04-05 14:08:14,044 epoch 43 - iter 2385/2650 - loss 0.04072473 - time (sec): 173.82 - samples/sec: 7577.65 - lr: 0.100000 +2023-04-05 14:08:32,143 epoch 43 - iter 2650/2650 - loss 0.04060954 - time (sec): 191.92 - samples/sec: 7619.68 - lr: 0.100000 +2023-04-05 14:08:32,144 ---------------------------------------------------------------------------------------------------- +2023-04-05 14:08:32,144 EPOCH 43 done: loss 0.0406 - lr 0.100000 +2023-04-05 14:08:32,144 BAD EPOCHS (no improvement): 0 +2023-04-05 14:08:32,146 ---------------------------------------------------------------------------------------------------- +2023-04-05 14:08:51,106 epoch 44 - iter 265/2650 - loss 0.03918091 - time (sec): 18.96 - samples/sec: 7821.38 - lr: 0.100000 +2023-04-05 14:09:08,660 epoch 44 - iter 530/2650 - loss 0.04020787 - time (sec): 36.51 - samples/sec: 8022.04 - lr: 0.100000 +2023-04-05 14:09:26,637 epoch 44 - iter 795/2650 - loss 0.03937184 - time (sec): 54.49 - samples/sec: 8059.12 - lr: 0.100000 +2023-04-05 14:09:45,099 epoch 44 - iter 1060/2650 - loss 0.03995217 - time (sec): 72.95 - samples/sec: 8037.76 - lr: 0.100000 +2023-04-05 14:10:03,263 epoch 44 - iter 1325/2650 - loss 0.04010491 - time (sec): 91.12 - samples/sec: 8056.04 - lr: 0.100000 +2023-04-05 14:10:21,345 epoch 44 - iter 1590/2650 - loss 0.04013148 - time (sec): 109.20 - samples/sec: 8053.45 - lr: 0.100000 +2023-04-05 14:10:39,310 epoch 44 - iter 1855/2650 - loss 0.04003366 - time (sec): 127.16 - samples/sec: 8065.66 - lr: 0.100000 +2023-04-05 14:10:57,206 epoch 44 - iter 2120/2650 - loss 0.04030451 - time (sec): 145.06 - samples/sec: 8076.87 - lr: 0.100000 +2023-04-05 14:11:15,096 epoch 44 - iter 2385/2650 - loss 0.04020923 - time (sec): 162.95 - samples/sec: 8088.81 - lr: 0.100000 +2023-04-05 14:11:32,871 epoch 44 - iter 2650/2650 - loss 0.04042246 - time (sec): 180.72 - samples/sec: 8091.66 - lr: 0.100000 +2023-04-05 14:11:32,872 ---------------------------------------------------------------------------------------------------- +2023-04-05 14:11:32,872 EPOCH 44 done: loss 0.0404 - lr 0.100000 +2023-04-05 14:11:32,872 BAD EPOCHS (no improvement): 0 +2023-04-05 14:11:32,874 ---------------------------------------------------------------------------------------------------- +2023-04-05 14:11:51,266 epoch 45 - iter 265/2650 - loss 0.03909350 - time (sec): 18.39 - samples/sec: 7909.82 - lr: 0.100000 +2023-04-05 14:12:09,482 epoch 45 - iter 530/2650 - loss 0.03970351 - time (sec): 36.61 - samples/sec: 7989.91 - lr: 0.100000 +2023-04-05 14:12:28,294 epoch 45 - iter 795/2650 - loss 0.03992902 - time (sec): 55.42 - samples/sec: 7939.87 - lr: 0.100000 +2023-04-05 14:12:46,034 epoch 45 - iter 1060/2650 - loss 0.04013327 - time (sec): 73.16 - samples/sec: 8019.64 - lr: 0.100000 +2023-04-05 14:13:04,536 epoch 45 - iter 1325/2650 - loss 0.04013230 - time (sec): 91.66 - samples/sec: 7994.35 - lr: 0.100000 +2023-04-05 14:13:22,865 epoch 45 - iter 1590/2650 - loss 0.04026092 - time (sec): 109.99 - samples/sec: 7990.03 - lr: 0.100000 +2023-04-05 14:13:40,754 epoch 45 - iter 1855/2650 - loss 0.04063067 - time (sec): 127.88 - samples/sec: 8003.10 - lr: 0.100000 +2023-04-05 14:13:58,644 epoch 45 - iter 2120/2650 - loss 0.04077307 - time (sec): 145.77 - samples/sec: 8022.51 - lr: 0.100000 +2023-04-05 14:14:17,364 epoch 45 - iter 2385/2650 - loss 0.04088952 - time (sec): 164.49 - samples/sec: 8015.16 - lr: 0.100000 +2023-04-05 14:14:35,673 epoch 45 - iter 2650/2650 - loss 0.04079982 - time (sec): 182.80 - samples/sec: 7999.86 - lr: 0.100000 +2023-04-05 14:14:35,673 ---------------------------------------------------------------------------------------------------- +2023-04-05 14:14:35,673 EPOCH 45 done: loss 0.0408 - lr 0.100000 +2023-04-05 14:14:35,674 BAD EPOCHS (no improvement): 1 +2023-04-05 14:14:35,676 ---------------------------------------------------------------------------------------------------- +2023-04-05 14:14:54,969 epoch 46 - iter 265/2650 - loss 0.03921600 - time (sec): 19.29 - samples/sec: 7714.65 - lr: 0.100000 +2023-04-05 14:15:12,757 epoch 46 - iter 530/2650 - loss 0.03954477 - time (sec): 37.08 - samples/sec: 7951.82 - lr: 0.100000 +2023-04-05 14:15:31,395 epoch 46 - iter 795/2650 - loss 0.03974565 - time (sec): 55.72 - samples/sec: 7916.98 - lr: 0.100000 +2023-04-05 14:15:49,141 epoch 46 - iter 1060/2650 - loss 0.03950021 - time (sec): 73.47 - samples/sec: 7967.96 - lr: 0.100000 +2023-04-05 14:16:07,351 epoch 46 - iter 1325/2650 - loss 0.03964841 - time (sec): 91.68 - samples/sec: 7991.27 - lr: 0.100000 +2023-04-05 14:16:25,473 epoch 46 - iter 1590/2650 - loss 0.03972167 - time (sec): 109.80 - samples/sec: 7985.77 - lr: 0.100000 +2023-04-05 14:16:43,255 epoch 46 - iter 1855/2650 - loss 0.03997422 - time (sec): 127.58 - samples/sec: 8016.41 - lr: 0.100000 +2023-04-05 14:17:01,586 epoch 46 - iter 2120/2650 - loss 0.04025568 - time (sec): 145.91 - samples/sec: 8025.58 - lr: 0.100000 +2023-04-05 14:17:20,163 epoch 46 - iter 2385/2650 - loss 0.04016361 - time (sec): 164.49 - samples/sec: 8010.97 - lr: 0.100000 +2023-04-05 14:17:37,775 epoch 46 - iter 2650/2650 - loss 0.04033806 - time (sec): 182.10 - samples/sec: 8030.57 - lr: 0.100000 +2023-04-05 14:17:37,776 ---------------------------------------------------------------------------------------------------- +2023-04-05 14:17:37,776 EPOCH 46 done: loss 0.0403 - lr 0.100000 +2023-04-05 14:17:37,776 BAD EPOCHS (no improvement): 0 +2023-04-05 14:17:37,779 ---------------------------------------------------------------------------------------------------- +2023-04-05 14:17:56,066 epoch 47 - iter 265/2650 - loss 0.03836738 - time (sec): 18.29 - samples/sec: 8105.17 - lr: 0.100000 +2023-04-05 14:18:13,844 epoch 47 - iter 530/2650 - loss 0.03914521 - time (sec): 36.07 - samples/sec: 8107.21 - lr: 0.100000 +2023-04-05 14:18:31,844 epoch 47 - iter 795/2650 - loss 0.03978921 - time (sec): 54.06 - samples/sec: 8110.23 - lr: 0.100000 +2023-04-05 14:18:49,931 epoch 47 - iter 1060/2650 - loss 0.03988945 - time (sec): 72.15 - samples/sec: 8105.02 - lr: 0.100000 +2023-04-05 14:19:08,014 epoch 47 - iter 1325/2650 - loss 0.03935177 - time (sec): 90.24 - samples/sec: 8102.06 - lr: 0.100000 +2023-04-05 14:19:26,173 epoch 47 - iter 1590/2650 - loss 0.03932793 - time (sec): 108.39 - samples/sec: 8082.27 - lr: 0.100000 +2023-04-05 14:19:44,948 epoch 47 - iter 1855/2650 - loss 0.03972726 - time (sec): 127.17 - samples/sec: 8053.81 - lr: 0.100000 +2023-04-05 14:20:03,101 epoch 47 - iter 2120/2650 - loss 0.04007483 - time (sec): 145.32 - samples/sec: 8056.54 - lr: 0.100000 +2023-04-05 14:20:21,206 epoch 47 - iter 2385/2650 - loss 0.04021612 - time (sec): 163.43 - samples/sec: 8053.54 - lr: 0.100000 +2023-04-05 14:20:39,687 epoch 47 - iter 2650/2650 - loss 0.04022225 - time (sec): 181.91 - samples/sec: 8039.05 - lr: 0.100000 +2023-04-05 14:20:39,687 ---------------------------------------------------------------------------------------------------- +2023-04-05 14:20:39,687 EPOCH 47 done: loss 0.0402 - lr 0.100000 +2023-04-05 14:20:39,687 BAD EPOCHS (no improvement): 0 +2023-04-05 14:20:39,690 ---------------------------------------------------------------------------------------------------- +2023-04-05 14:20:57,948 epoch 48 - iter 265/2650 - loss 0.03861889 - time (sec): 18.26 - samples/sec: 8013.37 - lr: 0.100000 +2023-04-05 14:21:16,325 epoch 48 - iter 530/2650 - loss 0.03927915 - time (sec): 36.63 - samples/sec: 7983.59 - lr: 0.100000 +2023-04-05 14:21:34,509 epoch 48 - iter 795/2650 - loss 0.03907398 - time (sec): 54.82 - samples/sec: 8026.12 - lr: 0.100000 +2023-04-05 14:21:52,225 epoch 48 - iter 1060/2650 - loss 0.03936735 - time (sec): 72.53 - samples/sec: 8083.39 - lr: 0.100000 +2023-04-05 14:22:10,266 epoch 48 - iter 1325/2650 - loss 0.03945020 - time (sec): 90.58 - samples/sec: 8083.65 - lr: 0.100000 +2023-04-05 14:22:28,340 epoch 48 - iter 1590/2650 - loss 0.03941673 - time (sec): 108.65 - samples/sec: 8085.16 - lr: 0.100000 +2023-04-05 14:22:46,621 epoch 48 - iter 1855/2650 - loss 0.03970985 - time (sec): 126.93 - samples/sec: 8069.04 - lr: 0.100000 +2023-04-05 14:23:05,078 epoch 48 - iter 2120/2650 - loss 0.03998193 - time (sec): 145.39 - samples/sec: 8058.90 - lr: 0.100000 +2023-04-05 14:23:22,996 epoch 48 - iter 2385/2650 - loss 0.04013525 - time (sec): 163.31 - samples/sec: 8061.25 - lr: 0.100000 +2023-04-05 14:23:41,357 epoch 48 - iter 2650/2650 - loss 0.04024657 - time (sec): 181.67 - samples/sec: 8049.68 - lr: 0.100000 +2023-04-05 14:23:41,358 ---------------------------------------------------------------------------------------------------- +2023-04-05 14:23:41,358 EPOCH 48 done: loss 0.0402 - lr 0.100000 +2023-04-05 14:23:41,358 BAD EPOCHS (no improvement): 1 +2023-04-05 14:23:41,361 ---------------------------------------------------------------------------------------------------- +2023-04-05 14:23:59,850 epoch 49 - iter 265/2650 - loss 0.04012170 - time (sec): 18.49 - samples/sec: 7958.22 - lr: 0.100000 +2023-04-05 14:24:17,564 epoch 49 - iter 530/2650 - loss 0.04024082 - time (sec): 36.20 - samples/sec: 8120.15 - lr: 0.100000 +2023-04-05 14:24:35,455 epoch 49 - iter 795/2650 - loss 0.04026430 - time (sec): 54.09 - samples/sec: 8138.42 - lr: 0.100000 +2023-04-05 14:24:53,336 epoch 49 - iter 1060/2650 - loss 0.04039873 - time (sec): 71.98 - samples/sec: 8136.12 - lr: 0.100000 +2023-04-05 14:25:11,251 epoch 49 - iter 1325/2650 - loss 0.04000186 - time (sec): 89.89 - samples/sec: 8122.60 - lr: 0.100000 +2023-04-05 14:25:29,036 epoch 49 - iter 1590/2650 - loss 0.03977296 - time (sec): 107.67 - samples/sec: 8141.63 - lr: 0.100000 +2023-04-05 14:25:47,620 epoch 49 - iter 1855/2650 - loss 0.04003576 - time (sec): 126.26 - samples/sec: 8102.92 - lr: 0.100000 +2023-04-05 14:26:05,504 epoch 49 - iter 2120/2650 - loss 0.04005786 - time (sec): 144.14 - samples/sec: 8108.69 - lr: 0.100000 +2023-04-05 14:26:23,786 epoch 49 - iter 2385/2650 - loss 0.04030304 - time (sec): 162.43 - samples/sec: 8101.21 - lr: 0.100000 +2023-04-05 14:26:42,050 epoch 49 - iter 2650/2650 - loss 0.04048654 - time (sec): 180.69 - samples/sec: 8093.24 - lr: 0.100000 +2023-04-05 14:26:42,051 ---------------------------------------------------------------------------------------------------- +2023-04-05 14:26:42,051 EPOCH 49 done: loss 0.0405 - lr 0.100000 +2023-04-05 14:26:42,051 BAD EPOCHS (no improvement): 2 +2023-04-05 14:26:42,053 ---------------------------------------------------------------------------------------------------- +2023-04-05 14:27:00,467 epoch 50 - iter 265/2650 - loss 0.03922237 - time (sec): 18.41 - samples/sec: 7996.92 - lr: 0.100000 +2023-04-05 14:27:18,706 epoch 50 - iter 530/2650 - loss 0.03893051 - time (sec): 36.65 - samples/sec: 7991.19 - lr: 0.100000 +2023-04-05 14:27:36,864 epoch 50 - iter 795/2650 - loss 0.03915797 - time (sec): 54.81 - samples/sec: 8016.82 - lr: 0.100000 +2023-04-05 14:27:54,589 epoch 50 - iter 1060/2650 - loss 0.03960933 - time (sec): 72.54 - samples/sec: 8065.62 - lr: 0.100000 +2023-04-05 14:28:12,839 epoch 50 - iter 1325/2650 - loss 0.04011978 - time (sec): 90.79 - samples/sec: 8047.01 - lr: 0.100000 +2023-04-05 14:28:31,217 epoch 50 - iter 1590/2650 - loss 0.03994922 - time (sec): 109.16 - samples/sec: 8025.53 - lr: 0.100000 +2023-04-05 14:28:49,229 epoch 50 - iter 1855/2650 - loss 0.04000701 - time (sec): 127.18 - samples/sec: 8035.68 - lr: 0.100000 +2023-04-05 14:29:07,625 epoch 50 - iter 2120/2650 - loss 0.04003744 - time (sec): 145.57 - samples/sec: 8025.48 - lr: 0.100000 +2023-04-05 14:29:25,484 epoch 50 - iter 2385/2650 - loss 0.04015971 - time (sec): 163.43 - samples/sec: 8049.02 - lr: 0.100000 +2023-04-05 14:29:43,390 epoch 50 - iter 2650/2650 - loss 0.04025809 - time (sec): 181.34 - samples/sec: 8064.34 - lr: 0.100000 +2023-04-05 14:29:43,390 ---------------------------------------------------------------------------------------------------- +2023-04-05 14:29:43,390 EPOCH 50 done: loss 0.0403 - lr 0.100000 +2023-04-05 14:29:43,390 BAD EPOCHS (no improvement): 3 +2023-04-05 14:29:43,393 ---------------------------------------------------------------------------------------------------- +2023-04-05 14:30:01,962 epoch 51 - iter 265/2650 - loss 0.03812507 - time (sec): 18.57 - samples/sec: 7876.75 - lr: 0.100000 +2023-04-05 14:30:19,636 epoch 51 - iter 530/2650 - loss 0.03858783 - time (sec): 36.24 - samples/sec: 8030.27 - lr: 0.100000 +2023-04-05 14:30:38,481 epoch 51 - iter 795/2650 - loss 0.03893180 - time (sec): 55.09 - samples/sec: 7990.47 - lr: 0.100000 +2023-04-05 14:30:56,569 epoch 51 - iter 1060/2650 - loss 0.03893548 - time (sec): 73.18 - samples/sec: 8010.98 - lr: 0.100000 +2023-04-05 14:31:13,963 epoch 51 - iter 1325/2650 - loss 0.03895381 - time (sec): 90.57 - samples/sec: 8055.51 - lr: 0.100000 +2023-04-05 14:31:31,783 epoch 51 - iter 1590/2650 - loss 0.03915072 - time (sec): 108.39 - samples/sec: 8070.45 - lr: 0.100000 +2023-04-05 14:31:49,688 epoch 51 - iter 1855/2650 - loss 0.03921638 - time (sec): 126.30 - samples/sec: 8087.95 - lr: 0.100000 +2023-04-05 14:32:07,845 epoch 51 - iter 2120/2650 - loss 0.03945988 - time (sec): 144.45 - samples/sec: 8086.10 - lr: 0.100000 +2023-04-05 14:32:26,305 epoch 51 - iter 2385/2650 - loss 0.03969158 - time (sec): 162.91 - samples/sec: 8069.70 - lr: 0.100000 +2023-04-05 14:32:44,612 epoch 51 - iter 2650/2650 - loss 0.03989519 - time (sec): 181.22 - samples/sec: 8069.61 - lr: 0.100000 +2023-04-05 14:32:44,612 ---------------------------------------------------------------------------------------------------- +2023-04-05 14:32:44,612 EPOCH 51 done: loss 0.0399 - lr 0.100000 +2023-04-05 14:32:44,612 BAD EPOCHS (no improvement): 0 +2023-04-05 14:32:44,614 ---------------------------------------------------------------------------------------------------- +2023-04-05 14:33:02,454 epoch 52 - iter 265/2650 - loss 0.03949242 - time (sec): 17.84 - samples/sec: 8216.43 - lr: 0.100000 +2023-04-05 14:33:20,781 epoch 52 - iter 530/2650 - loss 0.03898969 - time (sec): 36.17 - samples/sec: 8109.99 - lr: 0.100000 +2023-04-05 14:33:38,605 epoch 52 - iter 795/2650 - loss 0.03908908 - time (sec): 53.99 - samples/sec: 8112.98 - lr: 0.100000 +2023-04-05 14:33:56,851 epoch 52 - iter 1060/2650 - loss 0.03912563 - time (sec): 72.24 - samples/sec: 8074.43 - lr: 0.100000 +2023-04-05 14:34:14,681 epoch 52 - iter 1325/2650 - loss 0.03957400 - time (sec): 90.07 - samples/sec: 8094.01 - lr: 0.100000 +2023-04-05 14:34:32,832 epoch 52 - iter 1590/2650 - loss 0.03964304 - time (sec): 108.22 - samples/sec: 8083.37 - lr: 0.100000 +2023-04-05 14:34:51,643 epoch 52 - iter 1855/2650 - loss 0.03965549 - time (sec): 127.03 - samples/sec: 8050.19 - lr: 0.100000 +2023-04-05 14:35:09,852 epoch 52 - iter 2120/2650 - loss 0.03975091 - time (sec): 145.24 - samples/sec: 8050.67 - lr: 0.100000 +2023-04-05 14:35:28,196 epoch 52 - iter 2385/2650 - loss 0.03974329 - time (sec): 163.58 - samples/sec: 8047.40 - lr: 0.100000 +2023-04-05 14:35:46,422 epoch 52 - iter 2650/2650 - loss 0.03983553 - time (sec): 181.81 - samples/sec: 8043.48 - lr: 0.100000 +2023-04-05 14:35:46,422 ---------------------------------------------------------------------------------------------------- +2023-04-05 14:35:46,422 EPOCH 52 done: loss 0.0398 - lr 0.100000 +2023-04-05 14:35:46,422 BAD EPOCHS (no improvement): 0 +2023-04-05 14:35:46,425 ---------------------------------------------------------------------------------------------------- +2023-04-05 14:36:05,020 epoch 53 - iter 265/2650 - loss 0.03997397 - time (sec): 18.60 - samples/sec: 7883.01 - lr: 0.100000 +2023-04-05 14:36:23,894 epoch 53 - iter 530/2650 - loss 0.04065717 - time (sec): 37.47 - samples/sec: 7824.79 - lr: 0.100000 +2023-04-05 14:36:41,635 epoch 53 - iter 795/2650 - loss 0.04068847 - time (sec): 55.21 - samples/sec: 7925.63 - lr: 0.100000 +2023-04-05 14:37:00,023 epoch 53 - iter 1060/2650 - loss 0.04045005 - time (sec): 73.60 - samples/sec: 7970.72 - lr: 0.100000 +2023-04-05 14:37:18,752 epoch 53 - iter 1325/2650 - loss 0.04077156 - time (sec): 92.33 - samples/sec: 7952.90 - lr: 0.100000 +2023-04-05 14:37:36,955 epoch 53 - iter 1590/2650 - loss 0.04053930 - time (sec): 110.53 - samples/sec: 7950.94 - lr: 0.100000 +2023-04-05 14:37:55,333 epoch 53 - iter 1855/2650 - loss 0.04032789 - time (sec): 128.91 - samples/sec: 7953.67 - lr: 0.100000 +2023-04-05 14:38:13,740 epoch 53 - iter 2120/2650 - loss 0.04016615 - time (sec): 147.32 - samples/sec: 7952.71 - lr: 0.100000 +2023-04-05 14:38:31,850 epoch 53 - iter 2385/2650 - loss 0.04022834 - time (sec): 165.43 - samples/sec: 7961.15 - lr: 0.100000 +2023-04-05 14:38:49,605 epoch 53 - iter 2650/2650 - loss 0.04031738 - time (sec): 183.18 - samples/sec: 7983.19 - lr: 0.100000 +2023-04-05 14:38:49,606 ---------------------------------------------------------------------------------------------------- +2023-04-05 14:38:49,606 EPOCH 53 done: loss 0.0403 - lr 0.100000 +2023-04-05 14:38:49,606 BAD EPOCHS (no improvement): 1 +2023-04-05 14:38:49,609 ---------------------------------------------------------------------------------------------------- +2023-04-05 14:39:08,414 epoch 54 - iter 265/2650 - loss 0.03981605 - time (sec): 18.80 - samples/sec: 7865.02 - lr: 0.100000 +2023-04-05 14:39:26,505 epoch 54 - iter 530/2650 - loss 0.03929504 - time (sec): 36.90 - samples/sec: 7969.28 - lr: 0.100000 +2023-04-05 14:39:45,534 epoch 54 - iter 795/2650 - loss 0.03963348 - time (sec): 55.93 - samples/sec: 7857.65 - lr: 0.100000 +2023-04-05 14:40:04,767 epoch 54 - iter 1060/2650 - loss 0.03916536 - time (sec): 75.16 - samples/sec: 7780.08 - lr: 0.100000 +2023-04-05 14:40:24,477 epoch 54 - iter 1325/2650 - loss 0.03970923 - time (sec): 94.87 - samples/sec: 7694.55 - lr: 0.100000 +2023-04-05 14:40:44,409 epoch 54 - iter 1590/2650 - loss 0.03964163 - time (sec): 114.80 - samples/sec: 7632.03 - lr: 0.100000 +2023-04-05 14:41:04,175 epoch 54 - iter 1855/2650 - loss 0.03981455 - time (sec): 134.57 - samples/sec: 7602.85 - lr: 0.100000 +2023-04-05 14:41:23,642 epoch 54 - iter 2120/2650 - loss 0.03981412 - time (sec): 154.03 - samples/sec: 7590.31 - lr: 0.100000 +2023-04-05 14:41:43,725 epoch 54 - iter 2385/2650 - loss 0.03986044 - time (sec): 174.12 - samples/sec: 7556.32 - lr: 0.100000 +2023-04-05 14:42:03,660 epoch 54 - iter 2650/2650 - loss 0.04008108 - time (sec): 194.05 - samples/sec: 7535.97 - lr: 0.100000 +2023-04-05 14:42:03,660 ---------------------------------------------------------------------------------------------------- +2023-04-05 14:42:03,660 EPOCH 54 done: loss 0.0401 - lr 0.100000 +2023-04-05 14:42:03,660 BAD EPOCHS (no improvement): 2 +2023-04-05 14:42:03,663 ---------------------------------------------------------------------------------------------------- +2023-04-05 14:42:23,194 epoch 55 - iter 265/2650 - loss 0.04017381 - time (sec): 19.53 - samples/sec: 7419.58 - lr: 0.100000 +2023-04-05 14:42:42,458 epoch 55 - iter 530/2650 - loss 0.03991760 - time (sec): 38.79 - samples/sec: 7487.44 - lr: 0.100000 +2023-04-05 14:43:01,639 epoch 55 - iter 795/2650 - loss 0.03980712 - time (sec): 57.98 - samples/sec: 7531.65 - lr: 0.100000 +2023-04-05 14:43:20,860 epoch 55 - iter 1060/2650 - loss 0.04031493 - time (sec): 77.20 - samples/sec: 7549.20 - lr: 0.100000 +2023-04-05 14:43:39,860 epoch 55 - iter 1325/2650 - loss 0.04080985 - time (sec): 96.20 - samples/sec: 7587.81 - lr: 0.100000 +2023-04-05 14:43:59,211 epoch 55 - iter 1590/2650 - loss 0.04015990 - time (sec): 115.55 - samples/sec: 7592.55 - lr: 0.100000 +2023-04-05 14:44:18,240 epoch 55 - iter 1855/2650 - loss 0.04041682 - time (sec): 134.58 - samples/sec: 7602.15 - lr: 0.100000 +2023-04-05 14:44:37,083 epoch 55 - iter 2120/2650 - loss 0.04028490 - time (sec): 153.42 - samples/sec: 7618.85 - lr: 0.100000 +2023-04-05 14:44:56,310 epoch 55 - iter 2385/2650 - loss 0.04010795 - time (sec): 172.65 - samples/sec: 7618.51 - lr: 0.100000 +2023-04-05 14:45:15,215 epoch 55 - iter 2650/2650 - loss 0.04013712 - time (sec): 191.55 - samples/sec: 7634.29 - lr: 0.100000 +2023-04-05 14:45:15,216 ---------------------------------------------------------------------------------------------------- +2023-04-05 14:45:15,216 EPOCH 55 done: loss 0.0401 - lr 0.100000 +2023-04-05 14:45:15,216 BAD EPOCHS (no improvement): 3 +2023-04-05 14:45:15,219 ---------------------------------------------------------------------------------------------------- +2023-04-05 14:45:33,724 epoch 56 - iter 265/2650 - loss 0.03769394 - time (sec): 18.51 - samples/sec: 7833.29 - lr: 0.100000 +2023-04-05 14:45:52,223 epoch 56 - iter 530/2650 - loss 0.03896277 - time (sec): 37.00 - samples/sec: 7855.85 - lr: 0.100000 +2023-04-05 14:46:11,732 epoch 56 - iter 795/2650 - loss 0.03943176 - time (sec): 56.51 - samples/sec: 7739.18 - lr: 0.100000 +2023-04-05 14:46:30,409 epoch 56 - iter 1060/2650 - loss 0.03952033 - time (sec): 75.19 - samples/sec: 7764.41 - lr: 0.100000 +2023-04-05 14:46:49,448 epoch 56 - iter 1325/2650 - loss 0.03985000 - time (sec): 94.23 - samples/sec: 7742.72 - lr: 0.100000 +2023-04-05 14:47:08,186 epoch 56 - iter 1590/2650 - loss 0.03981211 - time (sec): 112.97 - samples/sec: 7770.54 - lr: 0.100000 +2023-04-05 14:47:27,662 epoch 56 - iter 1855/2650 - loss 0.03993281 - time (sec): 132.44 - samples/sec: 7740.40 - lr: 0.100000 +2023-04-05 14:47:46,803 epoch 56 - iter 2120/2650 - loss 0.03999352 - time (sec): 151.58 - samples/sec: 7733.18 - lr: 0.100000 +2023-04-05 14:48:05,260 epoch 56 - iter 2385/2650 - loss 0.03994656 - time (sec): 170.04 - samples/sec: 7738.90 - lr: 0.100000 +2023-04-05 14:48:24,098 epoch 56 - iter 2650/2650 - loss 0.03998935 - time (sec): 188.88 - samples/sec: 7742.30 - lr: 0.100000 +2023-04-05 14:48:24,099 ---------------------------------------------------------------------------------------------------- +2023-04-05 14:48:24,099 EPOCH 56 done: loss 0.0400 - lr 0.100000 +2023-04-05 14:48:24,099 Epoch 56: reducing learning rate of group 0 to 5.0000e-02. +2023-04-05 14:48:24,099 BAD EPOCHS (no improvement): 4 +2023-04-05 14:48:24,102 ---------------------------------------------------------------------------------------------------- +2023-04-05 14:48:43,205 epoch 57 - iter 265/2650 - loss 0.03907072 - time (sec): 19.10 - samples/sec: 7694.36 - lr: 0.050000 +2023-04-05 14:49:01,838 epoch 57 - iter 530/2650 - loss 0.03779608 - time (sec): 37.74 - samples/sec: 7756.67 - lr: 0.050000 +2023-04-05 14:49:20,730 epoch 57 - iter 795/2650 - loss 0.03769503 - time (sec): 56.63 - samples/sec: 7742.26 - lr: 0.050000 +2023-04-05 14:49:39,359 epoch 57 - iter 1060/2650 - loss 0.03746349 - time (sec): 75.26 - samples/sec: 7764.88 - lr: 0.050000 +2023-04-05 14:49:58,372 epoch 57 - iter 1325/2650 - loss 0.03742412 - time (sec): 94.27 - samples/sec: 7756.47 - lr: 0.050000 +2023-04-05 14:50:16,763 epoch 57 - iter 1590/2650 - loss 0.03735298 - time (sec): 112.66 - samples/sec: 7770.76 - lr: 0.050000 +2023-04-05 14:50:35,864 epoch 57 - iter 1855/2650 - loss 0.03732667 - time (sec): 131.76 - samples/sec: 7768.05 - lr: 0.050000 +2023-04-05 14:50:54,584 epoch 57 - iter 2120/2650 - loss 0.03733433 - time (sec): 150.48 - samples/sec: 7777.84 - lr: 0.050000 +2023-04-05 14:51:13,434 epoch 57 - iter 2385/2650 - loss 0.03742976 - time (sec): 169.33 - samples/sec: 7774.35 - lr: 0.050000 +2023-04-05 14:51:32,226 epoch 57 - iter 2650/2650 - loss 0.03726013 - time (sec): 188.12 - samples/sec: 7773.40 - lr: 0.050000 +2023-04-05 14:51:32,226 ---------------------------------------------------------------------------------------------------- +2023-04-05 14:51:32,226 EPOCH 57 done: loss 0.0373 - lr 0.050000 +2023-04-05 14:51:32,226 BAD EPOCHS (no improvement): 0 +2023-04-05 14:51:32,229 ---------------------------------------------------------------------------------------------------- +2023-04-05 14:51:51,201 epoch 58 - iter 265/2650 - loss 0.03620344 - time (sec): 18.97 - samples/sec: 7703.67 - lr: 0.050000 +2023-04-05 14:52:10,175 epoch 58 - iter 530/2650 - loss 0.03597562 - time (sec): 37.95 - samples/sec: 7690.36 - lr: 0.050000 +2023-04-05 14:52:28,592 epoch 58 - iter 795/2650 - loss 0.03633511 - time (sec): 56.36 - samples/sec: 7753.59 - lr: 0.050000 +2023-04-05 14:52:47,752 epoch 58 - iter 1060/2650 - loss 0.03635033 - time (sec): 75.52 - samples/sec: 7746.99 - lr: 0.050000 +2023-04-05 14:53:06,615 epoch 58 - iter 1325/2650 - loss 0.03666345 - time (sec): 94.39 - samples/sec: 7758.81 - lr: 0.050000 +2023-04-05 14:53:25,609 epoch 58 - iter 1590/2650 - loss 0.03633440 - time (sec): 113.38 - samples/sec: 7746.62 - lr: 0.050000 +2023-04-05 14:53:44,356 epoch 58 - iter 1855/2650 - loss 0.03603023 - time (sec): 132.13 - samples/sec: 7758.56 - lr: 0.050000 +2023-04-05 14:54:03,267 epoch 58 - iter 2120/2650 - loss 0.03602336 - time (sec): 151.04 - samples/sec: 7759.14 - lr: 0.050000 +2023-04-05 14:54:22,244 epoch 58 - iter 2385/2650 - loss 0.03619007 - time (sec): 170.01 - samples/sec: 7749.16 - lr: 0.050000 +2023-04-05 14:54:40,653 epoch 58 - iter 2650/2650 - loss 0.03619407 - time (sec): 188.42 - samples/sec: 7761.03 - lr: 0.050000 +2023-04-05 14:54:40,653 ---------------------------------------------------------------------------------------------------- +2023-04-05 14:54:40,654 EPOCH 58 done: loss 0.0362 - lr 0.050000 +2023-04-05 14:54:40,654 BAD EPOCHS (no improvement): 0 +2023-04-05 14:54:40,657 ---------------------------------------------------------------------------------------------------- +2023-04-05 14:54:58,786 epoch 59 - iter 265/2650 - loss 0.03423522 - time (sec): 18.13 - samples/sec: 8028.99 - lr: 0.050000 +2023-04-05 14:55:18,138 epoch 59 - iter 530/2650 - loss 0.03525574 - time (sec): 37.48 - samples/sec: 7750.49 - lr: 0.050000 +2023-04-05 14:55:47,191 epoch 59 - iter 795/2650 - loss 0.03520167 - time (sec): 66.53 - samples/sec: 6560.71 - lr: 0.050000 +2023-04-05 14:56:06,258 epoch 59 - iter 1060/2650 - loss 0.03537619 - time (sec): 85.60 - samples/sec: 6814.03 - lr: 0.050000 +2023-04-05 14:56:25,073 epoch 59 - iter 1325/2650 - loss 0.03507860 - time (sec): 104.42 - samples/sec: 6989.40 - lr: 0.050000 +2023-04-05 14:56:44,237 epoch 59 - iter 1590/2650 - loss 0.03525300 - time (sec): 123.58 - samples/sec: 7093.52 - lr: 0.050000 +2023-04-05 14:57:02,899 epoch 59 - iter 1855/2650 - loss 0.03544920 - time (sec): 142.24 - samples/sec: 7202.62 - lr: 0.050000 +2023-04-05 14:57:22,195 epoch 59 - iter 2120/2650 - loss 0.03540620 - time (sec): 161.54 - samples/sec: 7243.33 - lr: 0.050000 +2023-04-05 14:57:40,927 epoch 59 - iter 2385/2650 - loss 0.03553751 - time (sec): 180.27 - samples/sec: 7300.38 - lr: 0.050000 +2023-04-05 14:57:59,711 epoch 59 - iter 2650/2650 - loss 0.03535828 - time (sec): 199.05 - samples/sec: 7346.55 - lr: 0.050000 +2023-04-05 14:57:59,712 ---------------------------------------------------------------------------------------------------- +2023-04-05 14:57:59,712 EPOCH 59 done: loss 0.0354 - lr 0.050000 +2023-04-05 14:57:59,712 BAD EPOCHS (no improvement): 0 +2023-04-05 14:57:59,753 ---------------------------------------------------------------------------------------------------- +2023-04-05 14:58:18,486 epoch 60 - iter 265/2650 - loss 0.03567379 - time (sec): 18.73 - samples/sec: 7782.76 - lr: 0.050000 +2023-04-05 14:58:37,545 epoch 60 - iter 530/2650 - loss 0.03492927 - time (sec): 37.79 - samples/sec: 7764.48 - lr: 0.050000 +2023-04-05 14:58:56,285 epoch 60 - iter 795/2650 - loss 0.03532277 - time (sec): 56.53 - samples/sec: 7773.21 - lr: 0.050000 +2023-04-05 14:59:15,852 epoch 60 - iter 1060/2650 - loss 0.03495618 - time (sec): 76.10 - samples/sec: 7689.99 - lr: 0.050000 +2023-04-05 14:59:35,464 epoch 60 - iter 1325/2650 - loss 0.03458261 - time (sec): 95.71 - samples/sec: 7630.56 - lr: 0.050000 +2023-04-05 14:59:54,269 epoch 60 - iter 1590/2650 - loss 0.03468048 - time (sec): 114.52 - samples/sec: 7655.05 - lr: 0.050000 +2023-04-05 15:00:13,191 epoch 60 - iter 1855/2650 - loss 0.03463277 - time (sec): 133.44 - samples/sec: 7670.41 - lr: 0.050000 +2023-04-05 15:00:31,920 epoch 60 - iter 2120/2650 - loss 0.03467261 - time (sec): 152.17 - samples/sec: 7686.65 - lr: 0.050000 +2023-04-05 15:00:50,579 epoch 60 - iter 2385/2650 - loss 0.03481973 - time (sec): 170.83 - samples/sec: 7694.72 - lr: 0.050000 +2023-04-05 15:01:10,481 epoch 60 - iter 2650/2650 - loss 0.03499557 - time (sec): 190.73 - samples/sec: 7667.25 - lr: 0.050000 +2023-04-05 15:01:10,482 ---------------------------------------------------------------------------------------------------- +2023-04-05 15:01:10,482 EPOCH 60 done: loss 0.0350 - lr 0.050000 +2023-04-05 15:01:10,482 BAD EPOCHS (no improvement): 0 +2023-04-05 15:01:10,485 ---------------------------------------------------------------------------------------------------- +2023-04-05 15:01:29,204 epoch 61 - iter 265/2650 - loss 0.03459561 - time (sec): 18.72 - samples/sec: 7868.99 - lr: 0.050000 +2023-04-05 15:01:48,169 epoch 61 - iter 530/2650 - loss 0.03437296 - time (sec): 37.68 - samples/sec: 7804.57 - lr: 0.050000 +2023-04-05 15:02:06,951 epoch 61 - iter 795/2650 - loss 0.03437846 - time (sec): 56.47 - samples/sec: 7767.89 - lr: 0.050000 +2023-04-05 15:02:25,630 epoch 61 - iter 1060/2650 - loss 0.03475811 - time (sec): 75.15 - samples/sec: 7755.07 - lr: 0.050000 +2023-04-05 15:02:44,777 epoch 61 - iter 1325/2650 - loss 0.03463230 - time (sec): 94.29 - samples/sec: 7738.28 - lr: 0.050000 +2023-04-05 15:03:04,230 epoch 61 - iter 1590/2650 - loss 0.03474684 - time (sec): 113.75 - samples/sec: 7707.02 - lr: 0.050000 +2023-04-05 15:03:22,833 epoch 61 - iter 1855/2650 - loss 0.03475785 - time (sec): 132.35 - samples/sec: 7729.88 - lr: 0.050000 +2023-04-05 15:03:42,040 epoch 61 - iter 2120/2650 - loss 0.03463848 - time (sec): 151.55 - samples/sec: 7711.61 - lr: 0.050000 +2023-04-05 15:04:01,076 epoch 61 - iter 2385/2650 - loss 0.03463164 - time (sec): 170.59 - samples/sec: 7707.98 - lr: 0.050000 +2023-04-05 15:04:19,934 epoch 61 - iter 2650/2650 - loss 0.03482403 - time (sec): 189.45 - samples/sec: 7719.03 - lr: 0.050000 +2023-04-05 15:04:19,935 ---------------------------------------------------------------------------------------------------- +2023-04-05 15:04:19,935 EPOCH 61 done: loss 0.0348 - lr 0.050000 +2023-04-05 15:04:19,935 BAD EPOCHS (no improvement): 0 +2023-04-05 15:04:19,938 ---------------------------------------------------------------------------------------------------- +2023-04-05 15:04:38,884 epoch 62 - iter 265/2650 - loss 0.03219591 - time (sec): 18.95 - samples/sec: 7699.05 - lr: 0.050000 +2023-04-05 15:04:57,559 epoch 62 - iter 530/2650 - loss 0.03388253 - time (sec): 37.62 - samples/sec: 7720.99 - lr: 0.050000 +2023-04-05 15:05:16,666 epoch 62 - iter 795/2650 - loss 0.03378619 - time (sec): 56.73 - samples/sec: 7722.38 - lr: 0.050000 +2023-04-05 15:05:35,264 epoch 62 - iter 1060/2650 - loss 0.03413625 - time (sec): 75.33 - samples/sec: 7737.59 - lr: 0.050000 +2023-04-05 15:05:54,377 epoch 62 - iter 1325/2650 - loss 0.03416657 - time (sec): 94.44 - samples/sec: 7725.00 - lr: 0.050000 +2023-04-05 15:06:13,461 epoch 62 - iter 1590/2650 - loss 0.03370168 - time (sec): 113.52 - samples/sec: 7711.13 - lr: 0.050000 +2023-04-05 15:06:32,882 epoch 62 - iter 1855/2650 - loss 0.03363980 - time (sec): 132.94 - samples/sec: 7704.77 - lr: 0.050000 +2023-04-05 15:06:51,698 epoch 62 - iter 2120/2650 - loss 0.03362355 - time (sec): 151.76 - samples/sec: 7713.51 - lr: 0.050000 +2023-04-05 15:07:10,268 epoch 62 - iter 2385/2650 - loss 0.03390164 - time (sec): 170.33 - samples/sec: 7734.76 - lr: 0.050000 +2023-04-05 15:07:28,651 epoch 62 - iter 2650/2650 - loss 0.03388849 - time (sec): 188.71 - samples/sec: 7749.13 - lr: 0.050000 +2023-04-05 15:07:28,652 ---------------------------------------------------------------------------------------------------- +2023-04-05 15:07:28,652 EPOCH 62 done: loss 0.0339 - lr 0.050000 +2023-04-05 15:07:28,652 BAD EPOCHS (no improvement): 0 +2023-04-05 15:07:28,654 ---------------------------------------------------------------------------------------------------- +2023-04-05 15:07:47,139 epoch 63 - iter 265/2650 - loss 0.03266954 - time (sec): 18.48 - samples/sec: 7884.70 - lr: 0.050000 +2023-04-05 15:08:05,894 epoch 63 - iter 530/2650 - loss 0.03269010 - time (sec): 37.24 - samples/sec: 7867.54 - lr: 0.050000 +2023-04-05 15:08:25,257 epoch 63 - iter 795/2650 - loss 0.03305519 - time (sec): 56.60 - samples/sec: 7778.90 - lr: 0.050000 +2023-04-05 15:08:43,713 epoch 63 - iter 1060/2650 - loss 0.03313278 - time (sec): 75.06 - samples/sec: 7815.10 - lr: 0.050000 +2023-04-05 15:09:02,719 epoch 63 - iter 1325/2650 - loss 0.03295265 - time (sec): 94.06 - samples/sec: 7798.32 - lr: 0.050000 +2023-04-05 15:09:21,790 epoch 63 - iter 1590/2650 - loss 0.03308877 - time (sec): 113.14 - samples/sec: 7764.37 - lr: 0.050000 +2023-04-05 15:09:40,821 epoch 63 - iter 1855/2650 - loss 0.03345972 - time (sec): 132.17 - samples/sec: 7756.00 - lr: 0.050000 +2023-04-05 15:09:59,280 epoch 63 - iter 2120/2650 - loss 0.03346671 - time (sec): 150.63 - samples/sec: 7770.31 - lr: 0.050000 +2023-04-05 15:10:17,982 epoch 63 - iter 2385/2650 - loss 0.03378690 - time (sec): 169.33 - samples/sec: 7781.22 - lr: 0.050000 +2023-04-05 15:10:37,191 epoch 63 - iter 2650/2650 - loss 0.03390191 - time (sec): 188.54 - samples/sec: 7756.37 - lr: 0.050000 +2023-04-05 15:10:37,192 ---------------------------------------------------------------------------------------------------- +2023-04-05 15:10:37,192 EPOCH 63 done: loss 0.0339 - lr 0.050000 +2023-04-05 15:10:37,192 BAD EPOCHS (no improvement): 1 +2023-04-05 15:10:37,195 ---------------------------------------------------------------------------------------------------- +2023-04-05 15:10:56,324 epoch 64 - iter 265/2650 - loss 0.03362924 - time (sec): 19.13 - samples/sec: 7591.97 - lr: 0.050000 +2023-04-05 15:11:15,727 epoch 64 - iter 530/2650 - loss 0.03441093 - time (sec): 38.53 - samples/sec: 7589.10 - lr: 0.050000 +2023-04-05 15:11:35,865 epoch 64 - iter 795/2650 - loss 0.03391532 - time (sec): 58.67 - samples/sec: 7487.02 - lr: 0.050000 +2023-04-05 15:11:55,932 epoch 64 - iter 1060/2650 - loss 0.03397607 - time (sec): 78.74 - samples/sec: 7420.15 - lr: 0.050000 +2023-04-05 15:12:15,636 epoch 64 - iter 1325/2650 - loss 0.03374106 - time (sec): 98.44 - samples/sec: 7407.92 - lr: 0.050000 +2023-04-05 15:12:34,967 epoch 64 - iter 1590/2650 - loss 0.03347775 - time (sec): 117.77 - samples/sec: 7432.65 - lr: 0.050000 +2023-04-05 15:12:54,724 epoch 64 - iter 1855/2650 - loss 0.03361139 - time (sec): 137.53 - samples/sec: 7435.73 - lr: 0.050000 +2023-04-05 15:13:14,618 epoch 64 - iter 2120/2650 - loss 0.03360450 - time (sec): 157.42 - samples/sec: 7436.66 - lr: 0.050000 +2023-04-05 15:13:33,887 epoch 64 - iter 2385/2650 - loss 0.03364149 - time (sec): 176.69 - samples/sec: 7449.92 - lr: 0.050000 +2023-04-05 15:13:52,355 epoch 64 - iter 2650/2650 - loss 0.03344772 - time (sec): 195.16 - samples/sec: 7493.16 - lr: 0.050000 +2023-04-05 15:13:52,356 ---------------------------------------------------------------------------------------------------- +2023-04-05 15:13:52,356 EPOCH 64 done: loss 0.0334 - lr 0.050000 +2023-04-05 15:13:52,356 BAD EPOCHS (no improvement): 0 +2023-04-05 15:13:52,358 ---------------------------------------------------------------------------------------------------- +2023-04-05 15:14:10,790 epoch 65 - iter 265/2650 - loss 0.03288048 - time (sec): 18.43 - samples/sec: 7864.48 - lr: 0.050000 +2023-04-05 15:14:30,664 epoch 65 - iter 530/2650 - loss 0.03250524 - time (sec): 38.31 - samples/sec: 7638.13 - lr: 0.050000 +2023-04-05 15:14:49,936 epoch 65 - iter 795/2650 - loss 0.03313956 - time (sec): 57.58 - samples/sec: 7640.26 - lr: 0.050000 +2023-04-05 15:15:08,655 epoch 65 - iter 1060/2650 - loss 0.03331832 - time (sec): 76.30 - samples/sec: 7683.99 - lr: 0.050000 +2023-04-05 15:15:27,260 epoch 65 - iter 1325/2650 - loss 0.03337080 - time (sec): 94.90 - samples/sec: 7711.43 - lr: 0.050000 +2023-04-05 15:15:46,612 epoch 65 - iter 1590/2650 - loss 0.03336752 - time (sec): 114.25 - samples/sec: 7689.62 - lr: 0.050000 +2023-04-05 15:16:05,046 epoch 65 - iter 1855/2650 - loss 0.03324501 - time (sec): 132.69 - samples/sec: 7717.02 - lr: 0.050000 +2023-04-05 15:16:23,503 epoch 65 - iter 2120/2650 - loss 0.03323006 - time (sec): 151.14 - samples/sec: 7743.93 - lr: 0.050000 +2023-04-05 15:16:41,955 epoch 65 - iter 2385/2650 - loss 0.03325825 - time (sec): 169.60 - samples/sec: 7763.36 - lr: 0.050000 +2023-04-05 15:17:00,730 epoch 65 - iter 2650/2650 - loss 0.03327492 - time (sec): 188.37 - samples/sec: 7763.18 - lr: 0.050000 +2023-04-05 15:17:00,731 ---------------------------------------------------------------------------------------------------- +2023-04-05 15:17:00,731 EPOCH 65 done: loss 0.0333 - lr 0.050000 +2023-04-05 15:17:00,731 BAD EPOCHS (no improvement): 0 +2023-04-05 15:17:00,734 ---------------------------------------------------------------------------------------------------- +2023-04-05 15:17:19,608 epoch 66 - iter 265/2650 - loss 0.03453069 - time (sec): 18.87 - samples/sec: 7762.66 - lr: 0.050000 +2023-04-05 15:17:38,856 epoch 66 - iter 530/2650 - loss 0.03478302 - time (sec): 38.12 - samples/sec: 7735.47 - lr: 0.050000 +2023-04-05 15:17:57,617 epoch 66 - iter 795/2650 - loss 0.03363654 - time (sec): 56.88 - samples/sec: 7743.84 - lr: 0.050000 +2023-04-05 15:18:15,681 epoch 66 - iter 1060/2650 - loss 0.03360564 - time (sec): 74.95 - samples/sec: 7808.49 - lr: 0.050000 +2023-04-05 15:18:34,515 epoch 66 - iter 1325/2650 - loss 0.03340537 - time (sec): 93.78 - samples/sec: 7785.64 - lr: 0.050000 +2023-04-05 15:18:52,971 epoch 66 - iter 1590/2650 - loss 0.03337737 - time (sec): 112.24 - samples/sec: 7801.42 - lr: 0.050000 +2023-04-05 15:19:12,162 epoch 66 - iter 1855/2650 - loss 0.03317414 - time (sec): 131.43 - samples/sec: 7780.12 - lr: 0.050000 +2023-04-05 15:19:30,931 epoch 66 - iter 2120/2650 - loss 0.03315331 - time (sec): 150.20 - samples/sec: 7782.80 - lr: 0.050000 +2023-04-05 15:19:49,759 epoch 66 - iter 2385/2650 - loss 0.03335950 - time (sec): 169.03 - samples/sec: 7784.18 - lr: 0.050000 +2023-04-05 15:20:08,762 epoch 66 - iter 2650/2650 - loss 0.03326953 - time (sec): 188.03 - samples/sec: 7777.35 - lr: 0.050000 +2023-04-05 15:20:08,763 ---------------------------------------------------------------------------------------------------- +2023-04-05 15:20:08,763 EPOCH 66 done: loss 0.0333 - lr 0.050000 +2023-04-05 15:20:08,763 BAD EPOCHS (no improvement): 0 +2023-04-05 15:20:08,766 ---------------------------------------------------------------------------------------------------- +2023-04-05 15:20:27,413 epoch 67 - iter 265/2650 - loss 0.03321950 - time (sec): 18.65 - samples/sec: 7825.69 - lr: 0.050000 +2023-04-05 15:20:45,717 epoch 67 - iter 530/2650 - loss 0.03272982 - time (sec): 36.95 - samples/sec: 7834.68 - lr: 0.050000 +2023-04-05 15:21:05,004 epoch 67 - iter 795/2650 - loss 0.03271262 - time (sec): 56.24 - samples/sec: 7773.98 - lr: 0.050000 +2023-04-05 15:21:24,015 epoch 67 - iter 1060/2650 - loss 0.03282520 - time (sec): 75.25 - samples/sec: 7773.65 - lr: 0.050000 +2023-04-05 15:21:43,055 epoch 67 - iter 1325/2650 - loss 0.03274082 - time (sec): 94.29 - samples/sec: 7756.71 - lr: 0.050000 +2023-04-05 15:22:01,632 epoch 67 - iter 1590/2650 - loss 0.03274120 - time (sec): 112.87 - samples/sec: 7766.18 - lr: 0.050000 +2023-04-05 15:22:20,142 epoch 67 - iter 1855/2650 - loss 0.03303001 - time (sec): 131.38 - samples/sec: 7776.79 - lr: 0.050000 +2023-04-05 15:22:39,613 epoch 67 - iter 2120/2650 - loss 0.03319422 - time (sec): 150.85 - samples/sec: 7749.58 - lr: 0.050000 +2023-04-05 15:22:58,788 epoch 67 - iter 2385/2650 - loss 0.03322667 - time (sec): 170.02 - samples/sec: 7740.24 - lr: 0.050000 +2023-04-05 15:23:17,919 epoch 67 - iter 2650/2650 - loss 0.03317443 - time (sec): 189.15 - samples/sec: 7731.10 - lr: 0.050000 +2023-04-05 15:23:17,919 ---------------------------------------------------------------------------------------------------- +2023-04-05 15:23:17,919 EPOCH 67 done: loss 0.0332 - lr 0.050000 +2023-04-05 15:23:17,919 BAD EPOCHS (no improvement): 0 +2023-04-05 15:23:17,923 ---------------------------------------------------------------------------------------------------- +2023-04-05 15:23:36,837 epoch 68 - iter 265/2650 - loss 0.03117733 - time (sec): 18.91 - samples/sec: 7673.06 - lr: 0.050000 +2023-04-05 15:23:55,963 epoch 68 - iter 530/2650 - loss 0.03198562 - time (sec): 38.04 - samples/sec: 7686.78 - lr: 0.050000 +2023-04-05 15:24:16,429 epoch 68 - iter 795/2650 - loss 0.03239173 - time (sec): 58.51 - samples/sec: 7504.45 - lr: 0.050000 +2023-04-05 15:24:35,409 epoch 68 - iter 1060/2650 - loss 0.03246876 - time (sec): 77.49 - samples/sec: 7553.31 - lr: 0.050000 +2023-04-05 15:24:53,993 epoch 68 - iter 1325/2650 - loss 0.03252904 - time (sec): 96.07 - samples/sec: 7603.49 - lr: 0.050000 +2023-04-05 15:25:12,963 epoch 68 - iter 1590/2650 - loss 0.03256733 - time (sec): 115.04 - samples/sec: 7620.88 - lr: 0.050000 +2023-04-05 15:25:32,189 epoch 68 - iter 1855/2650 - loss 0.03258630 - time (sec): 134.27 - samples/sec: 7633.07 - lr: 0.050000 +2023-04-05 15:25:50,712 epoch 68 - iter 2120/2650 - loss 0.03258580 - time (sec): 152.79 - samples/sec: 7669.26 - lr: 0.050000 +2023-04-05 15:26:09,750 epoch 68 - iter 2385/2650 - loss 0.03279360 - time (sec): 171.83 - samples/sec: 7666.96 - lr: 0.050000 +2023-04-05 15:26:28,753 epoch 68 - iter 2650/2650 - loss 0.03274483 - time (sec): 190.83 - samples/sec: 7663.17 - lr: 0.050000 +2023-04-05 15:26:28,753 ---------------------------------------------------------------------------------------------------- +2023-04-05 15:26:28,753 EPOCH 68 done: loss 0.0327 - lr 0.050000 +2023-04-05 15:26:28,753 BAD EPOCHS (no improvement): 0 +2023-04-05 15:26:28,756 ---------------------------------------------------------------------------------------------------- +2023-04-05 15:26:47,367 epoch 69 - iter 265/2650 - loss 0.03300039 - time (sec): 18.61 - samples/sec: 7835.16 - lr: 0.050000 +2023-04-05 15:27:06,726 epoch 69 - iter 530/2650 - loss 0.03385157 - time (sec): 37.97 - samples/sec: 7728.45 - lr: 0.050000 +2023-04-05 15:27:25,414 epoch 69 - iter 795/2650 - loss 0.03315806 - time (sec): 56.66 - samples/sec: 7768.01 - lr: 0.050000 +2023-04-05 15:27:44,854 epoch 69 - iter 1060/2650 - loss 0.03327379 - time (sec): 76.10 - samples/sec: 7724.62 - lr: 0.050000 +2023-04-05 15:28:03,568 epoch 69 - iter 1325/2650 - loss 0.03298657 - time (sec): 94.81 - samples/sec: 7731.09 - lr: 0.050000 +2023-04-05 15:28:22,924 epoch 69 - iter 1590/2650 - loss 0.03292389 - time (sec): 114.17 - samples/sec: 7697.92 - lr: 0.050000 +2023-04-05 15:28:41,778 epoch 69 - iter 1855/2650 - loss 0.03291942 - time (sec): 133.02 - samples/sec: 7706.39 - lr: 0.050000 +2023-04-05 15:29:00,486 epoch 69 - iter 2120/2650 - loss 0.03295967 - time (sec): 151.73 - samples/sec: 7720.73 - lr: 0.050000 +2023-04-05 15:29:19,336 epoch 69 - iter 2385/2650 - loss 0.03261018 - time (sec): 170.58 - samples/sec: 7720.40 - lr: 0.050000 +2023-04-05 15:29:38,289 epoch 69 - iter 2650/2650 - loss 0.03253121 - time (sec): 189.53 - samples/sec: 7715.63 - lr: 0.050000 +2023-04-05 15:29:38,289 ---------------------------------------------------------------------------------------------------- +2023-04-05 15:29:38,289 EPOCH 69 done: loss 0.0325 - lr 0.050000 +2023-04-05 15:29:38,289 BAD EPOCHS (no improvement): 0 +2023-04-05 15:29:38,292 ---------------------------------------------------------------------------------------------------- +2023-04-05 15:29:56,789 epoch 70 - iter 265/2650 - loss 0.03203543 - time (sec): 18.50 - samples/sec: 7897.25 - lr: 0.050000 +2023-04-05 15:30:15,698 epoch 70 - iter 530/2650 - loss 0.03172506 - time (sec): 37.41 - samples/sec: 7785.60 - lr: 0.050000 +2023-04-05 15:30:35,420 epoch 70 - iter 795/2650 - loss 0.03140745 - time (sec): 57.13 - samples/sec: 7653.76 - lr: 0.050000 +2023-04-05 15:30:55,007 epoch 70 - iter 1060/2650 - loss 0.03198195 - time (sec): 76.72 - samples/sec: 7598.20 - lr: 0.050000 +2023-04-05 15:31:13,804 epoch 70 - iter 1325/2650 - loss 0.03222199 - time (sec): 95.51 - samples/sec: 7637.14 - lr: 0.050000 +2023-04-05 15:31:32,554 epoch 70 - iter 1590/2650 - loss 0.03236273 - time (sec): 114.26 - samples/sec: 7668.29 - lr: 0.050000 +2023-04-05 15:31:51,653 epoch 70 - iter 1855/2650 - loss 0.03233581 - time (sec): 133.36 - samples/sec: 7661.01 - lr: 0.050000 +2023-04-05 15:32:10,638 epoch 70 - iter 2120/2650 - loss 0.03245261 - time (sec): 152.35 - samples/sec: 7672.04 - lr: 0.050000 +2023-04-05 15:32:29,587 epoch 70 - iter 2385/2650 - loss 0.03258235 - time (sec): 171.29 - samples/sec: 7682.46 - lr: 0.050000 +2023-04-05 15:32:47,812 epoch 70 - iter 2650/2650 - loss 0.03260023 - time (sec): 189.52 - samples/sec: 7716.14 - lr: 0.050000 +2023-04-05 15:32:47,812 ---------------------------------------------------------------------------------------------------- +2023-04-05 15:32:47,812 EPOCH 70 done: loss 0.0326 - lr 0.050000 +2023-04-05 15:32:47,812 BAD EPOCHS (no improvement): 1 +2023-04-05 15:32:47,815 ---------------------------------------------------------------------------------------------------- +2023-04-05 15:33:06,623 epoch 71 - iter 265/2650 - loss 0.03243372 - time (sec): 18.81 - samples/sec: 7707.29 - lr: 0.050000 +2023-04-05 15:33:25,164 epoch 71 - iter 530/2650 - loss 0.03200419 - time (sec): 37.35 - samples/sec: 7772.22 - lr: 0.050000 +2023-04-05 15:33:43,891 epoch 71 - iter 795/2650 - loss 0.03257660 - time (sec): 56.08 - samples/sec: 7803.16 - lr: 0.050000 +2023-04-05 15:34:02,399 epoch 71 - iter 1060/2650 - loss 0.03263374 - time (sec): 74.58 - samples/sec: 7824.22 - lr: 0.050000 +2023-04-05 15:34:21,332 epoch 71 - iter 1325/2650 - loss 0.03284093 - time (sec): 93.52 - samples/sec: 7803.10 - lr: 0.050000 +2023-04-05 15:34:40,323 epoch 71 - iter 1590/2650 - loss 0.03259694 - time (sec): 112.51 - samples/sec: 7798.91 - lr: 0.050000 +2023-04-05 15:34:58,782 epoch 71 - iter 1855/2650 - loss 0.03267710 - time (sec): 130.97 - samples/sec: 7813.11 - lr: 0.050000 +2023-04-05 15:35:17,689 epoch 71 - iter 2120/2650 - loss 0.03272215 - time (sec): 149.87 - samples/sec: 7801.96 - lr: 0.050000 +2023-04-05 15:35:36,704 epoch 71 - iter 2385/2650 - loss 0.03271667 - time (sec): 168.89 - samples/sec: 7792.86 - lr: 0.050000 +2023-04-05 15:35:56,182 epoch 71 - iter 2650/2650 - loss 0.03282474 - time (sec): 188.37 - samples/sec: 7763.40 - lr: 0.050000 +2023-04-05 15:35:56,182 ---------------------------------------------------------------------------------------------------- +2023-04-05 15:35:56,182 EPOCH 71 done: loss 0.0328 - lr 0.050000 +2023-04-05 15:35:56,182 BAD EPOCHS (no improvement): 2 +2023-04-05 15:35:56,185 ---------------------------------------------------------------------------------------------------- +2023-04-05 15:36:15,097 epoch 72 - iter 265/2650 - loss 0.03151443 - time (sec): 18.91 - samples/sec: 7654.73 - lr: 0.050000 +2023-04-05 15:36:34,341 epoch 72 - iter 530/2650 - loss 0.03280041 - time (sec): 38.16 - samples/sec: 7646.55 - lr: 0.050000 +2023-04-05 15:36:53,431 epoch 72 - iter 795/2650 - loss 0.03244706 - time (sec): 57.25 - samples/sec: 7693.06 - lr: 0.050000 +2023-04-05 15:37:11,898 epoch 72 - iter 1060/2650 - loss 0.03218374 - time (sec): 75.71 - samples/sec: 7716.62 - lr: 0.050000 +2023-04-05 15:37:30,345 epoch 72 - iter 1325/2650 - loss 0.03218432 - time (sec): 94.16 - samples/sec: 7755.00 - lr: 0.050000 +2023-04-05 15:37:48,354 epoch 72 - iter 1590/2650 - loss 0.03227949 - time (sec): 112.17 - samples/sec: 7798.71 - lr: 0.050000 +2023-04-05 15:38:07,512 epoch 72 - iter 1855/2650 - loss 0.03241668 - time (sec): 131.33 - samples/sec: 7785.25 - lr: 0.050000 +2023-04-05 15:38:26,525 epoch 72 - iter 2120/2650 - loss 0.03241169 - time (sec): 150.34 - samples/sec: 7772.49 - lr: 0.050000 +2023-04-05 15:38:45,661 epoch 72 - iter 2385/2650 - loss 0.03224397 - time (sec): 169.48 - samples/sec: 7763.80 - lr: 0.050000 +2023-04-05 15:39:04,439 epoch 72 - iter 2650/2650 - loss 0.03223035 - time (sec): 188.25 - samples/sec: 7768.04 - lr: 0.050000 +2023-04-05 15:39:04,440 ---------------------------------------------------------------------------------------------------- +2023-04-05 15:39:04,440 EPOCH 72 done: loss 0.0322 - lr 0.050000 +2023-04-05 15:39:04,440 BAD EPOCHS (no improvement): 0 +2023-04-05 15:39:04,443 ---------------------------------------------------------------------------------------------------- +2023-04-05 15:39:23,446 epoch 73 - iter 265/2650 - loss 0.03025159 - time (sec): 19.00 - samples/sec: 7655.93 - lr: 0.050000 +2023-04-05 15:39:41,831 epoch 73 - iter 530/2650 - loss 0.03154995 - time (sec): 37.39 - samples/sec: 7822.92 - lr: 0.050000 +2023-04-05 15:40:01,268 epoch 73 - iter 795/2650 - loss 0.03153581 - time (sec): 56.82 - samples/sec: 7749.24 - lr: 0.050000 +2023-04-05 15:40:20,654 epoch 73 - iter 1060/2650 - loss 0.03158741 - time (sec): 76.21 - samples/sec: 7700.37 - lr: 0.050000 +2023-04-05 15:40:40,088 epoch 73 - iter 1325/2650 - loss 0.03174891 - time (sec): 95.64 - samples/sec: 7676.64 - lr: 0.050000 +2023-04-05 15:40:58,902 epoch 73 - iter 1590/2650 - loss 0.03194426 - time (sec): 114.46 - samples/sec: 7685.86 - lr: 0.050000 +2023-04-05 15:41:17,836 epoch 73 - iter 1855/2650 - loss 0.03183025 - time (sec): 133.39 - samples/sec: 7682.11 - lr: 0.050000 +2023-04-05 15:41:36,813 epoch 73 - iter 2120/2650 - loss 0.03173949 - time (sec): 152.37 - samples/sec: 7675.42 - lr: 0.050000 +2023-04-05 15:41:56,314 epoch 73 - iter 2385/2650 - loss 0.03183578 - time (sec): 171.87 - samples/sec: 7654.72 - lr: 0.050000 +2023-04-05 15:42:15,521 epoch 73 - iter 2650/2650 - loss 0.03208117 - time (sec): 191.08 - samples/sec: 7653.23 - lr: 0.050000 +2023-04-05 15:42:15,521 ---------------------------------------------------------------------------------------------------- +2023-04-05 15:42:15,521 EPOCH 73 done: loss 0.0321 - lr 0.050000 +2023-04-05 15:42:15,521 BAD EPOCHS (no improvement): 0 +2023-04-05 15:42:15,525 ---------------------------------------------------------------------------------------------------- +2023-04-05 15:42:34,403 epoch 74 - iter 265/2650 - loss 0.03131834 - time (sec): 18.88 - samples/sec: 7794.49 - lr: 0.050000 +2023-04-05 15:42:53,190 epoch 74 - iter 530/2650 - loss 0.03209112 - time (sec): 37.67 - samples/sec: 7824.70 - lr: 0.050000 +2023-04-05 15:43:11,694 epoch 74 - iter 795/2650 - loss 0.03136822 - time (sec): 56.17 - samples/sec: 7844.32 - lr: 0.050000 +2023-04-05 15:43:30,360 epoch 74 - iter 1060/2650 - loss 0.03169248 - time (sec): 74.83 - samples/sec: 7839.33 - lr: 0.050000 +2023-04-05 15:43:49,146 epoch 74 - iter 1325/2650 - loss 0.03192538 - time (sec): 93.62 - samples/sec: 7830.22 - lr: 0.050000 +2023-04-05 15:44:07,183 epoch 74 - iter 1590/2650 - loss 0.03185558 - time (sec): 111.66 - samples/sec: 7874.33 - lr: 0.050000 +2023-04-05 15:44:25,814 epoch 74 - iter 1855/2650 - loss 0.03180182 - time (sec): 130.29 - samples/sec: 7871.49 - lr: 0.050000 +2023-04-05 15:44:44,392 epoch 74 - iter 2120/2650 - loss 0.03193431 - time (sec): 148.87 - samples/sec: 7873.45 - lr: 0.050000 +2023-04-05 15:45:13,830 epoch 74 - iter 2385/2650 - loss 0.03199040 - time (sec): 178.30 - samples/sec: 7389.15 - lr: 0.050000 +2023-04-05 15:45:32,314 epoch 74 - iter 2650/2650 - loss 0.03202721 - time (sec): 196.79 - samples/sec: 7431.12 - lr: 0.050000 +2023-04-05 15:45:32,315 ---------------------------------------------------------------------------------------------------- +2023-04-05 15:45:32,315 EPOCH 74 done: loss 0.0320 - lr 0.050000 +2023-04-05 15:45:32,315 BAD EPOCHS (no improvement): 0 +2023-04-05 15:45:32,317 ---------------------------------------------------------------------------------------------------- +2023-04-05 15:45:50,450 epoch 75 - iter 265/2650 - loss 0.03141618 - time (sec): 18.13 - samples/sec: 8034.93 - lr: 0.050000 +2023-04-05 15:46:08,623 epoch 75 - iter 530/2650 - loss 0.03197292 - time (sec): 36.31 - samples/sec: 7988.43 - lr: 0.050000 +2023-04-05 15:46:26,808 epoch 75 - iter 795/2650 - loss 0.03134681 - time (sec): 54.49 - samples/sec: 7995.31 - lr: 0.050000 +2023-04-05 15:46:44,933 epoch 75 - iter 1060/2650 - loss 0.03192776 - time (sec): 72.62 - samples/sec: 8002.01 - lr: 0.050000 +2023-04-05 15:47:03,176 epoch 75 - iter 1325/2650 - loss 0.03152328 - time (sec): 90.86 - samples/sec: 8009.14 - lr: 0.050000 +2023-04-05 15:47:21,555 epoch 75 - iter 1590/2650 - loss 0.03146836 - time (sec): 109.24 - samples/sec: 8012.41 - lr: 0.050000 +2023-04-05 15:47:40,149 epoch 75 - iter 1855/2650 - loss 0.03180467 - time (sec): 127.83 - samples/sec: 7987.72 - lr: 0.050000 +2023-04-05 15:47:58,238 epoch 75 - iter 2120/2650 - loss 0.03174516 - time (sec): 145.92 - samples/sec: 8006.60 - lr: 0.050000 +2023-04-05 15:48:16,628 epoch 75 - iter 2385/2650 - loss 0.03176793 - time (sec): 164.31 - samples/sec: 8005.61 - lr: 0.050000 +2023-04-05 15:48:35,161 epoch 75 - iter 2650/2650 - loss 0.03181570 - time (sec): 182.84 - samples/sec: 7997.90 - lr: 0.050000 +2023-04-05 15:48:35,161 ---------------------------------------------------------------------------------------------------- +2023-04-05 15:48:35,161 EPOCH 75 done: loss 0.0318 - lr 0.050000 +2023-04-05 15:48:35,161 BAD EPOCHS (no improvement): 0 +2023-04-05 15:48:35,164 ---------------------------------------------------------------------------------------------------- +2023-04-05 15:48:53,513 epoch 76 - iter 265/2650 - loss 0.03017883 - time (sec): 18.35 - samples/sec: 7961.79 - lr: 0.050000 +2023-04-05 15:49:11,821 epoch 76 - iter 530/2650 - loss 0.03026187 - time (sec): 36.66 - samples/sec: 7981.36 - lr: 0.050000 +2023-04-05 15:49:29,609 epoch 76 - iter 795/2650 - loss 0.03093123 - time (sec): 54.45 - samples/sec: 8042.26 - lr: 0.050000 +2023-04-05 15:49:47,618 epoch 76 - iter 1060/2650 - loss 0.03127987 - time (sec): 72.45 - samples/sec: 8020.51 - lr: 0.050000 +2023-04-05 15:50:05,789 epoch 76 - iter 1325/2650 - loss 0.03173655 - time (sec): 90.63 - samples/sec: 8032.44 - lr: 0.050000 +2023-04-05 15:50:24,029 epoch 76 - iter 1590/2650 - loss 0.03166301 - time (sec): 108.87 - samples/sec: 8039.17 - lr: 0.050000 +2023-04-05 15:50:42,505 epoch 76 - iter 1855/2650 - loss 0.03166008 - time (sec): 127.34 - samples/sec: 8030.32 - lr: 0.050000 +2023-04-05 15:50:59,933 epoch 76 - iter 2120/2650 - loss 0.03158149 - time (sec): 144.77 - samples/sec: 8065.07 - lr: 0.050000 +2023-04-05 15:51:18,046 epoch 76 - iter 2385/2650 - loss 0.03162405 - time (sec): 162.88 - samples/sec: 8070.88 - lr: 0.050000 +2023-04-05 15:51:36,782 epoch 76 - iter 2650/2650 - loss 0.03160297 - time (sec): 181.62 - samples/sec: 8051.84 - lr: 0.050000 +2023-04-05 15:51:36,783 ---------------------------------------------------------------------------------------------------- +2023-04-05 15:51:36,783 EPOCH 76 done: loss 0.0316 - lr 0.050000 +2023-04-05 15:51:36,783 BAD EPOCHS (no improvement): 0 +2023-04-05 15:51:36,785 ---------------------------------------------------------------------------------------------------- +2023-04-05 15:51:55,713 epoch 77 - iter 265/2650 - loss 0.03218330 - time (sec): 18.93 - samples/sec: 7899.36 - lr: 0.050000 +2023-04-05 15:52:13,994 epoch 77 - iter 530/2650 - loss 0.03187748 - time (sec): 37.21 - samples/sec: 7923.32 - lr: 0.050000 +2023-04-05 15:52:32,065 epoch 77 - iter 795/2650 - loss 0.03177840 - time (sec): 55.28 - samples/sec: 7992.74 - lr: 0.050000 +2023-04-05 15:52:49,961 epoch 77 - iter 1060/2650 - loss 0.03167606 - time (sec): 73.18 - samples/sec: 8044.32 - lr: 0.050000 +2023-04-05 15:53:08,316 epoch 77 - iter 1325/2650 - loss 0.03169360 - time (sec): 91.53 - samples/sec: 8020.24 - lr: 0.050000 +2023-04-05 15:53:26,361 epoch 77 - iter 1590/2650 - loss 0.03185192 - time (sec): 109.58 - samples/sec: 8037.85 - lr: 0.050000 +2023-04-05 15:53:44,204 epoch 77 - iter 1855/2650 - loss 0.03203371 - time (sec): 127.42 - samples/sec: 8052.18 - lr: 0.050000 +2023-04-05 15:54:02,347 epoch 77 - iter 2120/2650 - loss 0.03198228 - time (sec): 145.56 - samples/sec: 8056.20 - lr: 0.050000 +2023-04-05 15:54:20,345 epoch 77 - iter 2385/2650 - loss 0.03184141 - time (sec): 163.56 - samples/sec: 8054.11 - lr: 0.050000 +2023-04-05 15:54:38,174 epoch 77 - iter 2650/2650 - loss 0.03186972 - time (sec): 181.39 - samples/sec: 8062.04 - lr: 0.050000 +2023-04-05 15:54:38,174 ---------------------------------------------------------------------------------------------------- +2023-04-05 15:54:38,175 EPOCH 77 done: loss 0.0319 - lr 0.050000 +2023-04-05 15:54:38,175 BAD EPOCHS (no improvement): 1 +2023-04-05 15:54:38,178 ---------------------------------------------------------------------------------------------------- +2023-04-05 15:54:56,625 epoch 78 - iter 265/2650 - loss 0.03017653 - time (sec): 18.45 - samples/sec: 7944.50 - lr: 0.050000 +2023-04-05 15:55:14,646 epoch 78 - iter 530/2650 - loss 0.03077051 - time (sec): 36.47 - samples/sec: 8034.11 - lr: 0.050000 +2023-04-05 15:55:32,678 epoch 78 - iter 795/2650 - loss 0.03042051 - time (sec): 54.50 - samples/sec: 8057.21 - lr: 0.050000 +2023-04-05 15:55:50,782 epoch 78 - iter 1060/2650 - loss 0.03067265 - time (sec): 72.60 - samples/sec: 8075.66 - lr: 0.050000 +2023-04-05 15:56:08,754 epoch 78 - iter 1325/2650 - loss 0.03149557 - time (sec): 90.58 - samples/sec: 8086.87 - lr: 0.050000 +2023-04-05 15:56:26,718 epoch 78 - iter 1590/2650 - loss 0.03129815 - time (sec): 108.54 - samples/sec: 8092.28 - lr: 0.050000 +2023-04-05 15:56:44,574 epoch 78 - iter 1855/2650 - loss 0.03118039 - time (sec): 126.40 - samples/sec: 8100.97 - lr: 0.050000 +2023-04-05 15:57:02,497 epoch 78 - iter 2120/2650 - loss 0.03119876 - time (sec): 144.32 - samples/sec: 8101.22 - lr: 0.050000 +2023-04-05 15:57:20,456 epoch 78 - iter 2385/2650 - loss 0.03103000 - time (sec): 162.28 - samples/sec: 8101.61 - lr: 0.050000 +2023-04-05 15:57:38,822 epoch 78 - iter 2650/2650 - loss 0.03110662 - time (sec): 180.64 - samples/sec: 8095.29 - lr: 0.050000 +2023-04-05 15:57:38,822 ---------------------------------------------------------------------------------------------------- +2023-04-05 15:57:38,822 EPOCH 78 done: loss 0.0311 - lr 0.050000 +2023-04-05 15:57:38,822 BAD EPOCHS (no improvement): 0 +2023-04-05 15:57:38,825 ---------------------------------------------------------------------------------------------------- +2023-04-05 15:57:56,636 epoch 79 - iter 265/2650 - loss 0.03136639 - time (sec): 17.81 - samples/sec: 8218.91 - lr: 0.050000 +2023-04-05 15:58:14,368 epoch 79 - iter 530/2650 - loss 0.03082705 - time (sec): 35.54 - samples/sec: 8252.69 - lr: 0.050000 +2023-04-05 15:58:32,335 epoch 79 - iter 795/2650 - loss 0.03060434 - time (sec): 53.51 - samples/sec: 8194.27 - lr: 0.050000 +2023-04-05 15:58:51,200 epoch 79 - iter 1060/2650 - loss 0.03045012 - time (sec): 72.37 - samples/sec: 8114.44 - lr: 0.050000 +2023-04-05 15:59:09,293 epoch 79 - iter 1325/2650 - loss 0.03046960 - time (sec): 90.47 - samples/sec: 8104.49 - lr: 0.050000 +2023-04-05 15:59:27,350 epoch 79 - iter 1590/2650 - loss 0.03121398 - time (sec): 108.53 - samples/sec: 8113.71 - lr: 0.050000 +2023-04-05 15:59:45,223 epoch 79 - iter 1855/2650 - loss 0.03123924 - time (sec): 126.40 - samples/sec: 8101.71 - lr: 0.050000 +2023-04-05 16:00:03,761 epoch 79 - iter 2120/2650 - loss 0.03126028 - time (sec): 144.94 - samples/sec: 8071.14 - lr: 0.050000 +2023-04-05 16:00:21,904 epoch 79 - iter 2385/2650 - loss 0.03147229 - time (sec): 163.08 - samples/sec: 8073.15 - lr: 0.050000 +2023-04-05 16:00:39,566 epoch 79 - iter 2650/2650 - loss 0.03147414 - time (sec): 180.74 - samples/sec: 8090.91 - lr: 0.050000 +2023-04-05 16:00:39,567 ---------------------------------------------------------------------------------------------------- +2023-04-05 16:00:39,567 EPOCH 79 done: loss 0.0315 - lr 0.050000 +2023-04-05 16:00:39,567 BAD EPOCHS (no improvement): 1 +2023-04-05 16:00:39,570 ---------------------------------------------------------------------------------------------------- +2023-04-05 16:00:57,695 epoch 80 - iter 265/2650 - loss 0.02950655 - time (sec): 18.13 - samples/sec: 8089.41 - lr: 0.050000 +2023-04-05 16:01:15,737 epoch 80 - iter 530/2650 - loss 0.02989593 - time (sec): 36.17 - samples/sec: 8070.04 - lr: 0.050000 +2023-04-05 16:01:33,862 epoch 80 - iter 795/2650 - loss 0.02996041 - time (sec): 54.29 - samples/sec: 8103.12 - lr: 0.050000 +2023-04-05 16:01:51,500 epoch 80 - iter 1060/2650 - loss 0.03072004 - time (sec): 71.93 - samples/sec: 8127.75 - lr: 0.050000 +2023-04-05 16:02:09,453 epoch 80 - iter 1325/2650 - loss 0.03109382 - time (sec): 89.88 - samples/sec: 8140.36 - lr: 0.050000 +2023-04-05 16:02:27,965 epoch 80 - iter 1590/2650 - loss 0.03101502 - time (sec): 108.40 - samples/sec: 8107.23 - lr: 0.050000 +2023-04-05 16:02:45,623 epoch 80 - iter 1855/2650 - loss 0.03115635 - time (sec): 126.05 - samples/sec: 8117.33 - lr: 0.050000 +2023-04-05 16:03:03,686 epoch 80 - iter 2120/2650 - loss 0.03113706 - time (sec): 144.12 - samples/sec: 8117.75 - lr: 0.050000 +2023-04-05 16:03:21,897 epoch 80 - iter 2385/2650 - loss 0.03094054 - time (sec): 162.33 - samples/sec: 8110.00 - lr: 0.050000 +2023-04-05 16:03:40,227 epoch 80 - iter 2650/2650 - loss 0.03116852 - time (sec): 180.66 - samples/sec: 8094.68 - lr: 0.050000 +2023-04-05 16:03:40,227 ---------------------------------------------------------------------------------------------------- +2023-04-05 16:03:40,228 EPOCH 80 done: loss 0.0312 - lr 0.050000 +2023-04-05 16:03:40,228 BAD EPOCHS (no improvement): 2 +2023-04-05 16:03:40,231 ---------------------------------------------------------------------------------------------------- +2023-04-05 16:03:58,130 epoch 81 - iter 265/2650 - loss 0.03050701 - time (sec): 17.90 - samples/sec: 8098.05 - lr: 0.050000 +2023-04-05 16:04:16,414 epoch 81 - iter 530/2650 - loss 0.03099144 - time (sec): 36.18 - samples/sec: 8096.00 - lr: 0.050000 +2023-04-05 16:04:34,566 epoch 81 - iter 795/2650 - loss 0.03084154 - time (sec): 54.33 - samples/sec: 8076.94 - lr: 0.050000 +2023-04-05 16:04:52,456 epoch 81 - iter 1060/2650 - loss 0.03073356 - time (sec): 72.23 - samples/sec: 8070.74 - lr: 0.050000 +2023-04-05 16:05:10,431 epoch 81 - iter 1325/2650 - loss 0.03078831 - time (sec): 90.20 - samples/sec: 8083.26 - lr: 0.050000 +2023-04-05 16:05:28,262 epoch 81 - iter 1590/2650 - loss 0.03081613 - time (sec): 108.03 - samples/sec: 8106.14 - lr: 0.050000 +2023-04-05 16:05:46,986 epoch 81 - iter 1855/2650 - loss 0.03109769 - time (sec): 126.75 - samples/sec: 8067.07 - lr: 0.050000 +2023-04-05 16:06:04,787 epoch 81 - iter 2120/2650 - loss 0.03100634 - time (sec): 144.56 - samples/sec: 8081.72 - lr: 0.050000 +2023-04-05 16:06:22,670 epoch 81 - iter 2385/2650 - loss 0.03089991 - time (sec): 162.44 - samples/sec: 8096.42 - lr: 0.050000 +2023-04-05 16:06:41,240 epoch 81 - iter 2650/2650 - loss 0.03091406 - time (sec): 181.01 - samples/sec: 8078.95 - lr: 0.050000 +2023-04-05 16:06:41,240 ---------------------------------------------------------------------------------------------------- +2023-04-05 16:06:41,240 EPOCH 81 done: loss 0.0309 - lr 0.050000 +2023-04-05 16:06:41,241 BAD EPOCHS (no improvement): 0 +2023-04-05 16:06:41,244 ---------------------------------------------------------------------------------------------------- +2023-04-05 16:06:59,061 epoch 82 - iter 265/2650 - loss 0.03100058 - time (sec): 17.82 - samples/sec: 8127.65 - lr: 0.050000 +2023-04-05 16:07:17,635 epoch 82 - iter 530/2650 - loss 0.03067576 - time (sec): 36.39 - samples/sec: 8037.33 - lr: 0.050000 +2023-04-05 16:07:35,641 epoch 82 - iter 795/2650 - loss 0.03038061 - time (sec): 54.40 - samples/sec: 8073.86 - lr: 0.050000 +2023-04-05 16:07:53,434 epoch 82 - iter 1060/2650 - loss 0.03018400 - time (sec): 72.19 - samples/sec: 8104.42 - lr: 0.050000 +2023-04-05 16:08:11,687 epoch 82 - iter 1325/2650 - loss 0.03025144 - time (sec): 90.44 - samples/sec: 8101.04 - lr: 0.050000 +2023-04-05 16:08:29,600 epoch 82 - iter 1590/2650 - loss 0.03050428 - time (sec): 108.36 - samples/sec: 8099.65 - lr: 0.050000 +2023-04-05 16:08:47,189 epoch 82 - iter 1855/2650 - loss 0.03064468 - time (sec): 125.95 - samples/sec: 8119.68 - lr: 0.050000 +2023-04-05 16:09:05,192 epoch 82 - iter 2120/2650 - loss 0.03077815 - time (sec): 143.95 - samples/sec: 8116.08 - lr: 0.050000 +2023-04-05 16:09:23,817 epoch 82 - iter 2385/2650 - loss 0.03085177 - time (sec): 162.57 - samples/sec: 8094.99 - lr: 0.050000 +2023-04-05 16:09:41,828 epoch 82 - iter 2650/2650 - loss 0.03072148 - time (sec): 180.58 - samples/sec: 8097.95 - lr: 0.050000 +2023-04-05 16:09:41,829 ---------------------------------------------------------------------------------------------------- +2023-04-05 16:09:41,829 EPOCH 82 done: loss 0.0307 - lr 0.050000 +2023-04-05 16:09:41,829 BAD EPOCHS (no improvement): 0 +2023-04-05 16:09:41,832 ---------------------------------------------------------------------------------------------------- +2023-04-05 16:09:59,463 epoch 83 - iter 265/2650 - loss 0.03007558 - time (sec): 17.63 - samples/sec: 8219.74 - lr: 0.050000 +2023-04-05 16:10:17,821 epoch 83 - iter 530/2650 - loss 0.03044376 - time (sec): 35.99 - samples/sec: 8140.63 - lr: 0.050000 +2023-04-05 16:10:35,579 epoch 83 - iter 795/2650 - loss 0.03103522 - time (sec): 53.75 - samples/sec: 8180.82 - lr: 0.050000 +2023-04-05 16:10:53,640 epoch 83 - iter 1060/2650 - loss 0.03125184 - time (sec): 71.81 - samples/sec: 8157.94 - lr: 0.050000 +2023-04-05 16:11:11,401 epoch 83 - iter 1325/2650 - loss 0.03105806 - time (sec): 89.57 - samples/sec: 8152.43 - lr: 0.050000 +2023-04-05 16:11:29,272 epoch 83 - iter 1590/2650 - loss 0.03107680 - time (sec): 107.44 - samples/sec: 8167.05 - lr: 0.050000 +2023-04-05 16:11:47,670 epoch 83 - iter 1855/2650 - loss 0.03104069 - time (sec): 125.84 - samples/sec: 8151.68 - lr: 0.050000 +2023-04-05 16:12:05,620 epoch 83 - iter 2120/2650 - loss 0.03129541 - time (sec): 143.79 - samples/sec: 8136.79 - lr: 0.050000 +2023-04-05 16:12:24,158 epoch 83 - iter 2385/2650 - loss 0.03122815 - time (sec): 162.33 - samples/sec: 8107.14 - lr: 0.050000 +2023-04-05 16:12:42,791 epoch 83 - iter 2650/2650 - loss 0.03111928 - time (sec): 180.96 - samples/sec: 8081.19 - lr: 0.050000 +2023-04-05 16:12:42,791 ---------------------------------------------------------------------------------------------------- +2023-04-05 16:12:42,791 EPOCH 83 done: loss 0.0311 - lr 0.050000 +2023-04-05 16:12:42,791 BAD EPOCHS (no improvement): 1 +2023-04-05 16:12:42,794 ---------------------------------------------------------------------------------------------------- +2023-04-05 16:13:00,945 epoch 84 - iter 265/2650 - loss 0.03098471 - time (sec): 18.15 - samples/sec: 8020.19 - lr: 0.050000 +2023-04-05 16:13:18,559 epoch 84 - iter 530/2650 - loss 0.03063539 - time (sec): 35.77 - samples/sec: 8179.91 - lr: 0.050000 +2023-04-05 16:13:36,238 epoch 84 - iter 795/2650 - loss 0.03067449 - time (sec): 53.44 - samples/sec: 8154.95 - lr: 0.050000 +2023-04-05 16:13:54,683 epoch 84 - iter 1060/2650 - loss 0.03100105 - time (sec): 71.89 - samples/sec: 8112.63 - lr: 0.050000 +2023-04-05 16:14:12,667 epoch 84 - iter 1325/2650 - loss 0.03081692 - time (sec): 89.87 - samples/sec: 8121.75 - lr: 0.050000 +2023-04-05 16:14:30,441 epoch 84 - iter 1590/2650 - loss 0.03067709 - time (sec): 107.65 - samples/sec: 8122.66 - lr: 0.050000 +2023-04-05 16:14:48,354 epoch 84 - iter 1855/2650 - loss 0.03053990 - time (sec): 125.56 - samples/sec: 8127.30 - lr: 0.050000 +2023-04-05 16:15:06,115 epoch 84 - iter 2120/2650 - loss 0.03060062 - time (sec): 143.32 - samples/sec: 8142.75 - lr: 0.050000 +2023-04-05 16:15:24,699 epoch 84 - iter 2385/2650 - loss 0.03050306 - time (sec): 161.91 - samples/sec: 8118.83 - lr: 0.050000 +2023-04-05 16:15:43,592 epoch 84 - iter 2650/2650 - loss 0.03067195 - time (sec): 180.80 - samples/sec: 8088.36 - lr: 0.050000 +2023-04-05 16:15:43,593 ---------------------------------------------------------------------------------------------------- +2023-04-05 16:15:43,593 EPOCH 84 done: loss 0.0307 - lr 0.050000 +2023-04-05 16:15:43,593 BAD EPOCHS (no improvement): 0 +2023-04-05 16:15:43,595 ---------------------------------------------------------------------------------------------------- +2023-04-05 16:16:01,501 epoch 85 - iter 265/2650 - loss 0.02921295 - time (sec): 17.91 - samples/sec: 8124.98 - lr: 0.050000 +2023-04-05 16:16:19,840 epoch 85 - iter 530/2650 - loss 0.02994135 - time (sec): 36.24 - samples/sec: 8072.19 - lr: 0.050000 +2023-04-05 16:16:37,973 epoch 85 - iter 795/2650 - loss 0.02974127 - time (sec): 54.38 - samples/sec: 8047.48 - lr: 0.050000 +2023-04-05 16:16:55,992 epoch 85 - iter 1060/2650 - loss 0.02989692 - time (sec): 72.40 - samples/sec: 8076.21 - lr: 0.050000 +2023-04-05 16:17:13,728 epoch 85 - iter 1325/2650 - loss 0.02975561 - time (sec): 90.13 - samples/sec: 8100.20 - lr: 0.050000 +2023-04-05 16:17:32,023 epoch 85 - iter 1590/2650 - loss 0.03032414 - time (sec): 108.43 - samples/sec: 8092.06 - lr: 0.050000 +2023-04-05 16:17:50,156 epoch 85 - iter 1855/2650 - loss 0.03038329 - time (sec): 126.56 - samples/sec: 8093.43 - lr: 0.050000 +2023-04-05 16:18:08,567 epoch 85 - iter 2120/2650 - loss 0.03061367 - time (sec): 144.97 - samples/sec: 8081.07 - lr: 0.050000 +2023-04-05 16:18:26,274 epoch 85 - iter 2385/2650 - loss 0.03074929 - time (sec): 162.68 - samples/sec: 8089.12 - lr: 0.050000 +2023-04-05 16:18:44,937 epoch 85 - iter 2650/2650 - loss 0.03096049 - time (sec): 181.34 - samples/sec: 8064.15 - lr: 0.050000 +2023-04-05 16:18:44,937 ---------------------------------------------------------------------------------------------------- +2023-04-05 16:18:44,937 EPOCH 85 done: loss 0.0310 - lr 0.050000 +2023-04-05 16:18:44,937 BAD EPOCHS (no improvement): 1 +2023-04-05 16:18:44,940 ---------------------------------------------------------------------------------------------------- +2023-04-05 16:19:02,857 epoch 86 - iter 265/2650 - loss 0.03008857 - time (sec): 17.92 - samples/sec: 8089.51 - lr: 0.050000 +2023-04-05 16:19:20,840 epoch 86 - iter 530/2650 - loss 0.03090977 - time (sec): 35.90 - samples/sec: 8116.72 - lr: 0.050000 +2023-04-05 16:19:39,285 epoch 86 - iter 795/2650 - loss 0.03076073 - time (sec): 54.34 - samples/sec: 8064.40 - lr: 0.050000 +2023-04-05 16:19:57,579 epoch 86 - iter 1060/2650 - loss 0.03087074 - time (sec): 72.64 - samples/sec: 8061.27 - lr: 0.050000 +2023-04-05 16:20:15,769 epoch 86 - iter 1325/2650 - loss 0.03070933 - time (sec): 90.83 - samples/sec: 8057.78 - lr: 0.050000 +2023-04-05 16:20:34,211 epoch 86 - iter 1590/2650 - loss 0.03043000 - time (sec): 109.27 - samples/sec: 8032.85 - lr: 0.050000 +2023-04-05 16:20:52,733 epoch 86 - iter 1855/2650 - loss 0.03043706 - time (sec): 127.79 - samples/sec: 8020.06 - lr: 0.050000 +2023-04-05 16:21:10,877 epoch 86 - iter 2120/2650 - loss 0.03016968 - time (sec): 145.94 - samples/sec: 8023.45 - lr: 0.050000 +2023-04-05 16:21:29,029 epoch 86 - iter 2385/2650 - loss 0.03042293 - time (sec): 164.09 - samples/sec: 8024.32 - lr: 0.050000 +2023-04-05 16:21:46,853 epoch 86 - iter 2650/2650 - loss 0.03059590 - time (sec): 181.91 - samples/sec: 8038.83 - lr: 0.050000 +2023-04-05 16:21:46,853 ---------------------------------------------------------------------------------------------------- +2023-04-05 16:21:46,853 EPOCH 86 done: loss 0.0306 - lr 0.050000 +2023-04-05 16:21:46,853 BAD EPOCHS (no improvement): 0 +2023-04-05 16:21:46,856 ---------------------------------------------------------------------------------------------------- +2023-04-05 16:22:05,585 epoch 87 - iter 265/2650 - loss 0.03021581 - time (sec): 18.73 - samples/sec: 7939.10 - lr: 0.050000 +2023-04-05 16:22:23,907 epoch 87 - iter 530/2650 - loss 0.03088997 - time (sec): 37.05 - samples/sec: 7992.83 - lr: 0.050000 +2023-04-05 16:22:42,164 epoch 87 - iter 795/2650 - loss 0.03023432 - time (sec): 55.31 - samples/sec: 7963.03 - lr: 0.050000 +2023-04-05 16:23:00,173 epoch 87 - iter 1060/2650 - loss 0.02989709 - time (sec): 73.32 - samples/sec: 8009.40 - lr: 0.050000 +2023-04-05 16:23:17,884 epoch 87 - iter 1325/2650 - loss 0.02975284 - time (sec): 91.03 - samples/sec: 8033.66 - lr: 0.050000 +2023-04-05 16:23:36,263 epoch 87 - iter 1590/2650 - loss 0.02987707 - time (sec): 109.41 - samples/sec: 8023.02 - lr: 0.050000 +2023-04-05 16:23:54,085 epoch 87 - iter 1855/2650 - loss 0.03018207 - time (sec): 127.23 - samples/sec: 8039.17 - lr: 0.050000 +2023-04-05 16:24:12,728 epoch 87 - iter 2120/2650 - loss 0.03023263 - time (sec): 145.87 - samples/sec: 8023.16 - lr: 0.050000 +2023-04-05 16:24:30,895 epoch 87 - iter 2385/2650 - loss 0.03032780 - time (sec): 164.04 - samples/sec: 8026.13 - lr: 0.050000 +2023-04-05 16:24:49,001 epoch 87 - iter 2650/2650 - loss 0.03046973 - time (sec): 182.14 - samples/sec: 8028.57 - lr: 0.050000 +2023-04-05 16:24:49,001 ---------------------------------------------------------------------------------------------------- +2023-04-05 16:24:49,001 EPOCH 87 done: loss 0.0305 - lr 0.050000 +2023-04-05 16:24:49,001 BAD EPOCHS (no improvement): 0 +2023-04-05 16:24:49,004 ---------------------------------------------------------------------------------------------------- +2023-04-05 16:25:07,296 epoch 88 - iter 265/2650 - loss 0.03044841 - time (sec): 18.29 - samples/sec: 8045.33 - lr: 0.050000 +2023-04-05 16:25:25,938 epoch 88 - iter 530/2650 - loss 0.03076234 - time (sec): 36.93 - samples/sec: 7994.61 - lr: 0.050000 +2023-04-05 16:25:43,800 epoch 88 - iter 795/2650 - loss 0.02995183 - time (sec): 54.80 - samples/sec: 8038.70 - lr: 0.050000 +2023-04-05 16:26:01,710 epoch 88 - iter 1060/2650 - loss 0.03027499 - time (sec): 72.71 - samples/sec: 8066.43 - lr: 0.050000 +2023-04-05 16:26:19,350 epoch 88 - iter 1325/2650 - loss 0.03013454 - time (sec): 90.35 - samples/sec: 8095.04 - lr: 0.050000 +2023-04-05 16:26:37,303 epoch 88 - iter 1590/2650 - loss 0.03008684 - time (sec): 108.30 - samples/sec: 8080.16 - lr: 0.050000 +2023-04-05 16:26:55,627 epoch 88 - iter 1855/2650 - loss 0.02999024 - time (sec): 126.62 - samples/sec: 8065.00 - lr: 0.050000 +2023-04-05 16:27:13,947 epoch 88 - iter 2120/2650 - loss 0.03036241 - time (sec): 144.94 - samples/sec: 8066.63 - lr: 0.050000 +2023-04-05 16:27:32,068 epoch 88 - iter 2385/2650 - loss 0.03046138 - time (sec): 163.06 - samples/sec: 8069.14 - lr: 0.050000 +2023-04-05 16:27:50,594 epoch 88 - iter 2650/2650 - loss 0.03041590 - time (sec): 181.59 - samples/sec: 8053.10 - lr: 0.050000 +2023-04-05 16:27:50,594 ---------------------------------------------------------------------------------------------------- +2023-04-05 16:27:50,594 EPOCH 88 done: loss 0.0304 - lr 0.050000 +2023-04-05 16:27:50,594 BAD EPOCHS (no improvement): 0 +2023-04-05 16:27:50,597 ---------------------------------------------------------------------------------------------------- +2023-04-05 16:28:08,653 epoch 89 - iter 265/2650 - loss 0.03011771 - time (sec): 18.06 - samples/sec: 8023.00 - lr: 0.050000 +2023-04-05 16:28:26,717 epoch 89 - iter 530/2650 - loss 0.03039898 - time (sec): 36.12 - samples/sec: 8093.71 - lr: 0.050000 +2023-04-05 16:28:45,518 epoch 89 - iter 795/2650 - loss 0.03040671 - time (sec): 54.92 - samples/sec: 7984.38 - lr: 0.050000 +2023-04-05 16:29:04,469 epoch 89 - iter 1060/2650 - loss 0.03037468 - time (sec): 73.87 - samples/sec: 7958.95 - lr: 0.050000 +2023-04-05 16:29:22,026 epoch 89 - iter 1325/2650 - loss 0.03021385 - time (sec): 91.43 - samples/sec: 8032.50 - lr: 0.050000 +2023-04-05 16:29:39,600 epoch 89 - iter 1590/2650 - loss 0.03021893 - time (sec): 109.00 - samples/sec: 8061.57 - lr: 0.050000 +2023-04-05 16:29:57,913 epoch 89 - iter 1855/2650 - loss 0.03034696 - time (sec): 127.32 - samples/sec: 8051.94 - lr: 0.050000 +2023-04-05 16:30:16,183 epoch 89 - iter 2120/2650 - loss 0.03037544 - time (sec): 145.59 - samples/sec: 8046.92 - lr: 0.050000 +2023-04-05 16:30:34,417 epoch 89 - iter 2385/2650 - loss 0.03025423 - time (sec): 163.82 - samples/sec: 8038.08 - lr: 0.050000 +2023-04-05 16:30:52,372 epoch 89 - iter 2650/2650 - loss 0.03028481 - time (sec): 181.78 - samples/sec: 8044.90 - lr: 0.050000 +2023-04-05 16:30:52,373 ---------------------------------------------------------------------------------------------------- +2023-04-05 16:30:52,373 EPOCH 89 done: loss 0.0303 - lr 0.050000 +2023-04-05 16:30:52,373 BAD EPOCHS (no improvement): 0 +2023-04-05 16:30:52,376 ---------------------------------------------------------------------------------------------------- +2023-04-05 16:31:10,560 epoch 90 - iter 265/2650 - loss 0.02991978 - time (sec): 18.18 - samples/sec: 8061.70 - lr: 0.050000 +2023-04-05 16:31:28,781 epoch 90 - iter 530/2650 - loss 0.02984146 - time (sec): 36.41 - samples/sec: 8095.14 - lr: 0.050000 +2023-04-05 16:31:46,518 epoch 90 - iter 795/2650 - loss 0.02961434 - time (sec): 54.14 - samples/sec: 8125.00 - lr: 0.050000 +2023-04-05 16:32:04,992 epoch 90 - iter 1060/2650 - loss 0.02989024 - time (sec): 72.62 - samples/sec: 8079.68 - lr: 0.050000 +2023-04-05 16:32:32,914 epoch 90 - iter 1325/2650 - loss 0.02968093 - time (sec): 100.54 - samples/sec: 7281.89 - lr: 0.050000 +2023-04-05 16:32:51,315 epoch 90 - iter 1590/2650 - loss 0.02980051 - time (sec): 118.94 - samples/sec: 7378.41 - lr: 0.050000 +2023-04-05 16:33:09,532 epoch 90 - iter 1855/2650 - loss 0.02991638 - time (sec): 137.16 - samples/sec: 7466.90 - lr: 0.050000 +2023-04-05 16:33:27,502 epoch 90 - iter 2120/2650 - loss 0.02991097 - time (sec): 155.13 - samples/sec: 7552.23 - lr: 0.050000 +2023-04-05 16:33:45,657 epoch 90 - iter 2385/2650 - loss 0.02989985 - time (sec): 173.28 - samples/sec: 7604.17 - lr: 0.050000 +2023-04-05 16:34:03,358 epoch 90 - iter 2650/2650 - loss 0.03001918 - time (sec): 190.98 - samples/sec: 7657.06 - lr: 0.050000 +2023-04-05 16:34:03,359 ---------------------------------------------------------------------------------------------------- +2023-04-05 16:34:03,359 EPOCH 90 done: loss 0.0300 - lr 0.050000 +2023-04-05 16:34:03,359 BAD EPOCHS (no improvement): 0 +2023-04-05 16:34:03,362 ---------------------------------------------------------------------------------------------------- +2023-04-05 16:34:21,520 epoch 91 - iter 265/2650 - loss 0.02881073 - time (sec): 18.16 - samples/sec: 7962.20 - lr: 0.050000 +2023-04-05 16:34:39,620 epoch 91 - iter 530/2650 - loss 0.02847586 - time (sec): 36.26 - samples/sec: 8003.81 - lr: 0.050000 +2023-04-05 16:34:57,714 epoch 91 - iter 795/2650 - loss 0.02862172 - time (sec): 54.35 - samples/sec: 8063.19 - lr: 0.050000 +2023-04-05 16:35:16,027 epoch 91 - iter 1060/2650 - loss 0.02918594 - time (sec): 72.67 - samples/sec: 8041.02 - lr: 0.050000 +2023-04-05 16:35:34,298 epoch 91 - iter 1325/2650 - loss 0.02972446 - time (sec): 90.94 - samples/sec: 8046.55 - lr: 0.050000 +2023-04-05 16:35:52,429 epoch 91 - iter 1590/2650 - loss 0.02982420 - time (sec): 109.07 - samples/sec: 8047.33 - lr: 0.050000 +2023-04-05 16:36:10,726 epoch 91 - iter 1855/2650 - loss 0.02983972 - time (sec): 127.36 - samples/sec: 8045.16 - lr: 0.050000 +2023-04-05 16:36:28,755 epoch 91 - iter 2120/2650 - loss 0.02995110 - time (sec): 145.39 - samples/sec: 8054.55 - lr: 0.050000 +2023-04-05 16:36:47,129 epoch 91 - iter 2385/2650 - loss 0.02980799 - time (sec): 163.77 - samples/sec: 8044.99 - lr: 0.050000 +2023-04-05 16:37:05,059 epoch 91 - iter 2650/2650 - loss 0.02989641 - time (sec): 181.70 - samples/sec: 8048.36 - lr: 0.050000 +2023-04-05 16:37:05,059 ---------------------------------------------------------------------------------------------------- +2023-04-05 16:37:05,059 EPOCH 91 done: loss 0.0299 - lr 0.050000 +2023-04-05 16:37:05,059 BAD EPOCHS (no improvement): 0 +2023-04-05 16:37:05,062 ---------------------------------------------------------------------------------------------------- +2023-04-05 16:37:23,748 epoch 92 - iter 265/2650 - loss 0.03033049 - time (sec): 18.69 - samples/sec: 7939.02 - lr: 0.050000 +2023-04-05 16:37:41,714 epoch 92 - iter 530/2650 - loss 0.03040671 - time (sec): 36.65 - samples/sec: 8001.88 - lr: 0.050000 +2023-04-05 16:37:59,570 epoch 92 - iter 795/2650 - loss 0.03021733 - time (sec): 54.51 - samples/sec: 8054.26 - lr: 0.050000 +2023-04-05 16:38:17,859 epoch 92 - iter 1060/2650 - loss 0.03026141 - time (sec): 72.80 - samples/sec: 8048.30 - lr: 0.050000 +2023-04-05 16:38:36,487 epoch 92 - iter 1325/2650 - loss 0.03019434 - time (sec): 91.42 - samples/sec: 8018.19 - lr: 0.050000 +2023-04-05 16:38:54,144 epoch 92 - iter 1590/2650 - loss 0.03001710 - time (sec): 109.08 - samples/sec: 8049.78 - lr: 0.050000 +2023-04-05 16:39:12,618 epoch 92 - iter 1855/2650 - loss 0.02993196 - time (sec): 127.56 - samples/sec: 8036.82 - lr: 0.050000 +2023-04-05 16:39:30,360 epoch 92 - iter 2120/2650 - loss 0.02977772 - time (sec): 145.30 - samples/sec: 8048.77 - lr: 0.050000 +2023-04-05 16:39:48,456 epoch 92 - iter 2385/2650 - loss 0.02998377 - time (sec): 163.39 - samples/sec: 8054.63 - lr: 0.050000 +2023-04-05 16:40:06,587 epoch 92 - iter 2650/2650 - loss 0.02985869 - time (sec): 181.52 - samples/sec: 8055.99 - lr: 0.050000 +2023-04-05 16:40:06,587 ---------------------------------------------------------------------------------------------------- +2023-04-05 16:40:06,587 EPOCH 92 done: loss 0.0299 - lr 0.050000 +2023-04-05 16:40:06,587 BAD EPOCHS (no improvement): 0 +2023-04-05 16:40:06,590 ---------------------------------------------------------------------------------------------------- +2023-04-05 16:40:24,574 epoch 93 - iter 265/2650 - loss 0.02827410 - time (sec): 17.98 - samples/sec: 8109.86 - lr: 0.050000 +2023-04-05 16:40:42,808 epoch 93 - iter 530/2650 - loss 0.02855756 - time (sec): 36.22 - samples/sec: 8050.76 - lr: 0.050000 +2023-04-05 16:41:01,491 epoch 93 - iter 795/2650 - loss 0.02918833 - time (sec): 54.90 - samples/sec: 8016.44 - lr: 0.050000 +2023-04-05 16:41:19,699 epoch 93 - iter 1060/2650 - loss 0.02917837 - time (sec): 73.11 - samples/sec: 8019.22 - lr: 0.050000 +2023-04-05 16:41:38,081 epoch 93 - iter 1325/2650 - loss 0.02932871 - time (sec): 91.49 - samples/sec: 8017.09 - lr: 0.050000 +2023-04-05 16:41:56,384 epoch 93 - iter 1590/2650 - loss 0.02943757 - time (sec): 109.79 - samples/sec: 8015.64 - lr: 0.050000 +2023-04-05 16:42:14,583 epoch 93 - iter 1855/2650 - loss 0.02945684 - time (sec): 127.99 - samples/sec: 8011.31 - lr: 0.050000 +2023-04-05 16:42:32,476 epoch 93 - iter 2120/2650 - loss 0.02964349 - time (sec): 145.89 - samples/sec: 8022.56 - lr: 0.050000 +2023-04-05 16:42:50,352 epoch 93 - iter 2385/2650 - loss 0.02964837 - time (sec): 163.76 - samples/sec: 8028.49 - lr: 0.050000 +2023-04-05 16:43:08,992 epoch 93 - iter 2650/2650 - loss 0.02982741 - time (sec): 182.40 - samples/sec: 8017.27 - lr: 0.050000 +2023-04-05 16:43:08,992 ---------------------------------------------------------------------------------------------------- +2023-04-05 16:43:08,992 EPOCH 93 done: loss 0.0298 - lr 0.050000 +2023-04-05 16:43:08,992 BAD EPOCHS (no improvement): 0 +2023-04-05 16:43:08,995 ---------------------------------------------------------------------------------------------------- +2023-04-05 16:43:26,676 epoch 94 - iter 265/2650 - loss 0.02866443 - time (sec): 17.68 - samples/sec: 8167.63 - lr: 0.050000 +2023-04-05 16:43:46,537 epoch 94 - iter 530/2650 - loss 0.02948036 - time (sec): 37.54 - samples/sec: 7866.72 - lr: 0.050000 +2023-04-05 16:44:04,148 epoch 94 - iter 795/2650 - loss 0.02922681 - time (sec): 55.15 - samples/sec: 8019.93 - lr: 0.050000 +2023-04-05 16:44:22,579 epoch 94 - iter 1060/2650 - loss 0.02936435 - time (sec): 73.58 - samples/sec: 8013.79 - lr: 0.050000 +2023-04-05 16:44:40,548 epoch 94 - iter 1325/2650 - loss 0.02959460 - time (sec): 91.55 - samples/sec: 8038.43 - lr: 0.050000 +2023-04-05 16:44:58,890 epoch 94 - iter 1590/2650 - loss 0.02977258 - time (sec): 109.90 - samples/sec: 8024.03 - lr: 0.050000 +2023-04-05 16:45:16,669 epoch 94 - iter 1855/2650 - loss 0.02969671 - time (sec): 127.67 - samples/sec: 8045.72 - lr: 0.050000 +2023-04-05 16:45:34,761 epoch 94 - iter 2120/2650 - loss 0.02990761 - time (sec): 145.77 - samples/sec: 8046.57 - lr: 0.050000 +2023-04-05 16:45:52,172 epoch 94 - iter 2385/2650 - loss 0.02996676 - time (sec): 163.18 - samples/sec: 8076.70 - lr: 0.050000 +2023-04-05 16:46:09,904 epoch 94 - iter 2650/2650 - loss 0.02981403 - time (sec): 180.91 - samples/sec: 8083.42 - lr: 0.050000 +2023-04-05 16:46:09,904 ---------------------------------------------------------------------------------------------------- +2023-04-05 16:46:09,904 EPOCH 94 done: loss 0.0298 - lr 0.050000 +2023-04-05 16:46:09,904 BAD EPOCHS (no improvement): 0 +2023-04-05 16:46:09,907 ---------------------------------------------------------------------------------------------------- +2023-04-05 16:46:28,147 epoch 95 - iter 265/2650 - loss 0.02895740 - time (sec): 18.24 - samples/sec: 8059.25 - lr: 0.050000 +2023-04-05 16:46:46,766 epoch 95 - iter 530/2650 - loss 0.02886901 - time (sec): 36.86 - samples/sec: 7973.48 - lr: 0.050000 +2023-04-05 16:47:04,525 epoch 95 - iter 795/2650 - loss 0.02892029 - time (sec): 54.62 - samples/sec: 8064.12 - lr: 0.050000 +2023-04-05 16:47:22,679 epoch 95 - iter 1060/2650 - loss 0.02926013 - time (sec): 72.77 - samples/sec: 8058.89 - lr: 0.050000 +2023-04-05 16:47:41,056 epoch 95 - iter 1325/2650 - loss 0.02928027 - time (sec): 91.15 - samples/sec: 8039.45 - lr: 0.050000 +2023-04-05 16:47:59,123 epoch 95 - iter 1590/2650 - loss 0.02930187 - time (sec): 109.22 - samples/sec: 8050.74 - lr: 0.050000 +2023-04-05 16:48:17,553 epoch 95 - iter 1855/2650 - loss 0.02942059 - time (sec): 127.65 - samples/sec: 8031.58 - lr: 0.050000 +2023-04-05 16:48:35,340 epoch 95 - iter 2120/2650 - loss 0.02952642 - time (sec): 145.43 - samples/sec: 8058.00 - lr: 0.050000 +2023-04-05 16:48:53,350 epoch 95 - iter 2385/2650 - loss 0.02966751 - time (sec): 163.44 - samples/sec: 8059.43 - lr: 0.050000 +2023-04-05 16:49:11,731 epoch 95 - iter 2650/2650 - loss 0.02968892 - time (sec): 181.82 - samples/sec: 8042.73 - lr: 0.050000 +2023-04-05 16:49:11,732 ---------------------------------------------------------------------------------------------------- +2023-04-05 16:49:11,732 EPOCH 95 done: loss 0.0297 - lr 0.050000 +2023-04-05 16:49:11,732 BAD EPOCHS (no improvement): 0 +2023-04-05 16:49:11,734 ---------------------------------------------------------------------------------------------------- +2023-04-05 16:49:29,915 epoch 96 - iter 265/2650 - loss 0.03009647 - time (sec): 18.18 - samples/sec: 8049.69 - lr: 0.050000 +2023-04-05 16:49:48,531 epoch 96 - iter 530/2650 - loss 0.02956403 - time (sec): 36.80 - samples/sec: 7995.24 - lr: 0.050000 +2023-04-05 16:50:06,476 epoch 96 - iter 795/2650 - loss 0.03003335 - time (sec): 54.74 - samples/sec: 8034.75 - lr: 0.050000 +2023-04-05 16:50:24,166 epoch 96 - iter 1060/2650 - loss 0.02921479 - time (sec): 72.43 - samples/sec: 8063.32 - lr: 0.050000 +2023-04-05 16:50:42,596 epoch 96 - iter 1325/2650 - loss 0.02963404 - time (sec): 90.86 - samples/sec: 8053.04 - lr: 0.050000 +2023-04-05 16:51:01,017 epoch 96 - iter 1590/2650 - loss 0.02951184 - time (sec): 109.28 - samples/sec: 8038.85 - lr: 0.050000 +2023-04-05 16:51:19,304 epoch 96 - iter 1855/2650 - loss 0.02954697 - time (sec): 127.57 - samples/sec: 8033.10 - lr: 0.050000 +2023-04-05 16:51:36,705 epoch 96 - iter 2120/2650 - loss 0.02964479 - time (sec): 144.97 - samples/sec: 8069.11 - lr: 0.050000 +2023-04-05 16:51:54,493 epoch 96 - iter 2385/2650 - loss 0.02951076 - time (sec): 162.76 - samples/sec: 8089.96 - lr: 0.050000 +2023-04-05 16:52:12,436 epoch 96 - iter 2650/2650 - loss 0.02957345 - time (sec): 180.70 - samples/sec: 8092.68 - lr: 0.050000 +2023-04-05 16:52:12,437 ---------------------------------------------------------------------------------------------------- +2023-04-05 16:52:12,437 EPOCH 96 done: loss 0.0296 - lr 0.050000 +2023-04-05 16:52:12,437 BAD EPOCHS (no improvement): 0 +2023-04-05 16:52:12,443 ---------------------------------------------------------------------------------------------------- +2023-04-05 16:52:30,854 epoch 97 - iter 265/2650 - loss 0.02918383 - time (sec): 18.41 - samples/sec: 7948.55 - lr: 0.050000 +2023-04-05 16:52:48,435 epoch 97 - iter 530/2650 - loss 0.03102801 - time (sec): 35.99 - samples/sec: 8094.63 - lr: 0.050000 +2023-04-05 16:53:06,288 epoch 97 - iter 795/2650 - loss 0.03124657 - time (sec): 53.84 - samples/sec: 8139.20 - lr: 0.050000 +2023-04-05 16:53:24,343 epoch 97 - iter 1060/2650 - loss 0.03052383 - time (sec): 71.90 - samples/sec: 8126.81 - lr: 0.050000 +2023-04-05 16:53:42,424 epoch 97 - iter 1325/2650 - loss 0.03026245 - time (sec): 89.98 - samples/sec: 8104.86 - lr: 0.050000 +2023-04-05 16:54:00,806 epoch 97 - iter 1590/2650 - loss 0.02996778 - time (sec): 108.36 - samples/sec: 8083.87 - lr: 0.050000 +2023-04-05 16:54:18,390 epoch 97 - iter 1855/2650 - loss 0.02986189 - time (sec): 125.95 - samples/sec: 8104.83 - lr: 0.050000 +2023-04-05 16:54:37,305 epoch 97 - iter 2120/2650 - loss 0.02969668 - time (sec): 144.86 - samples/sec: 8060.78 - lr: 0.050000 +2023-04-05 16:54:55,300 epoch 97 - iter 2385/2650 - loss 0.02970671 - time (sec): 162.86 - samples/sec: 8074.56 - lr: 0.050000 +2023-04-05 16:55:13,324 epoch 97 - iter 2650/2650 - loss 0.02952680 - time (sec): 180.88 - samples/sec: 8084.66 - lr: 0.050000 +2023-04-05 16:55:13,325 ---------------------------------------------------------------------------------------------------- +2023-04-05 16:55:13,325 EPOCH 97 done: loss 0.0295 - lr 0.050000 +2023-04-05 16:55:13,325 BAD EPOCHS (no improvement): 0 +2023-04-05 16:55:13,328 ---------------------------------------------------------------------------------------------------- +2023-04-05 16:55:31,075 epoch 98 - iter 265/2650 - loss 0.02847034 - time (sec): 17.75 - samples/sec: 8254.94 - lr: 0.050000 +2023-04-05 16:55:49,547 epoch 98 - iter 530/2650 - loss 0.02884925 - time (sec): 36.22 - samples/sec: 8098.88 - lr: 0.050000 +2023-04-05 16:56:07,629 epoch 98 - iter 795/2650 - loss 0.02899023 - time (sec): 54.30 - samples/sec: 8087.80 - lr: 0.050000 +2023-04-05 16:56:25,658 epoch 98 - iter 1060/2650 - loss 0.02907776 - time (sec): 72.33 - samples/sec: 8082.69 - lr: 0.050000 +2023-04-05 16:56:43,974 epoch 98 - iter 1325/2650 - loss 0.02932887 - time (sec): 90.65 - samples/sec: 8071.21 - lr: 0.050000 +2023-04-05 16:57:02,287 epoch 98 - iter 1590/2650 - loss 0.02965113 - time (sec): 108.96 - samples/sec: 8053.60 - lr: 0.050000 +2023-04-05 16:57:20,427 epoch 98 - iter 1855/2650 - loss 0.02943823 - time (sec): 127.10 - samples/sec: 8058.22 - lr: 0.050000 +2023-04-05 16:57:38,095 epoch 98 - iter 2120/2650 - loss 0.02947932 - time (sec): 144.77 - samples/sec: 8076.23 - lr: 0.050000 +2023-04-05 16:57:56,128 epoch 98 - iter 2385/2650 - loss 0.02939530 - time (sec): 162.80 - samples/sec: 8089.82 - lr: 0.050000 +2023-04-05 16:58:13,740 epoch 98 - iter 2650/2650 - loss 0.02944466 - time (sec): 180.41 - samples/sec: 8105.67 - lr: 0.050000 +2023-04-05 16:58:13,740 ---------------------------------------------------------------------------------------------------- +2023-04-05 16:58:13,741 EPOCH 98 done: loss 0.0294 - lr 0.050000 +2023-04-05 16:58:13,741 BAD EPOCHS (no improvement): 0 +2023-04-05 16:58:13,744 ---------------------------------------------------------------------------------------------------- +2023-04-05 16:58:32,721 epoch 99 - iter 265/2650 - loss 0.02877541 - time (sec): 18.98 - samples/sec: 7841.34 - lr: 0.050000 +2023-04-05 16:58:50,985 epoch 99 - iter 530/2650 - loss 0.02948008 - time (sec): 37.24 - samples/sec: 7923.51 - lr: 0.050000 +2023-04-05 16:59:08,333 epoch 99 - iter 795/2650 - loss 0.02911033 - time (sec): 54.59 - samples/sec: 8044.60 - lr: 0.050000 +2023-04-05 16:59:26,819 epoch 99 - iter 1060/2650 - loss 0.02905510 - time (sec): 73.07 - samples/sec: 8021.48 - lr: 0.050000 +2023-04-05 16:59:44,881 epoch 99 - iter 1325/2650 - loss 0.02924257 - time (sec): 91.14 - samples/sec: 8034.10 - lr: 0.050000 +2023-04-05 17:00:02,943 epoch 99 - iter 1590/2650 - loss 0.02948078 - time (sec): 109.20 - samples/sec: 8045.71 - lr: 0.050000 +2023-04-05 17:00:20,447 epoch 99 - iter 1855/2650 - loss 0.02942945 - time (sec): 126.70 - samples/sec: 8071.34 - lr: 0.050000 +2023-04-05 17:00:38,876 epoch 99 - iter 2120/2650 - loss 0.02963024 - time (sec): 145.13 - samples/sec: 8060.66 - lr: 0.050000 +2023-04-05 17:00:56,692 epoch 99 - iter 2385/2650 - loss 0.02963172 - time (sec): 162.95 - samples/sec: 8080.89 - lr: 0.050000 +2023-04-05 17:01:14,375 epoch 99 - iter 2650/2650 - loss 0.02964568 - time (sec): 180.63 - samples/sec: 8095.87 - lr: 0.050000 +2023-04-05 17:01:14,375 ---------------------------------------------------------------------------------------------------- +2023-04-05 17:01:14,375 EPOCH 99 done: loss 0.0296 - lr 0.050000 +2023-04-05 17:01:14,375 BAD EPOCHS (no improvement): 1 +2023-04-05 17:01:14,380 ---------------------------------------------------------------------------------------------------- +2023-04-05 17:01:32,311 epoch 100 - iter 265/2650 - loss 0.02806300 - time (sec): 17.93 - samples/sec: 8182.21 - lr: 0.050000 +2023-04-05 17:01:50,229 epoch 100 - iter 530/2650 - loss 0.02840293 - time (sec): 35.85 - samples/sec: 8137.97 - lr: 0.050000 +2023-04-05 17:02:07,598 epoch 100 - iter 795/2650 - loss 0.02908684 - time (sec): 53.22 - samples/sec: 8184.05 - lr: 0.050000 +2023-04-05 17:02:26,045 epoch 100 - iter 1060/2650 - loss 0.02915101 - time (sec): 71.67 - samples/sec: 8163.15 - lr: 0.050000 +2023-04-05 17:02:44,640 epoch 100 - iter 1325/2650 - loss 0.02927592 - time (sec): 90.26 - samples/sec: 8086.97 - lr: 0.050000 +2023-04-05 17:03:02,661 epoch 100 - iter 1590/2650 - loss 0.02929555 - time (sec): 108.28 - samples/sec: 8079.65 - lr: 0.050000 +2023-04-05 17:03:20,726 epoch 100 - iter 1855/2650 - loss 0.02930320 - time (sec): 126.35 - samples/sec: 8086.82 - lr: 0.050000 +2023-04-05 17:03:38,502 epoch 100 - iter 2120/2650 - loss 0.02920282 - time (sec): 144.12 - samples/sec: 8107.50 - lr: 0.050000 +2023-04-05 17:03:56,780 epoch 100 - iter 2385/2650 - loss 0.02936988 - time (sec): 162.40 - samples/sec: 8106.99 - lr: 0.050000 +2023-04-05 17:04:14,878 epoch 100 - iter 2650/2650 - loss 0.02943625 - time (sec): 180.50 - samples/sec: 8101.81 - lr: 0.050000 +2023-04-05 17:04:14,878 ---------------------------------------------------------------------------------------------------- +2023-04-05 17:04:14,878 EPOCH 100 done: loss 0.0294 - lr 0.050000 +2023-04-05 17:04:14,878 BAD EPOCHS (no improvement): 0 +2023-04-05 17:04:14,881 ---------------------------------------------------------------------------------------------------- +2023-04-05 17:04:32,958 epoch 101 - iter 265/2650 - loss 0.02856568 - time (sec): 18.08 - samples/sec: 8104.10 - lr: 0.050000 +2023-04-05 17:04:50,935 epoch 101 - iter 530/2650 - loss 0.02857157 - time (sec): 36.05 - samples/sec: 8153.58 - lr: 0.050000 +2023-04-05 17:05:08,959 epoch 101 - iter 795/2650 - loss 0.02821683 - time (sec): 54.08 - samples/sec: 8155.51 - lr: 0.050000 +2023-04-05 17:05:27,317 epoch 101 - iter 1060/2650 - loss 0.02834932 - time (sec): 72.44 - samples/sec: 8116.06 - lr: 0.050000 +2023-04-05 17:05:45,283 epoch 101 - iter 1325/2650 - loss 0.02880835 - time (sec): 90.40 - samples/sec: 8134.83 - lr: 0.050000 +2023-04-05 17:06:03,451 epoch 101 - iter 1590/2650 - loss 0.02890159 - time (sec): 108.57 - samples/sec: 8111.15 - lr: 0.050000 +2023-04-05 17:06:21,708 epoch 101 - iter 1855/2650 - loss 0.02911856 - time (sec): 126.83 - samples/sec: 8084.83 - lr: 0.050000 +2023-04-05 17:06:39,269 epoch 101 - iter 2120/2650 - loss 0.02908659 - time (sec): 144.39 - samples/sec: 8101.30 - lr: 0.050000 +2023-04-05 17:06:57,657 epoch 101 - iter 2385/2650 - loss 0.02917721 - time (sec): 162.78 - samples/sec: 8089.55 - lr: 0.050000 +2023-04-05 17:07:15,469 epoch 101 - iter 2650/2650 - loss 0.02910207 - time (sec): 180.59 - samples/sec: 8097.82 - lr: 0.050000 +2023-04-05 17:07:15,469 ---------------------------------------------------------------------------------------------------- +2023-04-05 17:07:15,469 EPOCH 101 done: loss 0.0291 - lr 0.050000 +2023-04-05 17:07:15,469 BAD EPOCHS (no improvement): 0 +2023-04-05 17:07:15,471 ---------------------------------------------------------------------------------------------------- +2023-04-05 17:07:33,470 epoch 102 - iter 265/2650 - loss 0.02966051 - time (sec): 18.00 - samples/sec: 8160.56 - lr: 0.050000 +2023-04-05 17:07:51,711 epoch 102 - iter 530/2650 - loss 0.02912085 - time (sec): 36.24 - samples/sec: 8110.99 - lr: 0.050000 +2023-04-05 17:08:09,539 epoch 102 - iter 795/2650 - loss 0.02928129 - time (sec): 54.07 - samples/sec: 8130.63 - lr: 0.050000 +2023-04-05 17:08:27,188 epoch 102 - iter 1060/2650 - loss 0.02900651 - time (sec): 71.72 - samples/sec: 8163.84 - lr: 0.050000 +2023-04-05 17:08:44,877 epoch 102 - iter 1325/2650 - loss 0.02897097 - time (sec): 89.41 - samples/sec: 8168.80 - lr: 0.050000 +2023-04-05 17:09:02,957 epoch 102 - iter 1590/2650 - loss 0.02919493 - time (sec): 107.49 - samples/sec: 8164.94 - lr: 0.050000 +2023-04-05 17:09:21,473 epoch 102 - iter 1855/2650 - loss 0.02920688 - time (sec): 126.00 - samples/sec: 8128.33 - lr: 0.050000 +2023-04-05 17:09:39,513 epoch 102 - iter 2120/2650 - loss 0.02927457 - time (sec): 144.04 - samples/sec: 8120.58 - lr: 0.050000 +2023-04-05 17:09:57,986 epoch 102 - iter 2385/2650 - loss 0.02924242 - time (sec): 162.51 - samples/sec: 8097.99 - lr: 0.050000 +2023-04-05 17:10:16,196 epoch 102 - iter 2650/2650 - loss 0.02926345 - time (sec): 180.72 - samples/sec: 8091.68 - lr: 0.050000 +2023-04-05 17:10:16,196 ---------------------------------------------------------------------------------------------------- +2023-04-05 17:10:16,196 EPOCH 102 done: loss 0.0293 - lr 0.050000 +2023-04-05 17:10:16,196 BAD EPOCHS (no improvement): 1 +2023-04-05 17:10:16,198 ---------------------------------------------------------------------------------------------------- +2023-04-05 17:10:34,431 epoch 103 - iter 265/2650 - loss 0.02986082 - time (sec): 18.23 - samples/sec: 8053.92 - lr: 0.050000 +2023-04-05 17:10:52,721 epoch 103 - iter 530/2650 - loss 0.02833752 - time (sec): 36.52 - samples/sec: 8004.48 - lr: 0.050000 +2023-04-05 17:11:11,286 epoch 103 - iter 795/2650 - loss 0.02840340 - time (sec): 55.09 - samples/sec: 8006.30 - lr: 0.050000 +2023-04-05 17:11:30,013 epoch 103 - iter 1060/2650 - loss 0.02874919 - time (sec): 73.81 - samples/sec: 7984.64 - lr: 0.050000 +2023-04-05 17:11:48,075 epoch 103 - iter 1325/2650 - loss 0.02904599 - time (sec): 91.88 - samples/sec: 8006.33 - lr: 0.050000 +2023-04-05 17:12:05,630 epoch 103 - iter 1590/2650 - loss 0.02924025 - time (sec): 109.43 - samples/sec: 8047.91 - lr: 0.050000 +2023-04-05 17:12:23,220 epoch 103 - iter 1855/2650 - loss 0.02913116 - time (sec): 127.02 - samples/sec: 8073.43 - lr: 0.050000 +2023-04-05 17:12:40,558 epoch 103 - iter 2120/2650 - loss 0.02903550 - time (sec): 144.36 - samples/sec: 8096.64 - lr: 0.050000 +2023-04-05 17:12:59,050 epoch 103 - iter 2385/2650 - loss 0.02903728 - time (sec): 162.85 - samples/sec: 8083.27 - lr: 0.050000 +2023-04-05 17:13:17,058 epoch 103 - iter 2650/2650 - loss 0.02901260 - time (sec): 180.86 - samples/sec: 8085.63 - lr: 0.050000 +2023-04-05 17:13:17,058 ---------------------------------------------------------------------------------------------------- +2023-04-05 17:13:17,059 EPOCH 103 done: loss 0.0290 - lr 0.050000 +2023-04-05 17:13:17,059 BAD EPOCHS (no improvement): 0 +2023-04-05 17:13:17,061 ---------------------------------------------------------------------------------------------------- +2023-04-05 17:13:35,434 epoch 104 - iter 265/2650 - loss 0.02795252 - time (sec): 18.37 - samples/sec: 7961.70 - lr: 0.050000 +2023-04-05 17:13:53,565 epoch 104 - iter 530/2650 - loss 0.02813495 - time (sec): 36.50 - samples/sec: 8034.54 - lr: 0.050000 +2023-04-05 17:14:12,267 epoch 104 - iter 795/2650 - loss 0.02836407 - time (sec): 55.21 - samples/sec: 7971.23 - lr: 0.050000 +2023-04-05 17:14:30,757 epoch 104 - iter 1060/2650 - loss 0.02860051 - time (sec): 73.70 - samples/sec: 7949.02 - lr: 0.050000 +2023-04-05 17:14:49,014 epoch 104 - iter 1325/2650 - loss 0.02853786 - time (sec): 91.95 - samples/sec: 7967.92 - lr: 0.050000 +2023-04-05 17:15:06,839 epoch 104 - iter 1590/2650 - loss 0.02855968 - time (sec): 109.78 - samples/sec: 7988.34 - lr: 0.050000 +2023-04-05 17:15:24,944 epoch 104 - iter 1855/2650 - loss 0.02894790 - time (sec): 127.88 - samples/sec: 8007.18 - lr: 0.050000 +2023-04-05 17:15:43,273 epoch 104 - iter 2120/2650 - loss 0.02906222 - time (sec): 146.21 - samples/sec: 8012.18 - lr: 0.050000 +2023-04-05 17:16:01,514 epoch 104 - iter 2385/2650 - loss 0.02907874 - time (sec): 164.45 - samples/sec: 8010.06 - lr: 0.050000 +2023-04-05 17:16:19,169 epoch 104 - iter 2650/2650 - loss 0.02912337 - time (sec): 182.11 - samples/sec: 8030.20 - lr: 0.050000 +2023-04-05 17:16:19,169 ---------------------------------------------------------------------------------------------------- +2023-04-05 17:16:19,169 EPOCH 104 done: loss 0.0291 - lr 0.050000 +2023-04-05 17:16:19,169 BAD EPOCHS (no improvement): 1 +2023-04-05 17:16:19,172 ---------------------------------------------------------------------------------------------------- +2023-04-05 17:16:37,224 epoch 105 - iter 265/2650 - loss 0.03006240 - time (sec): 18.05 - samples/sec: 8132.29 - lr: 0.050000 +2023-04-05 17:16:55,322 epoch 105 - iter 530/2650 - loss 0.02880424 - time (sec): 36.15 - samples/sec: 8026.20 - lr: 0.050000 +2023-04-05 17:17:13,688 epoch 105 - iter 795/2650 - loss 0.02882853 - time (sec): 54.52 - samples/sec: 7994.57 - lr: 0.050000 +2023-04-05 17:17:32,054 epoch 105 - iter 1060/2650 - loss 0.02867017 - time (sec): 72.88 - samples/sec: 8003.67 - lr: 0.050000 +2023-04-05 17:17:50,668 epoch 105 - iter 1325/2650 - loss 0.02880601 - time (sec): 91.50 - samples/sec: 7983.86 - lr: 0.050000 +2023-04-05 17:18:08,316 epoch 105 - iter 1590/2650 - loss 0.02870321 - time (sec): 109.14 - samples/sec: 8031.78 - lr: 0.050000 +2023-04-05 17:18:26,257 epoch 105 - iter 1855/2650 - loss 0.02873980 - time (sec): 127.08 - samples/sec: 8059.91 - lr: 0.050000 +2023-04-05 17:18:44,334 epoch 105 - iter 2120/2650 - loss 0.02888801 - time (sec): 145.16 - samples/sec: 8063.93 - lr: 0.050000 +2023-04-05 17:19:02,340 epoch 105 - iter 2385/2650 - loss 0.02896487 - time (sec): 163.17 - samples/sec: 8066.47 - lr: 0.050000 +2023-04-05 17:19:30,636 epoch 105 - iter 2650/2650 - loss 0.02898334 - time (sec): 191.46 - samples/sec: 7637.82 - lr: 0.050000 +2023-04-05 17:19:30,636 ---------------------------------------------------------------------------------------------------- +2023-04-05 17:19:30,636 EPOCH 105 done: loss 0.0290 - lr 0.050000 +2023-04-05 17:19:30,636 BAD EPOCHS (no improvement): 0 +2023-04-05 17:19:30,639 ---------------------------------------------------------------------------------------------------- +2023-04-05 17:19:48,405 epoch 106 - iter 265/2650 - loss 0.02948329 - time (sec): 17.77 - samples/sec: 8268.79 - lr: 0.050000 +2023-04-05 17:20:06,705 epoch 106 - iter 530/2650 - loss 0.02822930 - time (sec): 36.07 - samples/sec: 8110.59 - lr: 0.050000 +2023-04-05 17:20:24,644 epoch 106 - iter 795/2650 - loss 0.02879564 - time (sec): 54.01 - samples/sec: 8122.04 - lr: 0.050000 +2023-04-05 17:20:42,979 epoch 106 - iter 1060/2650 - loss 0.02869529 - time (sec): 72.34 - samples/sec: 8098.69 - lr: 0.050000 +2023-04-05 17:21:00,902 epoch 106 - iter 1325/2650 - loss 0.02859426 - time (sec): 90.26 - samples/sec: 8113.73 - lr: 0.050000 +2023-04-05 17:21:18,987 epoch 106 - iter 1590/2650 - loss 0.02863329 - time (sec): 108.35 - samples/sec: 8107.98 - lr: 0.050000 +2023-04-05 17:21:37,195 epoch 106 - iter 1855/2650 - loss 0.02871771 - time (sec): 126.56 - samples/sec: 8099.79 - lr: 0.050000 +2023-04-05 17:21:55,689 epoch 106 - iter 2120/2650 - loss 0.02868298 - time (sec): 145.05 - samples/sec: 8081.96 - lr: 0.050000 +2023-04-05 17:22:13,767 epoch 106 - iter 2385/2650 - loss 0.02860349 - time (sec): 163.13 - samples/sec: 8080.49 - lr: 0.050000 +2023-04-05 17:22:31,988 epoch 106 - iter 2650/2650 - loss 0.02863135 - time (sec): 181.35 - samples/sec: 8063.78 - lr: 0.050000 +2023-04-05 17:22:31,988 ---------------------------------------------------------------------------------------------------- +2023-04-05 17:22:31,988 EPOCH 106 done: loss 0.0286 - lr 0.050000 +2023-04-05 17:22:31,989 BAD EPOCHS (no improvement): 0 +2023-04-05 17:22:31,995 ---------------------------------------------------------------------------------------------------- +2023-04-05 17:22:50,632 epoch 107 - iter 265/2650 - loss 0.03090108 - time (sec): 18.64 - samples/sec: 7837.85 - lr: 0.050000 +2023-04-05 17:23:08,692 epoch 107 - iter 530/2650 - loss 0.02989043 - time (sec): 36.70 - samples/sec: 7993.75 - lr: 0.050000 +2023-04-05 17:23:27,071 epoch 107 - iter 795/2650 - loss 0.02936208 - time (sec): 55.08 - samples/sec: 7975.67 - lr: 0.050000 +2023-04-05 17:23:44,847 epoch 107 - iter 1060/2650 - loss 0.02909403 - time (sec): 72.85 - samples/sec: 8031.93 - lr: 0.050000 +2023-04-05 17:24:02,543 epoch 107 - iter 1325/2650 - loss 0.02888072 - time (sec): 90.55 - samples/sec: 8082.86 - lr: 0.050000 +2023-04-05 17:24:20,568 epoch 107 - iter 1590/2650 - loss 0.02865145 - time (sec): 108.57 - samples/sec: 8084.89 - lr: 0.050000 +2023-04-05 17:24:38,581 epoch 107 - iter 1855/2650 - loss 0.02873011 - time (sec): 126.59 - samples/sec: 8083.83 - lr: 0.050000 +2023-04-05 17:24:56,425 epoch 107 - iter 2120/2650 - loss 0.02865957 - time (sec): 144.43 - samples/sec: 8087.88 - lr: 0.050000 +2023-04-05 17:25:15,219 epoch 107 - iter 2385/2650 - loss 0.02859194 - time (sec): 163.22 - samples/sec: 8054.80 - lr: 0.050000 +2023-04-05 17:25:33,691 epoch 107 - iter 2650/2650 - loss 0.02862999 - time (sec): 181.70 - samples/sec: 8048.41 - lr: 0.050000 +2023-04-05 17:25:33,691 ---------------------------------------------------------------------------------------------------- +2023-04-05 17:25:33,691 EPOCH 107 done: loss 0.0286 - lr 0.050000 +2023-04-05 17:25:33,691 BAD EPOCHS (no improvement): 0 +2023-04-05 17:25:33,693 ---------------------------------------------------------------------------------------------------- +2023-04-05 17:25:52,024 epoch 108 - iter 265/2650 - loss 0.02842706 - time (sec): 18.33 - samples/sec: 7917.86 - lr: 0.050000 +2023-04-05 17:26:09,716 epoch 108 - iter 530/2650 - loss 0.02916818 - time (sec): 36.02 - samples/sec: 8055.72 - lr: 0.050000 +2023-04-05 17:26:26,974 epoch 108 - iter 795/2650 - loss 0.02888848 - time (sec): 53.28 - samples/sec: 8154.80 - lr: 0.050000 +2023-04-05 17:26:45,102 epoch 108 - iter 1060/2650 - loss 0.02885894 - time (sec): 71.41 - samples/sec: 8128.54 - lr: 0.050000 +2023-04-05 17:27:02,911 epoch 108 - iter 1325/2650 - loss 0.02879496 - time (sec): 89.22 - samples/sec: 8134.40 - lr: 0.050000 +2023-04-05 17:27:21,266 epoch 108 - iter 1590/2650 - loss 0.02870162 - time (sec): 107.57 - samples/sec: 8110.64 - lr: 0.050000 +2023-04-05 17:27:39,625 epoch 108 - iter 1855/2650 - loss 0.02866263 - time (sec): 125.93 - samples/sec: 8099.30 - lr: 0.050000 +2023-04-05 17:27:57,989 epoch 108 - iter 2120/2650 - loss 0.02866592 - time (sec): 144.30 - samples/sec: 8090.35 - lr: 0.050000 +2023-04-05 17:28:15,941 epoch 108 - iter 2385/2650 - loss 0.02864924 - time (sec): 162.25 - samples/sec: 8103.74 - lr: 0.050000 +2023-04-05 17:28:34,490 epoch 108 - iter 2650/2650 - loss 0.02857386 - time (sec): 180.80 - samples/sec: 8088.45 - lr: 0.050000 +2023-04-05 17:28:34,490 ---------------------------------------------------------------------------------------------------- +2023-04-05 17:28:34,490 EPOCH 108 done: loss 0.0286 - lr 0.050000 +2023-04-05 17:28:34,490 BAD EPOCHS (no improvement): 0 +2023-04-05 17:28:34,493 ---------------------------------------------------------------------------------------------------- +2023-04-05 17:28:51,967 epoch 109 - iter 265/2650 - loss 0.02936650 - time (sec): 17.47 - samples/sec: 8241.63 - lr: 0.050000 +2023-04-05 17:29:10,373 epoch 109 - iter 530/2650 - loss 0.02867800 - time (sec): 35.88 - samples/sec: 8103.14 - lr: 0.050000 +2023-04-05 17:29:28,865 epoch 109 - iter 795/2650 - loss 0.02835937 - time (sec): 54.37 - samples/sec: 8052.93 - lr: 0.050000 +2023-04-05 17:29:47,205 epoch 109 - iter 1060/2650 - loss 0.02867269 - time (sec): 72.71 - samples/sec: 8035.43 - lr: 0.050000 +2023-04-05 17:30:04,976 epoch 109 - iter 1325/2650 - loss 0.02877673 - time (sec): 90.48 - samples/sec: 8066.58 - lr: 0.050000 +2023-04-05 17:30:22,696 epoch 109 - iter 1590/2650 - loss 0.02883464 - time (sec): 108.20 - samples/sec: 8086.87 - lr: 0.050000 +2023-04-05 17:30:40,870 epoch 109 - iter 1855/2650 - loss 0.02888421 - time (sec): 126.38 - samples/sec: 8084.22 - lr: 0.050000 +2023-04-05 17:30:58,814 epoch 109 - iter 2120/2650 - loss 0.02893871 - time (sec): 144.32 - samples/sec: 8099.67 - lr: 0.050000 +2023-04-05 17:31:17,151 epoch 109 - iter 2385/2650 - loss 0.02892781 - time (sec): 162.66 - samples/sec: 8090.87 - lr: 0.050000 +2023-04-05 17:31:35,301 epoch 109 - iter 2650/2650 - loss 0.02881606 - time (sec): 180.81 - samples/sec: 8087.94 - lr: 0.050000 +2023-04-05 17:31:35,301 ---------------------------------------------------------------------------------------------------- +2023-04-05 17:31:35,301 EPOCH 109 done: loss 0.0288 - lr 0.050000 +2023-04-05 17:31:35,301 BAD EPOCHS (no improvement): 1 +2023-04-05 17:31:35,304 ---------------------------------------------------------------------------------------------------- +2023-04-05 17:31:53,820 epoch 110 - iter 265/2650 - loss 0.02926556 - time (sec): 18.52 - samples/sec: 7955.47 - lr: 0.050000 +2023-04-05 17:32:11,348 epoch 110 - iter 530/2650 - loss 0.02886637 - time (sec): 36.04 - samples/sec: 8095.76 - lr: 0.050000 +2023-04-05 17:32:29,531 epoch 110 - iter 795/2650 - loss 0.02840960 - time (sec): 54.23 - samples/sec: 8101.67 - lr: 0.050000 +2023-04-05 17:32:47,174 epoch 110 - iter 1060/2650 - loss 0.02873275 - time (sec): 71.87 - samples/sec: 8135.65 - lr: 0.050000 +2023-04-05 17:33:05,172 epoch 110 - iter 1325/2650 - loss 0.02872997 - time (sec): 89.87 - samples/sec: 8132.34 - lr: 0.050000 +2023-04-05 17:33:23,315 epoch 110 - iter 1590/2650 - loss 0.02854199 - time (sec): 108.01 - samples/sec: 8115.72 - lr: 0.050000 +2023-04-05 17:33:41,458 epoch 110 - iter 1855/2650 - loss 0.02849189 - time (sec): 126.15 - samples/sec: 8106.59 - lr: 0.050000 +2023-04-05 17:34:00,141 epoch 110 - iter 2120/2650 - loss 0.02867275 - time (sec): 144.84 - samples/sec: 8080.88 - lr: 0.050000 +2023-04-05 17:34:18,089 epoch 110 - iter 2385/2650 - loss 0.02864965 - time (sec): 162.79 - samples/sec: 8087.99 - lr: 0.050000 +2023-04-05 17:34:36,143 epoch 110 - iter 2650/2650 - loss 0.02862272 - time (sec): 180.84 - samples/sec: 8086.53 - lr: 0.050000 +2023-04-05 17:34:36,144 ---------------------------------------------------------------------------------------------------- +2023-04-05 17:34:36,144 EPOCH 110 done: loss 0.0286 - lr 0.050000 +2023-04-05 17:34:36,144 BAD EPOCHS (no improvement): 2 +2023-04-05 17:34:36,147 ---------------------------------------------------------------------------------------------------- +2023-04-05 17:34:54,061 epoch 111 - iter 265/2650 - loss 0.02831877 - time (sec): 17.91 - samples/sec: 8038.33 - lr: 0.050000 +2023-04-05 17:35:12,810 epoch 111 - iter 530/2650 - loss 0.02946900 - time (sec): 36.66 - samples/sec: 7956.63 - lr: 0.050000 +2023-04-05 17:35:30,698 epoch 111 - iter 795/2650 - loss 0.02927524 - time (sec): 54.55 - samples/sec: 8011.23 - lr: 0.050000 +2023-04-05 17:35:48,628 epoch 111 - iter 1060/2650 - loss 0.02888681 - time (sec): 72.48 - samples/sec: 8017.69 - lr: 0.050000 +2023-04-05 17:36:06,897 epoch 111 - iter 1325/2650 - loss 0.02898305 - time (sec): 90.75 - samples/sec: 8035.93 - lr: 0.050000 +2023-04-05 17:36:24,629 epoch 111 - iter 1590/2650 - loss 0.02914566 - time (sec): 108.48 - samples/sec: 8071.95 - lr: 0.050000 +2023-04-05 17:36:43,157 epoch 111 - iter 1855/2650 - loss 0.02910074 - time (sec): 127.01 - samples/sec: 8053.78 - lr: 0.050000 +2023-04-05 17:37:00,938 epoch 111 - iter 2120/2650 - loss 0.02908495 - time (sec): 144.79 - samples/sec: 8078.31 - lr: 0.050000 +2023-04-05 17:37:18,797 epoch 111 - iter 2385/2650 - loss 0.02903722 - time (sec): 162.65 - samples/sec: 8096.77 - lr: 0.050000 +2023-04-05 17:37:36,502 epoch 111 - iter 2650/2650 - loss 0.02903882 - time (sec): 180.36 - samples/sec: 8108.23 - lr: 0.050000 +2023-04-05 17:37:36,503 ---------------------------------------------------------------------------------------------------- +2023-04-05 17:37:36,503 EPOCH 111 done: loss 0.0290 - lr 0.050000 +2023-04-05 17:37:36,503 BAD EPOCHS (no improvement): 3 +2023-04-05 17:37:36,505 ---------------------------------------------------------------------------------------------------- +2023-04-05 17:37:54,752 epoch 112 - iter 265/2650 - loss 0.02710494 - time (sec): 18.25 - samples/sec: 8029.51 - lr: 0.050000 +2023-04-05 17:38:13,021 epoch 112 - iter 530/2650 - loss 0.02772084 - time (sec): 36.52 - samples/sec: 8014.28 - lr: 0.050000 +2023-04-05 17:38:30,957 epoch 112 - iter 795/2650 - loss 0.02807779 - time (sec): 54.45 - samples/sec: 8082.31 - lr: 0.050000 +2023-04-05 17:38:49,111 epoch 112 - iter 1060/2650 - loss 0.02848853 - time (sec): 72.61 - samples/sec: 8056.14 - lr: 0.050000 +2023-04-05 17:39:06,830 epoch 112 - iter 1325/2650 - loss 0.02833008 - time (sec): 90.32 - samples/sec: 8075.49 - lr: 0.050000 +2023-04-05 17:39:24,855 epoch 112 - iter 1590/2650 - loss 0.02819534 - time (sec): 108.35 - samples/sec: 8084.03 - lr: 0.050000 +2023-04-05 17:39:43,264 epoch 112 - iter 1855/2650 - loss 0.02840982 - time (sec): 126.76 - samples/sec: 8079.38 - lr: 0.050000 +2023-04-05 17:40:01,239 epoch 112 - iter 2120/2650 - loss 0.02842634 - time (sec): 144.73 - samples/sec: 8090.68 - lr: 0.050000 +2023-04-05 17:40:19,289 epoch 112 - iter 2385/2650 - loss 0.02849352 - time (sec): 162.78 - samples/sec: 8082.26 - lr: 0.050000 +2023-04-05 17:40:37,663 epoch 112 - iter 2650/2650 - loss 0.02848127 - time (sec): 181.16 - samples/sec: 8072.33 - lr: 0.050000 +2023-04-05 17:40:37,663 ---------------------------------------------------------------------------------------------------- +2023-04-05 17:40:37,663 EPOCH 112 done: loss 0.0285 - lr 0.050000 +2023-04-05 17:40:37,663 BAD EPOCHS (no improvement): 0 +2023-04-05 17:40:37,666 ---------------------------------------------------------------------------------------------------- +2023-04-05 17:40:56,057 epoch 113 - iter 265/2650 - loss 0.02754800 - time (sec): 18.39 - samples/sec: 7957.32 - lr: 0.050000 +2023-04-05 17:41:14,523 epoch 113 - iter 530/2650 - loss 0.02840821 - time (sec): 36.86 - samples/sec: 7932.46 - lr: 0.050000 +2023-04-05 17:41:32,859 epoch 113 - iter 795/2650 - loss 0.02789125 - time (sec): 55.19 - samples/sec: 7970.08 - lr: 0.050000 +2023-04-05 17:41:50,298 epoch 113 - iter 1060/2650 - loss 0.02779993 - time (sec): 72.63 - samples/sec: 8038.57 - lr: 0.050000 +2023-04-05 17:42:08,925 epoch 113 - iter 1325/2650 - loss 0.02803452 - time (sec): 91.26 - samples/sec: 8009.76 - lr: 0.050000 +2023-04-05 17:42:26,725 epoch 113 - iter 1590/2650 - loss 0.02814691 - time (sec): 109.06 - samples/sec: 8055.16 - lr: 0.050000 +2023-04-05 17:42:44,576 epoch 113 - iter 1855/2650 - loss 0.02813755 - time (sec): 126.91 - samples/sec: 8067.19 - lr: 0.050000 +2023-04-05 17:43:02,546 epoch 113 - iter 2120/2650 - loss 0.02810261 - time (sec): 144.88 - samples/sec: 8069.85 - lr: 0.050000 +2023-04-05 17:43:20,731 epoch 113 - iter 2385/2650 - loss 0.02832263 - time (sec): 163.06 - samples/sec: 8075.92 - lr: 0.050000 +2023-04-05 17:43:38,567 epoch 113 - iter 2650/2650 - loss 0.02846656 - time (sec): 180.90 - samples/sec: 8083.79 - lr: 0.050000 +2023-04-05 17:43:38,568 ---------------------------------------------------------------------------------------------------- +2023-04-05 17:43:38,568 EPOCH 113 done: loss 0.0285 - lr 0.050000 +2023-04-05 17:43:38,568 BAD EPOCHS (no improvement): 0 +2023-04-05 17:43:38,573 ---------------------------------------------------------------------------------------------------- +2023-04-05 17:43:56,858 epoch 114 - iter 265/2650 - loss 0.02907795 - time (sec): 18.28 - samples/sec: 7918.45 - lr: 0.050000 +2023-04-05 17:44:21,887 epoch 114 - iter 530/2650 - loss 0.02924185 - time (sec): 43.31 - samples/sec: 6709.71 - lr: 0.050000 +2023-04-05 17:44:53,355 epoch 114 - iter 795/2650 - loss 0.02838547 - time (sec): 74.78 - samples/sec: 5844.56 - lr: 0.050000 +2023-04-05 17:45:11,690 epoch 114 - iter 1060/2650 - loss 0.02833405 - time (sec): 93.12 - samples/sec: 6281.34 - lr: 0.050000 +2023-04-05 17:45:30,081 epoch 114 - iter 1325/2650 - loss 0.02811633 - time (sec): 111.51 - samples/sec: 6555.37 - lr: 0.050000 +2023-04-05 17:45:48,257 epoch 114 - iter 1590/2650 - loss 0.02797142 - time (sec): 129.68 - samples/sec: 6771.21 - lr: 0.050000 +2023-04-05 17:46:05,961 epoch 114 - iter 1855/2650 - loss 0.02818285 - time (sec): 147.39 - samples/sec: 6951.12 - lr: 0.050000 +2023-04-05 17:46:23,393 epoch 114 - iter 2120/2650 - loss 0.02826081 - time (sec): 164.82 - samples/sec: 7098.05 - lr: 0.050000 +2023-04-05 17:46:41,640 epoch 114 - iter 2385/2650 - loss 0.02830574 - time (sec): 183.07 - samples/sec: 7191.79 - lr: 0.050000 +2023-04-05 17:47:15,747 epoch 114 - iter 2650/2650 - loss 0.02831788 - time (sec): 217.17 - samples/sec: 6733.63 - lr: 0.050000 +2023-04-05 17:47:15,747 ---------------------------------------------------------------------------------------------------- +2023-04-05 17:47:15,747 EPOCH 114 done: loss 0.0283 - lr 0.050000 +2023-04-05 17:47:15,747 BAD EPOCHS (no improvement): 0 +2023-04-05 17:47:15,751 ---------------------------------------------------------------------------------------------------- +2023-04-05 17:47:39,238 epoch 115 - iter 265/2650 - loss 0.02738039 - time (sec): 23.49 - samples/sec: 6344.94 - lr: 0.050000 +2023-04-05 17:47:57,205 epoch 115 - iter 530/2650 - loss 0.02808868 - time (sec): 41.45 - samples/sec: 7078.57 - lr: 0.050000 +2023-04-05 17:48:14,884 epoch 115 - iter 795/2650 - loss 0.02831272 - time (sec): 59.13 - samples/sec: 7428.64 - lr: 0.050000 +2023-04-05 17:48:32,881 epoch 115 - iter 1060/2650 - loss 0.02821831 - time (sec): 77.13 - samples/sec: 7575.37 - lr: 0.050000 +2023-04-05 17:48:50,651 epoch 115 - iter 1325/2650 - loss 0.02852687 - time (sec): 94.90 - samples/sec: 7700.82 - lr: 0.050000 +2023-04-05 17:49:09,107 epoch 115 - iter 1590/2650 - loss 0.02850624 - time (sec): 113.36 - samples/sec: 7742.93 - lr: 0.050000 +2023-04-05 17:49:27,021 epoch 115 - iter 1855/2650 - loss 0.02842765 - time (sec): 131.27 - samples/sec: 7796.84 - lr: 0.050000 +2023-04-05 17:49:45,047 epoch 115 - iter 2120/2650 - loss 0.02856729 - time (sec): 149.30 - samples/sec: 7826.67 - lr: 0.050000 +2023-04-05 17:50:03,408 epoch 115 - iter 2385/2650 - loss 0.02855496 - time (sec): 167.66 - samples/sec: 7855.97 - lr: 0.050000 +2023-04-05 17:50:21,777 epoch 115 - iter 2650/2650 - loss 0.02856531 - time (sec): 186.03 - samples/sec: 7861.05 - lr: 0.050000 +2023-04-05 17:50:21,778 ---------------------------------------------------------------------------------------------------- +2023-04-05 17:50:21,778 EPOCH 115 done: loss 0.0286 - lr 0.050000 +2023-04-05 17:50:21,778 BAD EPOCHS (no improvement): 1 +2023-04-05 17:50:21,780 ---------------------------------------------------------------------------------------------------- +2023-04-05 17:50:40,208 epoch 116 - iter 265/2650 - loss 0.02798561 - time (sec): 18.43 - samples/sec: 8018.63 - lr: 0.050000 +2023-04-05 17:50:58,748 epoch 116 - iter 530/2650 - loss 0.02852557 - time (sec): 36.97 - samples/sec: 7974.32 - lr: 0.050000 +2023-04-05 17:51:16,660 epoch 116 - iter 795/2650 - loss 0.02806934 - time (sec): 54.88 - samples/sec: 7989.55 - lr: 0.050000 +2023-04-05 17:51:35,049 epoch 116 - iter 1060/2650 - loss 0.02814954 - time (sec): 73.27 - samples/sec: 7971.00 - lr: 0.050000 +2023-04-05 17:51:53,443 epoch 116 - iter 1325/2650 - loss 0.02806115 - time (sec): 91.66 - samples/sec: 7965.58 - lr: 0.050000 +2023-04-05 17:52:11,476 epoch 116 - iter 1590/2650 - loss 0.02823494 - time (sec): 109.70 - samples/sec: 7988.36 - lr: 0.050000 +2023-04-05 17:52:29,954 epoch 116 - iter 1855/2650 - loss 0.02811955 - time (sec): 128.17 - samples/sec: 7991.25 - lr: 0.050000 +2023-04-05 17:52:48,422 epoch 116 - iter 2120/2650 - loss 0.02831881 - time (sec): 146.64 - samples/sec: 7988.36 - lr: 0.050000 +2023-04-05 17:53:06,264 epoch 116 - iter 2385/2650 - loss 0.02832040 - time (sec): 164.48 - samples/sec: 8006.16 - lr: 0.050000 +2023-04-05 17:53:23,952 epoch 116 - iter 2650/2650 - loss 0.02839601 - time (sec): 182.17 - samples/sec: 8027.39 - lr: 0.050000 +2023-04-05 17:53:23,952 ---------------------------------------------------------------------------------------------------- +2023-04-05 17:53:23,952 EPOCH 116 done: loss 0.0284 - lr 0.050000 +2023-04-05 17:53:23,953 BAD EPOCHS (no improvement): 2 +2023-04-05 17:53:23,955 ---------------------------------------------------------------------------------------------------- +2023-04-05 17:53:42,049 epoch 117 - iter 265/2650 - loss 0.02763361 - time (sec): 18.09 - samples/sec: 8049.00 - lr: 0.050000 +2023-04-05 17:53:59,930 epoch 117 - iter 530/2650 - loss 0.02823546 - time (sec): 35.97 - samples/sec: 8122.72 - lr: 0.050000 +2023-04-05 17:54:18,046 epoch 117 - iter 795/2650 - loss 0.02855896 - time (sec): 54.09 - samples/sec: 8127.38 - lr: 0.050000 +2023-04-05 17:54:35,773 epoch 117 - iter 1060/2650 - loss 0.02873585 - time (sec): 71.82 - samples/sec: 8140.53 - lr: 0.050000 +2023-04-05 17:54:53,737 epoch 117 - iter 1325/2650 - loss 0.02855544 - time (sec): 89.78 - samples/sec: 8128.03 - lr: 0.050000 +2023-04-05 17:55:12,332 epoch 117 - iter 1590/2650 - loss 0.02846007 - time (sec): 108.38 - samples/sec: 8110.19 - lr: 0.050000 +2023-04-05 17:55:30,492 epoch 117 - iter 1855/2650 - loss 0.02839878 - time (sec): 126.54 - samples/sec: 8109.41 - lr: 0.050000 +2023-04-05 17:55:48,407 epoch 117 - iter 2120/2650 - loss 0.02827772 - time (sec): 144.45 - samples/sec: 8103.68 - lr: 0.050000 +2023-04-05 17:56:06,406 epoch 117 - iter 2385/2650 - loss 0.02835868 - time (sec): 162.45 - samples/sec: 8101.76 - lr: 0.050000 +2023-04-05 17:56:24,435 epoch 117 - iter 2650/2650 - loss 0.02826237 - time (sec): 180.48 - samples/sec: 8102.62 - lr: 0.050000 +2023-04-05 17:56:24,436 ---------------------------------------------------------------------------------------------------- +2023-04-05 17:56:24,436 EPOCH 117 done: loss 0.0283 - lr 0.050000 +2023-04-05 17:56:24,436 BAD EPOCHS (no improvement): 0 +2023-04-05 17:56:24,439 ---------------------------------------------------------------------------------------------------- +2023-04-05 17:56:42,806 epoch 118 - iter 265/2650 - loss 0.02689999 - time (sec): 18.37 - samples/sec: 8017.21 - lr: 0.050000 +2023-04-05 17:57:00,685 epoch 118 - iter 530/2650 - loss 0.02754985 - time (sec): 36.25 - samples/sec: 8084.31 - lr: 0.050000 +2023-04-05 17:57:17,941 epoch 118 - iter 795/2650 - loss 0.02747606 - time (sec): 53.50 - samples/sec: 8197.73 - lr: 0.050000 +2023-04-05 17:57:36,304 epoch 118 - iter 1060/2650 - loss 0.02740483 - time (sec): 71.86 - samples/sec: 8146.87 - lr: 0.050000 +2023-04-05 17:57:54,803 epoch 118 - iter 1325/2650 - loss 0.02749871 - time (sec): 90.36 - samples/sec: 8112.86 - lr: 0.050000 +2023-04-05 17:58:12,685 epoch 118 - iter 1590/2650 - loss 0.02787136 - time (sec): 108.25 - samples/sec: 8118.77 - lr: 0.050000 +2023-04-05 17:58:30,769 epoch 118 - iter 1855/2650 - loss 0.02785887 - time (sec): 126.33 - samples/sec: 8113.33 - lr: 0.050000 +2023-04-05 17:58:50,153 epoch 118 - iter 2120/2650 - loss 0.02802973 - time (sec): 145.71 - samples/sec: 8036.64 - lr: 0.050000 +2023-04-05 17:59:08,043 epoch 118 - iter 2385/2650 - loss 0.02805504 - time (sec): 163.60 - samples/sec: 8047.51 - lr: 0.050000 +2023-04-05 17:59:26,273 epoch 118 - iter 2650/2650 - loss 0.02817978 - time (sec): 181.83 - samples/sec: 8042.27 - lr: 0.050000 +2023-04-05 17:59:26,274 ---------------------------------------------------------------------------------------------------- +2023-04-05 17:59:26,274 EPOCH 118 done: loss 0.0282 - lr 0.050000 +2023-04-05 17:59:26,274 BAD EPOCHS (no improvement): 0 +2023-04-05 17:59:26,276 ---------------------------------------------------------------------------------------------------- +2023-04-05 17:59:44,421 epoch 119 - iter 265/2650 - loss 0.02644769 - time (sec): 18.14 - samples/sec: 8064.26 - lr: 0.050000 +2023-04-05 18:00:02,257 epoch 119 - iter 530/2650 - loss 0.02640071 - time (sec): 35.98 - samples/sec: 8111.27 - lr: 0.050000 +2023-04-05 18:00:20,821 epoch 119 - iter 795/2650 - loss 0.02660438 - time (sec): 54.54 - samples/sec: 8031.55 - lr: 0.050000 +2023-04-05 18:00:39,006 epoch 119 - iter 1060/2650 - loss 0.02712309 - time (sec): 72.73 - samples/sec: 8016.74 - lr: 0.050000 +2023-04-05 18:00:56,571 epoch 119 - iter 1325/2650 - loss 0.02756340 - time (sec): 90.29 - samples/sec: 8064.68 - lr: 0.050000 +2023-04-05 18:01:14,702 epoch 119 - iter 1590/2650 - loss 0.02762641 - time (sec): 108.43 - samples/sec: 8073.08 - lr: 0.050000 +2023-04-05 18:01:32,379 epoch 119 - iter 1855/2650 - loss 0.02758023 - time (sec): 126.10 - samples/sec: 8105.49 - lr: 0.050000 +2023-04-05 18:01:50,471 epoch 119 - iter 2120/2650 - loss 0.02772653 - time (sec): 144.19 - samples/sec: 8104.24 - lr: 0.050000 +2023-04-05 18:02:08,855 epoch 119 - iter 2385/2650 - loss 0.02774498 - time (sec): 162.58 - samples/sec: 8095.88 - lr: 0.050000 +2023-04-05 18:02:27,305 epoch 119 - iter 2650/2650 - loss 0.02774099 - time (sec): 181.03 - samples/sec: 8078.07 - lr: 0.050000 +2023-04-05 18:02:27,305 ---------------------------------------------------------------------------------------------------- +2023-04-05 18:02:27,305 EPOCH 119 done: loss 0.0277 - lr 0.050000 +2023-04-05 18:02:27,305 BAD EPOCHS (no improvement): 0 +2023-04-05 18:02:27,308 ---------------------------------------------------------------------------------------------------- +2023-04-05 18:02:45,248 epoch 120 - iter 265/2650 - loss 0.02702659 - time (sec): 17.94 - samples/sec: 8257.55 - lr: 0.050000 +2023-04-05 18:03:03,264 epoch 120 - iter 530/2650 - loss 0.02721009 - time (sec): 35.96 - samples/sec: 8176.43 - lr: 0.050000 +2023-04-05 18:03:21,904 epoch 120 - iter 795/2650 - loss 0.02741460 - time (sec): 54.60 - samples/sec: 8071.94 - lr: 0.050000 +2023-04-05 18:03:39,644 epoch 120 - iter 1060/2650 - loss 0.02711904 - time (sec): 72.34 - samples/sec: 8098.67 - lr: 0.050000 +2023-04-05 18:03:58,137 epoch 120 - iter 1325/2650 - loss 0.02713009 - time (sec): 90.83 - samples/sec: 8072.12 - lr: 0.050000 +2023-04-05 18:04:16,185 epoch 120 - iter 1590/2650 - loss 0.02736496 - time (sec): 108.88 - samples/sec: 8084.03 - lr: 0.050000 +2023-04-05 18:04:34,058 epoch 120 - iter 1855/2650 - loss 0.02768589 - time (sec): 126.75 - samples/sec: 8087.47 - lr: 0.050000 +2023-04-05 18:04:52,645 epoch 120 - iter 2120/2650 - loss 0.02785959 - time (sec): 145.34 - samples/sec: 8062.32 - lr: 0.050000 +2023-04-05 18:05:11,062 epoch 120 - iter 2385/2650 - loss 0.02788691 - time (sec): 163.75 - samples/sec: 8047.74 - lr: 0.050000 +2023-04-05 18:05:28,822 epoch 120 - iter 2650/2650 - loss 0.02809507 - time (sec): 181.51 - samples/sec: 8056.52 - lr: 0.050000 +2023-04-05 18:05:28,822 ---------------------------------------------------------------------------------------------------- +2023-04-05 18:05:28,822 EPOCH 120 done: loss 0.0281 - lr 0.050000 +2023-04-05 18:05:28,822 BAD EPOCHS (no improvement): 1 +2023-04-05 18:05:28,825 ---------------------------------------------------------------------------------------------------- +2023-04-05 18:05:47,247 epoch 121 - iter 265/2650 - loss 0.02521062 - time (sec): 18.42 - samples/sec: 7955.11 - lr: 0.050000 +2023-04-05 18:06:05,451 epoch 121 - iter 530/2650 - loss 0.02611540 - time (sec): 36.63 - samples/sec: 7998.17 - lr: 0.050000 +2023-04-05 18:06:23,802 epoch 121 - iter 795/2650 - loss 0.02669010 - time (sec): 54.98 - samples/sec: 7990.58 - lr: 0.050000 +2023-04-05 18:06:42,162 epoch 121 - iter 1060/2650 - loss 0.02672997 - time (sec): 73.34 - samples/sec: 8015.95 - lr: 0.050000 +2023-04-05 18:07:00,335 epoch 121 - iter 1325/2650 - loss 0.02709965 - time (sec): 91.51 - samples/sec: 8016.69 - lr: 0.050000 +2023-04-05 18:07:27,715 epoch 121 - iter 1590/2650 - loss 0.02715452 - time (sec): 118.89 - samples/sec: 7392.65 - lr: 0.050000 +2023-04-05 18:07:45,954 epoch 121 - iter 1855/2650 - loss 0.02726512 - time (sec): 137.13 - samples/sec: 7474.79 - lr: 0.050000 +2023-04-05 18:08:03,698 epoch 121 - iter 2120/2650 - loss 0.02749526 - time (sec): 154.87 - samples/sec: 7550.02 - lr: 0.050000 +2023-04-05 18:08:22,521 epoch 121 - iter 2385/2650 - loss 0.02754644 - time (sec): 173.70 - samples/sec: 7575.39 - lr: 0.050000 +2023-04-05 18:08:40,590 epoch 121 - iter 2650/2650 - loss 0.02765558 - time (sec): 191.76 - samples/sec: 7625.84 - lr: 0.050000 +2023-04-05 18:08:40,590 ---------------------------------------------------------------------------------------------------- +2023-04-05 18:08:40,590 EPOCH 121 done: loss 0.0277 - lr 0.050000 +2023-04-05 18:08:40,590 BAD EPOCHS (no improvement): 0 +2023-04-05 18:08:40,593 ---------------------------------------------------------------------------------------------------- +2023-04-05 18:08:58,595 epoch 122 - iter 265/2650 - loss 0.02808547 - time (sec): 18.00 - samples/sec: 8091.27 - lr: 0.050000 +2023-04-05 18:09:17,139 epoch 122 - iter 530/2650 - loss 0.02802134 - time (sec): 36.55 - samples/sec: 8055.63 - lr: 0.050000 +2023-04-05 18:09:35,610 epoch 122 - iter 795/2650 - loss 0.02840358 - time (sec): 55.02 - samples/sec: 8029.66 - lr: 0.050000 +2023-04-05 18:09:54,781 epoch 122 - iter 1060/2650 - loss 0.02802755 - time (sec): 74.19 - samples/sec: 7941.52 - lr: 0.050000 +2023-04-05 18:10:12,539 epoch 122 - iter 1325/2650 - loss 0.02777354 - time (sec): 91.95 - samples/sec: 7993.57 - lr: 0.050000 +2023-04-05 18:10:30,639 epoch 122 - iter 1590/2650 - loss 0.02793101 - time (sec): 110.05 - samples/sec: 7986.07 - lr: 0.050000 +2023-04-05 18:10:48,509 epoch 122 - iter 1855/2650 - loss 0.02804560 - time (sec): 127.92 - samples/sec: 8021.44 - lr: 0.050000 +2023-04-05 18:11:06,150 epoch 122 - iter 2120/2650 - loss 0.02801840 - time (sec): 145.56 - samples/sec: 8048.11 - lr: 0.050000 +2023-04-05 18:11:23,999 epoch 122 - iter 2385/2650 - loss 0.02804419 - time (sec): 163.41 - samples/sec: 8050.68 - lr: 0.050000 +2023-04-05 18:11:42,125 epoch 122 - iter 2650/2650 - loss 0.02825461 - time (sec): 181.53 - samples/sec: 8055.71 - lr: 0.050000 +2023-04-05 18:11:42,125 ---------------------------------------------------------------------------------------------------- +2023-04-05 18:11:42,125 EPOCH 122 done: loss 0.0283 - lr 0.050000 +2023-04-05 18:11:42,125 BAD EPOCHS (no improvement): 1 +2023-04-05 18:11:42,128 ---------------------------------------------------------------------------------------------------- +2023-04-05 18:12:00,105 epoch 123 - iter 265/2650 - loss 0.02711484 - time (sec): 17.98 - samples/sec: 8076.46 - lr: 0.050000 +2023-04-05 18:12:17,847 epoch 123 - iter 530/2650 - loss 0.02717101 - time (sec): 35.72 - samples/sec: 8165.61 - lr: 0.050000 +2023-04-05 18:12:35,894 epoch 123 - iter 795/2650 - loss 0.02747001 - time (sec): 53.77 - samples/sec: 8127.88 - lr: 0.050000 +2023-04-05 18:12:54,208 epoch 123 - iter 1060/2650 - loss 0.02813646 - time (sec): 72.08 - samples/sec: 8112.13 - lr: 0.050000 +2023-04-05 18:13:12,462 epoch 123 - iter 1325/2650 - loss 0.02800627 - time (sec): 90.33 - samples/sec: 8084.99 - lr: 0.050000 +2023-04-05 18:13:30,678 epoch 123 - iter 1590/2650 - loss 0.02798650 - time (sec): 108.55 - samples/sec: 8071.92 - lr: 0.050000 +2023-04-05 18:13:49,293 epoch 123 - iter 1855/2650 - loss 0.02803206 - time (sec): 127.16 - samples/sec: 8054.09 - lr: 0.050000 +2023-04-05 18:14:07,008 epoch 123 - iter 2120/2650 - loss 0.02811204 - time (sec): 144.88 - samples/sec: 8070.50 - lr: 0.050000 +2023-04-05 18:14:25,437 epoch 123 - iter 2385/2650 - loss 0.02819932 - time (sec): 163.31 - samples/sec: 8056.29 - lr: 0.050000 +2023-04-05 18:14:43,740 epoch 123 - iter 2650/2650 - loss 0.02813888 - time (sec): 181.61 - samples/sec: 8052.14 - lr: 0.050000 +2023-04-05 18:14:43,740 ---------------------------------------------------------------------------------------------------- +2023-04-05 18:14:43,740 EPOCH 123 done: loss 0.0281 - lr 0.050000 +2023-04-05 18:14:43,740 BAD EPOCHS (no improvement): 2 +2023-04-05 18:14:43,743 ---------------------------------------------------------------------------------------------------- +2023-04-05 18:15:01,592 epoch 124 - iter 265/2650 - loss 0.02696338 - time (sec): 17.85 - samples/sec: 8135.77 - lr: 0.050000 +2023-04-05 18:15:19,412 epoch 124 - iter 530/2650 - loss 0.02725889 - time (sec): 35.67 - samples/sec: 8165.15 - lr: 0.050000 +2023-04-05 18:15:37,776 epoch 124 - iter 795/2650 - loss 0.02717434 - time (sec): 54.03 - samples/sec: 8097.14 - lr: 0.050000 +2023-04-05 18:15:56,091 epoch 124 - iter 1060/2650 - loss 0.02697220 - time (sec): 72.35 - samples/sec: 8076.50 - lr: 0.050000 +2023-04-05 18:16:14,499 epoch 124 - iter 1325/2650 - loss 0.02753524 - time (sec): 90.76 - samples/sec: 8057.13 - lr: 0.050000 +2023-04-05 18:16:32,985 epoch 124 - iter 1590/2650 - loss 0.02796007 - time (sec): 109.24 - samples/sec: 8045.80 - lr: 0.050000 +2023-04-05 18:16:51,172 epoch 124 - iter 1855/2650 - loss 0.02797708 - time (sec): 127.43 - samples/sec: 8050.30 - lr: 0.050000 +2023-04-05 18:17:08,983 epoch 124 - iter 2120/2650 - loss 0.02795310 - time (sec): 145.24 - samples/sec: 8056.13 - lr: 0.050000 +2023-04-05 18:17:26,729 epoch 124 - iter 2385/2650 - loss 0.02787938 - time (sec): 162.99 - samples/sec: 8073.85 - lr: 0.050000 +2023-04-05 18:17:44,487 epoch 124 - iter 2650/2650 - loss 0.02785167 - time (sec): 180.74 - samples/sec: 8090.77 - lr: 0.050000 +2023-04-05 18:17:44,488 ---------------------------------------------------------------------------------------------------- +2023-04-05 18:17:44,488 EPOCH 124 done: loss 0.0279 - lr 0.050000 +2023-04-05 18:17:44,488 BAD EPOCHS (no improvement): 3 +2023-04-05 18:17:44,491 ---------------------------------------------------------------------------------------------------- +2023-04-05 18:18:02,340 epoch 125 - iter 265/2650 - loss 0.02856059 - time (sec): 17.85 - samples/sec: 8215.39 - lr: 0.050000 +2023-04-05 18:18:20,234 epoch 125 - iter 530/2650 - loss 0.02830099 - time (sec): 35.74 - samples/sec: 8161.19 - lr: 0.050000 +2023-04-05 18:18:38,535 epoch 125 - iter 795/2650 - loss 0.02753850 - time (sec): 54.04 - samples/sec: 8113.40 - lr: 0.050000 +2023-04-05 18:18:56,637 epoch 125 - iter 1060/2650 - loss 0.02728955 - time (sec): 72.15 - samples/sec: 8103.37 - lr: 0.050000 +2023-04-05 18:19:15,119 epoch 125 - iter 1325/2650 - loss 0.02759938 - time (sec): 90.63 - samples/sec: 8097.68 - lr: 0.050000 +2023-04-05 18:19:32,488 epoch 125 - iter 1590/2650 - loss 0.02749853 - time (sec): 108.00 - samples/sec: 8131.33 - lr: 0.050000 +2023-04-05 18:19:50,791 epoch 125 - iter 1855/2650 - loss 0.02736618 - time (sec): 126.30 - samples/sec: 8102.13 - lr: 0.050000 +2023-04-05 18:20:08,911 epoch 125 - iter 2120/2650 - loss 0.02769555 - time (sec): 144.42 - samples/sec: 8093.36 - lr: 0.050000 +2023-04-05 18:20:27,474 epoch 125 - iter 2385/2650 - loss 0.02789177 - time (sec): 162.98 - samples/sec: 8077.48 - lr: 0.050000 +2023-04-05 18:20:45,176 epoch 125 - iter 2650/2650 - loss 0.02785441 - time (sec): 180.68 - samples/sec: 8093.44 - lr: 0.050000 +2023-04-05 18:20:45,176 ---------------------------------------------------------------------------------------------------- +2023-04-05 18:20:45,176 EPOCH 125 done: loss 0.0279 - lr 0.050000 +2023-04-05 18:20:45,177 Epoch 125: reducing learning rate of group 0 to 2.5000e-02. +2023-04-05 18:20:45,177 BAD EPOCHS (no improvement): 4 +2023-04-05 18:20:45,179 ---------------------------------------------------------------------------------------------------- +2023-04-05 18:21:03,006 epoch 126 - iter 265/2650 - loss 0.02761471 - time (sec): 17.83 - samples/sec: 8164.70 - lr: 0.025000 +2023-04-05 18:21:21,410 epoch 126 - iter 530/2650 - loss 0.02695613 - time (sec): 36.23 - samples/sec: 8065.82 - lr: 0.025000 +2023-04-05 18:21:39,232 epoch 126 - iter 795/2650 - loss 0.02639481 - time (sec): 54.05 - samples/sec: 8105.55 - lr: 0.025000 +2023-04-05 18:21:57,249 epoch 126 - iter 1060/2650 - loss 0.02669803 - time (sec): 72.07 - samples/sec: 8109.85 - lr: 0.025000 +2023-04-05 18:22:15,205 epoch 126 - iter 1325/2650 - loss 0.02696905 - time (sec): 90.03 - samples/sec: 8125.08 - lr: 0.025000 +2023-04-05 18:22:33,299 epoch 126 - iter 1590/2650 - loss 0.02689059 - time (sec): 108.12 - samples/sec: 8101.38 - lr: 0.025000 +2023-04-05 18:22:51,648 epoch 126 - iter 1855/2650 - loss 0.02675055 - time (sec): 126.47 - samples/sec: 8095.51 - lr: 0.025000 +2023-04-05 18:23:09,940 epoch 126 - iter 2120/2650 - loss 0.02703276 - time (sec): 144.76 - samples/sec: 8094.35 - lr: 0.025000 +2023-04-05 18:23:28,087 epoch 126 - iter 2385/2650 - loss 0.02695826 - time (sec): 162.91 - samples/sec: 8089.54 - lr: 0.025000 +2023-04-05 18:23:45,946 epoch 126 - iter 2650/2650 - loss 0.02686253 - time (sec): 180.77 - samples/sec: 8089.78 - lr: 0.025000 +2023-04-05 18:23:45,946 ---------------------------------------------------------------------------------------------------- +2023-04-05 18:23:45,946 EPOCH 126 done: loss 0.0269 - lr 0.025000 +2023-04-05 18:23:45,946 BAD EPOCHS (no improvement): 0 +2023-04-05 18:23:45,949 ---------------------------------------------------------------------------------------------------- +2023-04-05 18:24:03,594 epoch 127 - iter 265/2650 - loss 0.02705563 - time (sec): 17.64 - samples/sec: 8251.80 - lr: 0.025000 +2023-04-05 18:24:21,622 epoch 127 - iter 530/2650 - loss 0.02700159 - time (sec): 35.67 - samples/sec: 8193.36 - lr: 0.025000 +2023-04-05 18:24:39,654 epoch 127 - iter 795/2650 - loss 0.02659643 - time (sec): 53.70 - samples/sec: 8149.77 - lr: 0.025000 +2023-04-05 18:24:57,804 epoch 127 - iter 1060/2650 - loss 0.02641078 - time (sec): 71.85 - samples/sec: 8137.50 - lr: 0.025000 +2023-04-05 18:25:15,899 epoch 127 - iter 1325/2650 - loss 0.02659799 - time (sec): 89.95 - samples/sec: 8132.92 - lr: 0.025000 +2023-04-05 18:25:34,091 epoch 127 - iter 1590/2650 - loss 0.02642112 - time (sec): 108.14 - samples/sec: 8117.76 - lr: 0.025000 +2023-04-05 18:25:52,429 epoch 127 - iter 1855/2650 - loss 0.02631653 - time (sec): 126.48 - samples/sec: 8082.91 - lr: 0.025000 +2023-04-05 18:26:09,923 epoch 127 - iter 2120/2650 - loss 0.02671297 - time (sec): 143.97 - samples/sec: 8118.67 - lr: 0.025000 +2023-04-05 18:26:28,596 epoch 127 - iter 2385/2650 - loss 0.02673630 - time (sec): 162.65 - samples/sec: 8094.58 - lr: 0.025000 +2023-04-05 18:26:46,386 epoch 127 - iter 2650/2650 - loss 0.02666838 - time (sec): 180.44 - samples/sec: 8104.60 - lr: 0.025000 +2023-04-05 18:26:46,386 ---------------------------------------------------------------------------------------------------- +2023-04-05 18:26:46,386 EPOCH 127 done: loss 0.0267 - lr 0.025000 +2023-04-05 18:26:46,386 BAD EPOCHS (no improvement): 0 +2023-04-05 18:26:46,389 ---------------------------------------------------------------------------------------------------- +2023-04-05 18:27:04,545 epoch 128 - iter 265/2650 - loss 0.02412791 - time (sec): 18.16 - samples/sec: 8044.88 - lr: 0.025000 +2023-04-05 18:27:22,336 epoch 128 - iter 530/2650 - loss 0.02502421 - time (sec): 35.95 - samples/sec: 8110.52 - lr: 0.025000 +2023-04-05 18:27:40,316 epoch 128 - iter 795/2650 - loss 0.02520468 - time (sec): 53.93 - samples/sec: 8109.96 - lr: 0.025000 +2023-04-05 18:27:58,198 epoch 128 - iter 1060/2650 - loss 0.02520594 - time (sec): 71.81 - samples/sec: 8109.33 - lr: 0.025000 +2023-04-05 18:28:16,257 epoch 128 - iter 1325/2650 - loss 0.02561542 - time (sec): 89.87 - samples/sec: 8103.85 - lr: 0.025000 +2023-04-05 18:28:34,483 epoch 128 - iter 1590/2650 - loss 0.02578441 - time (sec): 108.09 - samples/sec: 8114.48 - lr: 0.025000 +2023-04-05 18:28:52,283 epoch 128 - iter 1855/2650 - loss 0.02590230 - time (sec): 125.89 - samples/sec: 8132.03 - lr: 0.025000 +2023-04-05 18:29:10,642 epoch 128 - iter 2120/2650 - loss 0.02594621 - time (sec): 144.25 - samples/sec: 8113.66 - lr: 0.025000 +2023-04-05 18:29:29,329 epoch 128 - iter 2385/2650 - loss 0.02609275 - time (sec): 162.94 - samples/sec: 8082.30 - lr: 0.025000 +2023-04-05 18:29:47,240 epoch 128 - iter 2650/2650 - loss 0.02602075 - time (sec): 180.85 - samples/sec: 8086.00 - lr: 0.025000 +2023-04-05 18:29:47,240 ---------------------------------------------------------------------------------------------------- +2023-04-05 18:29:47,240 EPOCH 128 done: loss 0.0260 - lr 0.025000 +2023-04-05 18:29:47,240 BAD EPOCHS (no improvement): 0 +2023-04-05 18:29:47,243 ---------------------------------------------------------------------------------------------------- +2023-04-05 18:30:05,301 epoch 129 - iter 265/2650 - loss 0.02599109 - time (sec): 18.06 - samples/sec: 8057.80 - lr: 0.025000 +2023-04-05 18:30:23,450 epoch 129 - iter 530/2650 - loss 0.02568471 - time (sec): 36.21 - samples/sec: 8078.19 - lr: 0.025000 +2023-04-05 18:30:41,825 epoch 129 - iter 795/2650 - loss 0.02573009 - time (sec): 54.58 - samples/sec: 8064.00 - lr: 0.025000 +2023-04-05 18:30:59,623 epoch 129 - iter 1060/2650 - loss 0.02565556 - time (sec): 72.38 - samples/sec: 8097.86 - lr: 0.025000 +2023-04-05 18:31:17,486 epoch 129 - iter 1325/2650 - loss 0.02562216 - time (sec): 90.24 - samples/sec: 8121.02 - lr: 0.025000 +2023-04-05 18:31:35,724 epoch 129 - iter 1590/2650 - loss 0.02580308 - time (sec): 108.48 - samples/sec: 8100.41 - lr: 0.025000 +2023-04-05 18:31:53,367 epoch 129 - iter 1855/2650 - loss 0.02569281 - time (sec): 126.12 - samples/sec: 8120.27 - lr: 0.025000 +2023-04-05 18:32:11,432 epoch 129 - iter 2120/2650 - loss 0.02567842 - time (sec): 144.19 - samples/sec: 8118.51 - lr: 0.025000 +2023-04-05 18:32:29,931 epoch 129 - iter 2385/2650 - loss 0.02578080 - time (sec): 162.69 - samples/sec: 8100.37 - lr: 0.025000 +2023-04-05 18:32:47,669 epoch 129 - iter 2650/2650 - loss 0.02577547 - time (sec): 180.43 - samples/sec: 8105.10 - lr: 0.025000 +2023-04-05 18:32:47,669 ---------------------------------------------------------------------------------------------------- +2023-04-05 18:32:47,669 EPOCH 129 done: loss 0.0258 - lr 0.025000 +2023-04-05 18:32:47,669 BAD EPOCHS (no improvement): 0 +2023-04-05 18:32:47,672 ---------------------------------------------------------------------------------------------------- +2023-04-05 18:33:05,245 epoch 130 - iter 265/2650 - loss 0.02528774 - time (sec): 17.57 - samples/sec: 8226.61 - lr: 0.025000 +2023-04-05 18:33:23,181 epoch 130 - iter 530/2650 - loss 0.02555078 - time (sec): 35.51 - samples/sec: 8164.82 - lr: 0.025000 +2023-04-05 18:33:41,509 epoch 130 - iter 795/2650 - loss 0.02556368 - time (sec): 53.84 - samples/sec: 8121.08 - lr: 0.025000 +2023-04-05 18:33:59,638 epoch 130 - iter 1060/2650 - loss 0.02543156 - time (sec): 71.97 - samples/sec: 8108.15 - lr: 0.025000 +2023-04-05 18:34:17,418 epoch 130 - iter 1325/2650 - loss 0.02524260 - time (sec): 89.75 - samples/sec: 8125.58 - lr: 0.025000 +2023-04-05 18:34:35,441 epoch 130 - iter 1590/2650 - loss 0.02543936 - time (sec): 107.77 - samples/sec: 8115.60 - lr: 0.025000 +2023-04-05 18:34:54,136 epoch 130 - iter 1855/2650 - loss 0.02541993 - time (sec): 126.46 - samples/sec: 8068.61 - lr: 0.025000 +2023-04-05 18:35:11,934 epoch 130 - iter 2120/2650 - loss 0.02546932 - time (sec): 144.26 - samples/sec: 8092.56 - lr: 0.025000 +2023-04-05 18:35:30,360 epoch 130 - iter 2385/2650 - loss 0.02556265 - time (sec): 162.69 - samples/sec: 8093.32 - lr: 0.025000 +2023-04-05 18:35:48,956 epoch 130 - iter 2650/2650 - loss 0.02549351 - time (sec): 181.28 - samples/sec: 8066.71 - lr: 0.025000 +2023-04-05 18:35:48,956 ---------------------------------------------------------------------------------------------------- +2023-04-05 18:35:48,956 EPOCH 130 done: loss 0.0255 - lr 0.025000 +2023-04-05 18:35:48,956 BAD EPOCHS (no improvement): 0 +2023-04-05 18:35:48,960 ---------------------------------------------------------------------------------------------------- +2023-04-05 18:36:07,150 epoch 131 - iter 265/2650 - loss 0.02608488 - time (sec): 18.19 - samples/sec: 8105.90 - lr: 0.025000 +2023-04-05 18:36:25,121 epoch 131 - iter 530/2650 - loss 0.02592117 - time (sec): 36.16 - samples/sec: 8114.69 - lr: 0.025000 +2023-04-05 18:36:43,282 epoch 131 - iter 795/2650 - loss 0.02565652 - time (sec): 54.32 - samples/sec: 8095.02 - lr: 0.025000 +2023-04-05 18:37:01,694 epoch 131 - iter 1060/2650 - loss 0.02521483 - time (sec): 72.73 - samples/sec: 8050.09 - lr: 0.025000 +2023-04-05 18:37:19,685 epoch 131 - iter 1325/2650 - loss 0.02528238 - time (sec): 90.73 - samples/sec: 8072.91 - lr: 0.025000 +2023-04-05 18:37:36,943 epoch 131 - iter 1590/2650 - loss 0.02539675 - time (sec): 107.98 - samples/sec: 8115.78 - lr: 0.025000 +2023-04-05 18:37:55,368 epoch 131 - iter 1855/2650 - loss 0.02575196 - time (sec): 126.41 - samples/sec: 8093.75 - lr: 0.025000 +2023-04-05 18:38:14,038 epoch 131 - iter 2120/2650 - loss 0.02567297 - time (sec): 145.08 - samples/sec: 8079.90 - lr: 0.025000 +2023-04-05 18:38:31,621 epoch 131 - iter 2385/2650 - loss 0.02557674 - time (sec): 162.66 - samples/sec: 8092.37 - lr: 0.025000 +2023-04-05 18:38:49,363 epoch 131 - iter 2650/2650 - loss 0.02547960 - time (sec): 180.40 - samples/sec: 8106.08 - lr: 0.025000 +2023-04-05 18:38:49,363 ---------------------------------------------------------------------------------------------------- +2023-04-05 18:38:49,363 EPOCH 131 done: loss 0.0255 - lr 0.025000 +2023-04-05 18:38:49,363 BAD EPOCHS (no improvement): 0 +2023-04-05 18:38:49,367 ---------------------------------------------------------------------------------------------------- +2023-04-05 18:39:07,158 epoch 132 - iter 265/2650 - loss 0.02526280 - time (sec): 17.79 - samples/sec: 8194.92 - lr: 0.025000 +2023-04-05 18:39:25,817 epoch 132 - iter 530/2650 - loss 0.02516201 - time (sec): 36.45 - samples/sec: 8006.02 - lr: 0.025000 +2023-04-05 18:39:43,388 epoch 132 - iter 795/2650 - loss 0.02544962 - time (sec): 54.02 - samples/sec: 8093.13 - lr: 0.025000 +2023-04-05 18:40:02,160 epoch 132 - iter 1060/2650 - loss 0.02532481 - time (sec): 72.79 - samples/sec: 8018.78 - lr: 0.025000 +2023-04-05 18:40:19,739 epoch 132 - iter 1325/2650 - loss 0.02540267 - time (sec): 90.37 - samples/sec: 8060.62 - lr: 0.025000 +2023-04-05 18:40:37,563 epoch 132 - iter 1590/2650 - loss 0.02537736 - time (sec): 108.20 - samples/sec: 8078.10 - lr: 0.025000 +2023-04-05 18:40:55,639 epoch 132 - iter 1855/2650 - loss 0.02509043 - time (sec): 126.27 - samples/sec: 8084.14 - lr: 0.025000 +2023-04-05 18:41:14,162 epoch 132 - iter 2120/2650 - loss 0.02525964 - time (sec): 144.80 - samples/sec: 8064.46 - lr: 0.025000 +2023-04-05 18:41:32,126 epoch 132 - iter 2385/2650 - loss 0.02515181 - time (sec): 162.76 - samples/sec: 8077.11 - lr: 0.025000 +2023-04-05 18:41:50,361 epoch 132 - iter 2650/2650 - loss 0.02518512 - time (sec): 180.99 - samples/sec: 8079.59 - lr: 0.025000 +2023-04-05 18:41:50,362 ---------------------------------------------------------------------------------------------------- +2023-04-05 18:41:50,362 EPOCH 132 done: loss 0.0252 - lr 0.025000 +2023-04-05 18:41:50,362 BAD EPOCHS (no improvement): 0 +2023-04-05 18:41:50,364 ---------------------------------------------------------------------------------------------------- +2023-04-05 18:42:08,079 epoch 133 - iter 265/2650 - loss 0.02498017 - time (sec): 17.71 - samples/sec: 8192.46 - lr: 0.025000 +2023-04-05 18:42:26,186 epoch 133 - iter 530/2650 - loss 0.02482306 - time (sec): 35.82 - samples/sec: 8154.43 - lr: 0.025000 +2023-04-05 18:42:44,410 epoch 133 - iter 795/2650 - loss 0.02476083 - time (sec): 54.05 - samples/sec: 8130.80 - lr: 0.025000 +2023-04-05 18:43:02,463 epoch 133 - iter 1060/2650 - loss 0.02465676 - time (sec): 72.10 - samples/sec: 8120.65 - lr: 0.025000 +2023-04-05 18:43:20,920 epoch 133 - iter 1325/2650 - loss 0.02487944 - time (sec): 90.56 - samples/sec: 8114.18 - lr: 0.025000 +2023-04-05 18:43:39,893 epoch 133 - iter 1590/2650 - loss 0.02481255 - time (sec): 109.53 - samples/sec: 8046.64 - lr: 0.025000 +2023-04-05 18:43:57,875 epoch 133 - iter 1855/2650 - loss 0.02495586 - time (sec): 127.51 - samples/sec: 8063.78 - lr: 0.025000 +2023-04-05 18:44:15,914 epoch 133 - iter 2120/2650 - loss 0.02498226 - time (sec): 145.55 - samples/sec: 8061.77 - lr: 0.025000 +2023-04-05 18:44:33,445 epoch 133 - iter 2385/2650 - loss 0.02507539 - time (sec): 163.08 - samples/sec: 8083.29 - lr: 0.025000 +2023-04-05 18:44:51,359 epoch 133 - iter 2650/2650 - loss 0.02516142 - time (sec): 181.00 - samples/sec: 8079.58 - lr: 0.025000 +2023-04-05 18:44:51,360 ---------------------------------------------------------------------------------------------------- +2023-04-05 18:44:51,360 EPOCH 133 done: loss 0.0252 - lr 0.025000 +2023-04-05 18:44:51,360 BAD EPOCHS (no improvement): 0 +2023-04-05 18:44:51,362 ---------------------------------------------------------------------------------------------------- +2023-04-05 18:45:09,180 epoch 134 - iter 265/2650 - loss 0.02457572 - time (sec): 17.82 - samples/sec: 8195.86 - lr: 0.025000 +2023-04-05 18:45:26,963 epoch 134 - iter 530/2650 - loss 0.02485823 - time (sec): 35.60 - samples/sec: 8164.70 - lr: 0.025000 +2023-04-05 18:45:45,696 epoch 134 - iter 795/2650 - loss 0.02513041 - time (sec): 54.33 - samples/sec: 8052.78 - lr: 0.025000 +2023-04-05 18:46:03,480 epoch 134 - iter 1060/2650 - loss 0.02510502 - time (sec): 72.12 - samples/sec: 8103.35 - lr: 0.025000 +2023-04-05 18:46:21,630 epoch 134 - iter 1325/2650 - loss 0.02523565 - time (sec): 90.27 - samples/sec: 8084.10 - lr: 0.025000 +2023-04-05 18:46:40,241 epoch 134 - iter 1590/2650 - loss 0.02521900 - time (sec): 108.88 - samples/sec: 8049.50 - lr: 0.025000 +2023-04-05 18:46:58,713 epoch 134 - iter 1855/2650 - loss 0.02514394 - time (sec): 127.35 - samples/sec: 8047.89 - lr: 0.025000 +2023-04-05 18:47:16,347 epoch 134 - iter 2120/2650 - loss 0.02528172 - time (sec): 144.98 - samples/sec: 8072.89 - lr: 0.025000 +2023-04-05 18:47:34,647 epoch 134 - iter 2385/2650 - loss 0.02521397 - time (sec): 163.29 - samples/sec: 8064.12 - lr: 0.025000 +2023-04-05 18:47:52,426 epoch 134 - iter 2650/2650 - loss 0.02522383 - time (sec): 181.06 - samples/sec: 8076.50 - lr: 0.025000 +2023-04-05 18:47:52,427 ---------------------------------------------------------------------------------------------------- +2023-04-05 18:47:52,427 EPOCH 134 done: loss 0.0252 - lr 0.025000 +2023-04-05 18:47:52,427 BAD EPOCHS (no improvement): 1 +2023-04-05 18:47:52,430 ---------------------------------------------------------------------------------------------------- +2023-04-05 18:48:10,428 epoch 135 - iter 265/2650 - loss 0.02515428 - time (sec): 18.00 - samples/sec: 8095.20 - lr: 0.025000 +2023-04-05 18:48:29,028 epoch 135 - iter 530/2650 - loss 0.02531870 - time (sec): 36.60 - samples/sec: 7998.43 - lr: 0.025000 +2023-04-05 18:48:46,930 epoch 135 - iter 795/2650 - loss 0.02561037 - time (sec): 54.50 - samples/sec: 8054.65 - lr: 0.025000 +2023-04-05 18:49:05,052 epoch 135 - iter 1060/2650 - loss 0.02523012 - time (sec): 72.62 - samples/sec: 8048.76 - lr: 0.025000 +2023-04-05 18:49:23,558 epoch 135 - iter 1325/2650 - loss 0.02496347 - time (sec): 91.13 - samples/sec: 8034.77 - lr: 0.025000 +2023-04-05 18:49:41,199 epoch 135 - iter 1590/2650 - loss 0.02460371 - time (sec): 108.77 - samples/sec: 8078.41 - lr: 0.025000 +2023-04-05 18:49:59,087 epoch 135 - iter 1855/2650 - loss 0.02464470 - time (sec): 126.66 - samples/sec: 8075.22 - lr: 0.025000 +2023-04-05 18:50:17,197 epoch 135 - iter 2120/2650 - loss 0.02472300 - time (sec): 144.77 - samples/sec: 8076.81 - lr: 0.025000 +2023-04-05 18:50:35,910 epoch 135 - iter 2385/2650 - loss 0.02477552 - time (sec): 163.48 - samples/sec: 8053.95 - lr: 0.025000 +2023-04-05 18:50:54,175 epoch 135 - iter 2650/2650 - loss 0.02486079 - time (sec): 181.74 - samples/sec: 8046.24 - lr: 0.025000 +2023-04-05 18:50:54,175 ---------------------------------------------------------------------------------------------------- +2023-04-05 18:50:54,176 EPOCH 135 done: loss 0.0249 - lr 0.025000 +2023-04-05 18:50:54,176 BAD EPOCHS (no improvement): 0 +2023-04-05 18:50:54,179 ---------------------------------------------------------------------------------------------------- +2023-04-05 18:51:12,065 epoch 136 - iter 265/2650 - loss 0.02542377 - time (sec): 17.89 - samples/sec: 8123.12 - lr: 0.025000 +2023-04-05 18:51:30,200 epoch 136 - iter 530/2650 - loss 0.02492437 - time (sec): 36.02 - samples/sec: 8096.11 - lr: 0.025000 +2023-04-05 18:51:48,768 epoch 136 - iter 795/2650 - loss 0.02484104 - time (sec): 54.59 - samples/sec: 8012.81 - lr: 0.025000 +2023-04-05 18:52:07,516 epoch 136 - iter 1060/2650 - loss 0.02467132 - time (sec): 73.34 - samples/sec: 7977.27 - lr: 0.025000 +2023-04-05 18:52:25,740 epoch 136 - iter 1325/2650 - loss 0.02459426 - time (sec): 91.56 - samples/sec: 7994.65 - lr: 0.025000 +2023-04-05 18:52:43,831 epoch 136 - iter 1590/2650 - loss 0.02470621 - time (sec): 109.65 - samples/sec: 8009.86 - lr: 0.025000 +2023-04-05 18:53:01,805 epoch 136 - iter 1855/2650 - loss 0.02471586 - time (sec): 127.63 - samples/sec: 8035.97 - lr: 0.025000 +2023-04-05 18:53:19,584 epoch 136 - iter 2120/2650 - loss 0.02474584 - time (sec): 145.40 - samples/sec: 8050.40 - lr: 0.025000 +2023-04-05 18:53:36,996 epoch 136 - iter 2385/2650 - loss 0.02472729 - time (sec): 162.82 - samples/sec: 8081.92 - lr: 0.025000 +2023-04-05 18:53:55,198 epoch 136 - iter 2650/2650 - loss 0.02484105 - time (sec): 181.02 - samples/sec: 8078.51 - lr: 0.025000 +2023-04-05 18:53:55,199 ---------------------------------------------------------------------------------------------------- +2023-04-05 18:53:55,199 EPOCH 136 done: loss 0.0248 - lr 0.025000 +2023-04-05 18:53:55,199 BAD EPOCHS (no improvement): 0 +2023-04-05 18:53:55,201 ---------------------------------------------------------------------------------------------------- +2023-04-05 18:54:23,011 epoch 137 - iter 265/2650 - loss 0.02398522 - time (sec): 27.81 - samples/sec: 5222.81 - lr: 0.025000 +2023-04-05 18:54:40,759 epoch 137 - iter 530/2650 - loss 0.02461934 - time (sec): 45.56 - samples/sec: 6351.79 - lr: 0.025000 +2023-04-05 18:54:59,275 epoch 137 - iter 795/2650 - loss 0.02487058 - time (sec): 64.07 - samples/sec: 6796.59 - lr: 0.025000 +2023-04-05 18:55:17,239 epoch 137 - iter 1060/2650 - loss 0.02473141 - time (sec): 82.04 - samples/sec: 7076.98 - lr: 0.025000 +2023-04-05 18:55:35,673 epoch 137 - iter 1325/2650 - loss 0.02483518 - time (sec): 100.47 - samples/sec: 7252.10 - lr: 0.025000 +2023-04-05 18:55:53,974 epoch 137 - iter 1590/2650 - loss 0.02484433 - time (sec): 118.77 - samples/sec: 7357.59 - lr: 0.025000 +2023-04-05 18:56:12,103 epoch 137 - iter 1855/2650 - loss 0.02487423 - time (sec): 136.90 - samples/sec: 7455.37 - lr: 0.025000 +2023-04-05 18:56:30,340 epoch 137 - iter 2120/2650 - loss 0.02488445 - time (sec): 155.14 - samples/sec: 7530.51 - lr: 0.025000 +2023-04-05 18:56:48,822 epoch 137 - iter 2385/2650 - loss 0.02495899 - time (sec): 173.62 - samples/sec: 7583.64 - lr: 0.025000 +2023-04-05 18:57:06,421 epoch 137 - iter 2650/2650 - loss 0.02475853 - time (sec): 191.22 - samples/sec: 7647.57 - lr: 0.025000 +2023-04-05 18:57:06,421 ---------------------------------------------------------------------------------------------------- +2023-04-05 18:57:06,421 EPOCH 137 done: loss 0.0248 - lr 0.025000 +2023-04-05 18:57:06,421 BAD EPOCHS (no improvement): 0 +2023-04-05 18:57:06,424 ---------------------------------------------------------------------------------------------------- +2023-04-05 18:57:24,169 epoch 138 - iter 265/2650 - loss 0.02427945 - time (sec): 17.74 - samples/sec: 8182.15 - lr: 0.025000 +2023-04-05 18:57:42,079 epoch 138 - iter 530/2650 - loss 0.02408522 - time (sec): 35.65 - samples/sec: 8182.47 - lr: 0.025000 +2023-04-05 18:58:00,683 epoch 138 - iter 795/2650 - loss 0.02429837 - time (sec): 54.26 - samples/sec: 8095.01 - lr: 0.025000 +2023-04-05 18:58:18,995 epoch 138 - iter 1060/2650 - loss 0.02453084 - time (sec): 72.57 - samples/sec: 8088.43 - lr: 0.025000 +2023-04-05 18:58:37,225 epoch 138 - iter 1325/2650 - loss 0.02460430 - time (sec): 90.80 - samples/sec: 8091.10 - lr: 0.025000 +2023-04-05 18:58:55,469 epoch 138 - iter 1590/2650 - loss 0.02465567 - time (sec): 109.04 - samples/sec: 8066.84 - lr: 0.025000 +2023-04-05 18:59:14,097 epoch 138 - iter 1855/2650 - loss 0.02449791 - time (sec): 127.67 - samples/sec: 8039.58 - lr: 0.025000 +2023-04-05 18:59:31,986 epoch 138 - iter 2120/2650 - loss 0.02465562 - time (sec): 145.56 - samples/sec: 8047.63 - lr: 0.025000 +2023-04-05 18:59:50,040 epoch 138 - iter 2385/2650 - loss 0.02467509 - time (sec): 163.62 - samples/sec: 8057.35 - lr: 0.025000 +2023-04-05 19:00:08,105 epoch 138 - iter 2650/2650 - loss 0.02464871 - time (sec): 181.68 - samples/sec: 8049.10 - lr: 0.025000 +2023-04-05 19:00:08,105 ---------------------------------------------------------------------------------------------------- +2023-04-05 19:00:08,105 EPOCH 138 done: loss 0.0246 - lr 0.025000 +2023-04-05 19:00:08,105 BAD EPOCHS (no improvement): 0 +2023-04-05 19:00:08,108 ---------------------------------------------------------------------------------------------------- +2023-04-05 19:00:26,236 epoch 139 - iter 265/2650 - loss 0.02498530 - time (sec): 18.13 - samples/sec: 8137.63 - lr: 0.025000 +2023-04-05 19:00:44,097 epoch 139 - iter 530/2650 - loss 0.02449827 - time (sec): 35.99 - samples/sec: 8111.14 - lr: 0.025000 +2023-04-05 19:01:02,511 epoch 139 - iter 795/2650 - loss 0.02468473 - time (sec): 54.40 - samples/sec: 8045.64 - lr: 0.025000 +2023-04-05 19:01:20,505 epoch 139 - iter 1060/2650 - loss 0.02480890 - time (sec): 72.40 - samples/sec: 8049.98 - lr: 0.025000 +2023-04-05 19:01:38,334 epoch 139 - iter 1325/2650 - loss 0.02472212 - time (sec): 90.23 - samples/sec: 8067.88 - lr: 0.025000 +2023-04-05 19:01:56,483 epoch 139 - iter 1590/2650 - loss 0.02469157 - time (sec): 108.37 - samples/sec: 8079.40 - lr: 0.025000 +2023-04-05 19:02:14,516 epoch 139 - iter 1855/2650 - loss 0.02451259 - time (sec): 126.41 - samples/sec: 8075.07 - lr: 0.025000 +2023-04-05 19:02:32,774 epoch 139 - iter 2120/2650 - loss 0.02435786 - time (sec): 144.67 - samples/sec: 8082.15 - lr: 0.025000 +2023-04-05 19:02:51,171 epoch 139 - iter 2385/2650 - loss 0.02432947 - time (sec): 163.06 - samples/sec: 8070.10 - lr: 0.025000 +2023-04-05 19:03:09,791 epoch 139 - iter 2650/2650 - loss 0.02436687 - time (sec): 181.68 - samples/sec: 8048.98 - lr: 0.025000 +2023-04-05 19:03:09,792 ---------------------------------------------------------------------------------------------------- +2023-04-05 19:03:09,792 EPOCH 139 done: loss 0.0244 - lr 0.025000 +2023-04-05 19:03:09,792 BAD EPOCHS (no improvement): 0 +2023-04-05 19:03:09,796 ---------------------------------------------------------------------------------------------------- +2023-04-05 19:03:28,698 epoch 140 - iter 265/2650 - loss 0.02468503 - time (sec): 18.90 - samples/sec: 7808.15 - lr: 0.025000 +2023-04-05 19:03:46,948 epoch 140 - iter 530/2650 - loss 0.02462389 - time (sec): 37.15 - samples/sec: 7936.13 - lr: 0.025000 +2023-04-05 19:04:04,305 epoch 140 - iter 795/2650 - loss 0.02481561 - time (sec): 54.51 - samples/sec: 8076.94 - lr: 0.025000 +2023-04-05 19:04:22,700 epoch 140 - iter 1060/2650 - loss 0.02483435 - time (sec): 72.90 - samples/sec: 8032.00 - lr: 0.025000 +2023-04-05 19:04:40,447 epoch 140 - iter 1325/2650 - loss 0.02484754 - time (sec): 90.65 - samples/sec: 8074.66 - lr: 0.025000 +2023-04-05 19:04:58,324 epoch 140 - iter 1590/2650 - loss 0.02484423 - time (sec): 108.53 - samples/sec: 8086.68 - lr: 0.025000 +2023-04-05 19:05:16,532 epoch 140 - iter 1855/2650 - loss 0.02490814 - time (sec): 126.74 - samples/sec: 8076.81 - lr: 0.025000 +2023-04-05 19:05:34,861 epoch 140 - iter 2120/2650 - loss 0.02484655 - time (sec): 145.07 - samples/sec: 8067.23 - lr: 0.025000 +2023-04-05 19:05:52,734 epoch 140 - iter 2385/2650 - loss 0.02466221 - time (sec): 162.94 - samples/sec: 8077.24 - lr: 0.025000 +2023-04-05 19:06:11,647 epoch 140 - iter 2650/2650 - loss 0.02472064 - time (sec): 181.85 - samples/sec: 8041.52 - lr: 0.025000 +2023-04-05 19:06:11,648 ---------------------------------------------------------------------------------------------------- +2023-04-05 19:06:11,648 EPOCH 140 done: loss 0.0247 - lr 0.025000 +2023-04-05 19:06:11,648 BAD EPOCHS (no improvement): 1 +2023-04-05 19:06:11,650 ---------------------------------------------------------------------------------------------------- +2023-04-05 19:06:29,850 epoch 141 - iter 265/2650 - loss 0.02434420 - time (sec): 18.20 - samples/sec: 7988.83 - lr: 0.025000 +2023-04-05 19:06:47,857 epoch 141 - iter 530/2650 - loss 0.02436066 - time (sec): 36.21 - samples/sec: 8069.81 - lr: 0.025000 +2023-04-05 19:07:06,350 epoch 141 - iter 795/2650 - loss 0.02534629 - time (sec): 54.70 - samples/sec: 8014.54 - lr: 0.025000 +2023-04-05 19:07:24,551 epoch 141 - iter 1060/2650 - loss 0.02502286 - time (sec): 72.90 - samples/sec: 8002.30 - lr: 0.025000 +2023-04-05 19:07:42,712 epoch 141 - iter 1325/2650 - loss 0.02484554 - time (sec): 91.06 - samples/sec: 8006.66 - lr: 0.025000 +2023-04-05 19:08:00,673 epoch 141 - iter 1590/2650 - loss 0.02475347 - time (sec): 109.02 - samples/sec: 8025.45 - lr: 0.025000 +2023-04-05 19:08:18,701 epoch 141 - iter 1855/2650 - loss 0.02473113 - time (sec): 127.05 - samples/sec: 8041.95 - lr: 0.025000 +2023-04-05 19:08:36,115 epoch 141 - iter 2120/2650 - loss 0.02461074 - time (sec): 144.46 - samples/sec: 8073.30 - lr: 0.025000 +2023-04-05 19:08:54,495 epoch 141 - iter 2385/2650 - loss 0.02448703 - time (sec): 162.84 - samples/sec: 8074.58 - lr: 0.025000 +2023-04-05 19:09:12,620 epoch 141 - iter 2650/2650 - loss 0.02465336 - time (sec): 180.97 - samples/sec: 8080.70 - lr: 0.025000 +2023-04-05 19:09:12,620 ---------------------------------------------------------------------------------------------------- +2023-04-05 19:09:12,621 EPOCH 141 done: loss 0.0247 - lr 0.025000 +2023-04-05 19:09:12,621 BAD EPOCHS (no improvement): 2 +2023-04-05 19:09:12,624 ---------------------------------------------------------------------------------------------------- +2023-04-05 19:09:31,185 epoch 142 - iter 265/2650 - loss 0.02362361 - time (sec): 18.56 - samples/sec: 8028.65 - lr: 0.025000 +2023-04-05 19:09:48,926 epoch 142 - iter 530/2650 - loss 0.02378519 - time (sec): 36.30 - samples/sec: 8099.60 - lr: 0.025000 +2023-04-05 19:10:06,578 epoch 142 - iter 795/2650 - loss 0.02401617 - time (sec): 53.95 - samples/sec: 8137.17 - lr: 0.025000 +2023-04-05 19:10:24,606 epoch 142 - iter 1060/2650 - loss 0.02395020 - time (sec): 71.98 - samples/sec: 8122.96 - lr: 0.025000 +2023-04-05 19:10:42,478 epoch 142 - iter 1325/2650 - loss 0.02400259 - time (sec): 89.85 - samples/sec: 8128.14 - lr: 0.025000 +2023-04-05 19:11:01,125 epoch 142 - iter 1590/2650 - loss 0.02427005 - time (sec): 108.50 - samples/sec: 8095.44 - lr: 0.025000 +2023-04-05 19:11:19,552 epoch 142 - iter 1855/2650 - loss 0.02414302 - time (sec): 126.93 - samples/sec: 8080.23 - lr: 0.025000 +2023-04-05 19:11:37,465 epoch 142 - iter 2120/2650 - loss 0.02406484 - time (sec): 144.84 - samples/sec: 8079.65 - lr: 0.025000 +2023-04-05 19:11:55,717 epoch 142 - iter 2385/2650 - loss 0.02411731 - time (sec): 163.09 - samples/sec: 8076.86 - lr: 0.025000 +2023-04-05 19:12:13,456 epoch 142 - iter 2650/2650 - loss 0.02409605 - time (sec): 180.83 - samples/sec: 8086.85 - lr: 0.025000 +2023-04-05 19:12:13,456 ---------------------------------------------------------------------------------------------------- +2023-04-05 19:12:13,457 EPOCH 142 done: loss 0.0241 - lr 0.025000 +2023-04-05 19:12:13,457 BAD EPOCHS (no improvement): 0 +2023-04-05 19:12:13,460 ---------------------------------------------------------------------------------------------------- +2023-04-05 19:12:31,737 epoch 143 - iter 265/2650 - loss 0.02411463 - time (sec): 18.28 - samples/sec: 8048.46 - lr: 0.025000 +2023-04-05 19:12:49,871 epoch 143 - iter 530/2650 - loss 0.02313879 - time (sec): 36.41 - samples/sec: 8041.93 - lr: 0.025000 +2023-04-05 19:13:07,745 epoch 143 - iter 795/2650 - loss 0.02367285 - time (sec): 54.29 - samples/sec: 8089.07 - lr: 0.025000 +2023-04-05 19:13:26,132 epoch 143 - iter 1060/2650 - loss 0.02351134 - time (sec): 72.67 - samples/sec: 8049.22 - lr: 0.025000 +2023-04-05 19:13:44,378 epoch 143 - iter 1325/2650 - loss 0.02383040 - time (sec): 90.92 - samples/sec: 8038.09 - lr: 0.025000 +2023-04-05 19:14:02,445 epoch 143 - iter 1590/2650 - loss 0.02373061 - time (sec): 108.99 - samples/sec: 8043.84 - lr: 0.025000 +2023-04-05 19:14:21,387 epoch 143 - iter 1855/2650 - loss 0.02384253 - time (sec): 127.93 - samples/sec: 8011.47 - lr: 0.025000 +2023-04-05 19:14:38,985 epoch 143 - iter 2120/2650 - loss 0.02401724 - time (sec): 145.53 - samples/sec: 8045.84 - lr: 0.025000 +2023-04-05 19:14:56,902 epoch 143 - iter 2385/2650 - loss 0.02410497 - time (sec): 163.44 - samples/sec: 8058.34 - lr: 0.025000 +2023-04-05 19:15:14,821 epoch 143 - iter 2650/2650 - loss 0.02415712 - time (sec): 181.36 - samples/sec: 8063.25 - lr: 0.025000 +2023-04-05 19:15:14,821 ---------------------------------------------------------------------------------------------------- +2023-04-05 19:15:14,822 EPOCH 143 done: loss 0.0242 - lr 0.025000 +2023-04-05 19:15:14,822 BAD EPOCHS (no improvement): 1 +2023-04-05 19:15:14,824 ---------------------------------------------------------------------------------------------------- +2023-04-05 19:15:32,821 epoch 144 - iter 265/2650 - loss 0.02410146 - time (sec): 18.00 - samples/sec: 8222.39 - lr: 0.025000 +2023-04-05 19:15:50,831 epoch 144 - iter 530/2650 - loss 0.02455104 - time (sec): 36.01 - samples/sec: 8176.79 - lr: 0.025000 +2023-04-05 19:16:09,132 epoch 144 - iter 795/2650 - loss 0.02422497 - time (sec): 54.31 - samples/sec: 8110.35 - lr: 0.025000 +2023-04-05 19:16:27,308 epoch 144 - iter 1060/2650 - loss 0.02412373 - time (sec): 72.48 - samples/sec: 8081.46 - lr: 0.025000 +2023-04-05 19:16:45,473 epoch 144 - iter 1325/2650 - loss 0.02422841 - time (sec): 90.65 - samples/sec: 8077.44 - lr: 0.025000 +2023-04-05 19:17:03,886 epoch 144 - iter 1590/2650 - loss 0.02431464 - time (sec): 109.06 - samples/sec: 8050.87 - lr: 0.025000 +2023-04-05 19:17:22,166 epoch 144 - iter 1855/2650 - loss 0.02434347 - time (sec): 127.34 - samples/sec: 8049.13 - lr: 0.025000 +2023-04-05 19:17:40,178 epoch 144 - iter 2120/2650 - loss 0.02414644 - time (sec): 145.35 - samples/sec: 8056.50 - lr: 0.025000 +2023-04-05 19:17:58,238 epoch 144 - iter 2385/2650 - loss 0.02394313 - time (sec): 163.41 - samples/sec: 8059.74 - lr: 0.025000 +2023-04-05 19:18:16,557 epoch 144 - iter 2650/2650 - loss 0.02403273 - time (sec): 181.73 - samples/sec: 8046.78 - lr: 0.025000 +2023-04-05 19:18:16,557 ---------------------------------------------------------------------------------------------------- +2023-04-05 19:18:16,557 EPOCH 144 done: loss 0.0240 - lr 0.025000 +2023-04-05 19:18:16,557 BAD EPOCHS (no improvement): 0 +2023-04-05 19:18:16,560 ---------------------------------------------------------------------------------------------------- +2023-04-05 19:18:34,838 epoch 145 - iter 265/2650 - loss 0.02442818 - time (sec): 18.28 - samples/sec: 8112.38 - lr: 0.025000 +2023-04-05 19:18:52,596 epoch 145 - iter 530/2650 - loss 0.02383093 - time (sec): 36.04 - samples/sec: 8136.39 - lr: 0.025000 +2023-04-05 19:19:10,429 epoch 145 - iter 795/2650 - loss 0.02421364 - time (sec): 53.87 - samples/sec: 8128.87 - lr: 0.025000 +2023-04-05 19:19:28,524 epoch 145 - iter 1060/2650 - loss 0.02416159 - time (sec): 71.96 - samples/sec: 8114.35 - lr: 0.025000 +2023-04-05 19:19:46,600 epoch 145 - iter 1325/2650 - loss 0.02441926 - time (sec): 90.04 - samples/sec: 8105.17 - lr: 0.025000 +2023-04-05 19:20:05,121 epoch 145 - iter 1590/2650 - loss 0.02465421 - time (sec): 108.56 - samples/sec: 8079.30 - lr: 0.025000 +2023-04-05 19:20:23,180 epoch 145 - iter 1855/2650 - loss 0.02463703 - time (sec): 126.62 - samples/sec: 8065.80 - lr: 0.025000 +2023-04-05 19:20:41,537 epoch 145 - iter 2120/2650 - loss 0.02446815 - time (sec): 144.98 - samples/sec: 8050.14 - lr: 0.025000 +2023-04-05 19:20:59,386 epoch 145 - iter 2385/2650 - loss 0.02440793 - time (sec): 162.83 - samples/sec: 8075.16 - lr: 0.025000 +2023-04-05 19:21:17,593 epoch 145 - iter 2650/2650 - loss 0.02449743 - time (sec): 181.03 - samples/sec: 8077.90 - lr: 0.025000 +2023-04-05 19:21:17,593 ---------------------------------------------------------------------------------------------------- +2023-04-05 19:21:17,593 EPOCH 145 done: loss 0.0245 - lr 0.025000 +2023-04-05 19:21:17,593 BAD EPOCHS (no improvement): 1 +2023-04-05 19:21:17,596 ---------------------------------------------------------------------------------------------------- +2023-04-05 19:21:36,198 epoch 146 - iter 265/2650 - loss 0.02431475 - time (sec): 18.60 - samples/sec: 7808.35 - lr: 0.025000 +2023-04-05 19:21:54,256 epoch 146 - iter 530/2650 - loss 0.02434228 - time (sec): 36.66 - samples/sec: 7943.37 - lr: 0.025000 +2023-04-05 19:22:12,343 epoch 146 - iter 795/2650 - loss 0.02438686 - time (sec): 54.75 - samples/sec: 7987.82 - lr: 0.025000 +2023-04-05 19:22:30,133 epoch 146 - iter 1060/2650 - loss 0.02486960 - time (sec): 72.54 - samples/sec: 8036.91 - lr: 0.025000 +2023-04-05 19:22:48,709 epoch 146 - iter 1325/2650 - loss 0.02506781 - time (sec): 91.11 - samples/sec: 8028.05 - lr: 0.025000 +2023-04-05 19:23:06,826 epoch 146 - iter 1590/2650 - loss 0.02497211 - time (sec): 109.23 - samples/sec: 8041.87 - lr: 0.025000 +2023-04-05 19:23:24,616 epoch 146 - iter 1855/2650 - loss 0.02464985 - time (sec): 127.02 - samples/sec: 8060.30 - lr: 0.025000 +2023-04-05 19:23:42,611 epoch 146 - iter 2120/2650 - loss 0.02469244 - time (sec): 145.02 - samples/sec: 8055.12 - lr: 0.025000 +2023-04-05 19:24:01,182 epoch 146 - iter 2385/2650 - loss 0.02469925 - time (sec): 163.59 - samples/sec: 8046.52 - lr: 0.025000 +2023-04-05 19:24:19,374 epoch 146 - iter 2650/2650 - loss 0.02460959 - time (sec): 181.78 - samples/sec: 8044.78 - lr: 0.025000 +2023-04-05 19:24:19,374 ---------------------------------------------------------------------------------------------------- +2023-04-05 19:24:19,375 EPOCH 146 done: loss 0.0246 - lr 0.025000 +2023-04-05 19:24:19,375 BAD EPOCHS (no improvement): 2 +2023-04-05 19:24:19,377 ---------------------------------------------------------------------------------------------------- +2023-04-05 19:24:37,558 epoch 147 - iter 265/2650 - loss 0.02400175 - time (sec): 18.18 - samples/sec: 7974.29 - lr: 0.025000 +2023-04-05 19:24:56,035 epoch 147 - iter 530/2650 - loss 0.02388287 - time (sec): 36.66 - samples/sec: 7999.78 - lr: 0.025000 +2023-04-05 19:25:13,853 epoch 147 - iter 795/2650 - loss 0.02412332 - time (sec): 54.48 - samples/sec: 8084.05 - lr: 0.025000 +2023-04-05 19:25:32,308 epoch 147 - iter 1060/2650 - loss 0.02419860 - time (sec): 72.93 - samples/sec: 8065.79 - lr: 0.025000 +2023-04-05 19:25:49,659 epoch 147 - iter 1325/2650 - loss 0.02409351 - time (sec): 90.28 - samples/sec: 8120.00 - lr: 0.025000 +2023-04-05 19:26:07,964 epoch 147 - iter 1590/2650 - loss 0.02417817 - time (sec): 108.59 - samples/sec: 8090.30 - lr: 0.025000 +2023-04-05 19:26:25,776 epoch 147 - iter 1855/2650 - loss 0.02414995 - time (sec): 126.40 - samples/sec: 8094.92 - lr: 0.025000 +2023-04-05 19:26:44,155 epoch 147 - iter 2120/2650 - loss 0.02396278 - time (sec): 144.78 - samples/sec: 8085.49 - lr: 0.025000 +2023-04-05 19:27:02,337 epoch 147 - iter 2385/2650 - loss 0.02392168 - time (sec): 162.96 - samples/sec: 8082.09 - lr: 0.025000 +2023-04-05 19:27:20,296 epoch 147 - iter 2650/2650 - loss 0.02396101 - time (sec): 180.92 - samples/sec: 8083.00 - lr: 0.025000 +2023-04-05 19:27:20,296 ---------------------------------------------------------------------------------------------------- +2023-04-05 19:27:20,296 EPOCH 147 done: loss 0.0240 - lr 0.025000 +2023-04-05 19:27:20,296 BAD EPOCHS (no improvement): 0 +2023-04-05 19:27:20,300 ---------------------------------------------------------------------------------------------------- +2023-04-05 19:27:38,438 epoch 148 - iter 265/2650 - loss 0.02418173 - time (sec): 18.14 - samples/sec: 7986.80 - lr: 0.025000 +2023-04-05 19:27:56,592 epoch 148 - iter 530/2650 - loss 0.02349866 - time (sec): 36.29 - samples/sec: 8047.67 - lr: 0.025000 +2023-04-05 19:28:14,951 epoch 148 - iter 795/2650 - loss 0.02330397 - time (sec): 54.65 - samples/sec: 8029.85 - lr: 0.025000 +2023-04-05 19:28:32,991 epoch 148 - iter 1060/2650 - loss 0.02358839 - time (sec): 72.69 - samples/sec: 8058.41 - lr: 0.025000 +2023-04-05 19:28:51,226 epoch 148 - iter 1325/2650 - loss 0.02361168 - time (sec): 90.93 - samples/sec: 8045.44 - lr: 0.025000 +2023-04-05 19:29:09,472 epoch 148 - iter 1590/2650 - loss 0.02360907 - time (sec): 109.17 - samples/sec: 8045.32 - lr: 0.025000 +2023-04-05 19:29:27,565 epoch 148 - iter 1855/2650 - loss 0.02356411 - time (sec): 127.27 - samples/sec: 8060.23 - lr: 0.025000 +2023-04-05 19:29:45,453 epoch 148 - iter 2120/2650 - loss 0.02376616 - time (sec): 145.15 - samples/sec: 8065.54 - lr: 0.025000 +2023-04-05 19:30:03,188 epoch 148 - iter 2385/2650 - loss 0.02377001 - time (sec): 162.89 - samples/sec: 8078.36 - lr: 0.025000 +2023-04-05 19:30:21,184 epoch 148 - iter 2650/2650 - loss 0.02383065 - time (sec): 180.88 - samples/sec: 8084.51 - lr: 0.025000 +2023-04-05 19:30:21,185 ---------------------------------------------------------------------------------------------------- +2023-04-05 19:30:21,185 EPOCH 148 done: loss 0.0238 - lr 0.025000 +2023-04-05 19:30:21,185 BAD EPOCHS (no improvement): 0 +2023-04-05 19:30:21,188 ---------------------------------------------------------------------------------------------------- +2023-04-05 19:30:40,121 epoch 149 - iter 265/2650 - loss 0.02313986 - time (sec): 18.93 - samples/sec: 7805.65 - lr: 0.025000 +2023-04-05 19:30:57,847 epoch 149 - iter 530/2650 - loss 0.02365756 - time (sec): 36.66 - samples/sec: 8013.59 - lr: 0.025000 +2023-04-05 19:31:15,940 epoch 149 - iter 795/2650 - loss 0.02327459 - time (sec): 54.75 - samples/sec: 8040.37 - lr: 0.025000 +2023-04-05 19:31:33,741 epoch 149 - iter 1060/2650 - loss 0.02334346 - time (sec): 72.55 - samples/sec: 8084.61 - lr: 0.025000 +2023-04-05 19:31:51,559 epoch 149 - iter 1325/2650 - loss 0.02344555 - time (sec): 90.37 - samples/sec: 8109.15 - lr: 0.025000 +2023-04-05 19:32:09,570 epoch 149 - iter 1590/2650 - loss 0.02343850 - time (sec): 108.38 - samples/sec: 8098.97 - lr: 0.025000 +2023-04-05 19:32:27,913 epoch 149 - iter 1855/2650 - loss 0.02355669 - time (sec): 126.72 - samples/sec: 8073.23 - lr: 0.025000 +2023-04-05 19:32:45,667 epoch 149 - iter 2120/2650 - loss 0.02369782 - time (sec): 144.48 - samples/sec: 8092.91 - lr: 0.025000 +2023-04-05 19:33:03,716 epoch 149 - iter 2385/2650 - loss 0.02378899 - time (sec): 162.53 - samples/sec: 8095.20 - lr: 0.025000 +2023-04-05 19:33:21,887 epoch 149 - iter 2650/2650 - loss 0.02373171 - time (sec): 180.70 - samples/sec: 8092.82 - lr: 0.025000 +2023-04-05 19:33:21,888 ---------------------------------------------------------------------------------------------------- +2023-04-05 19:33:21,888 EPOCH 149 done: loss 0.0237 - lr 0.025000 +2023-04-05 19:33:21,888 BAD EPOCHS (no improvement): 0 +2023-04-05 19:33:21,890 ---------------------------------------------------------------------------------------------------- +2023-04-05 19:33:40,397 epoch 150 - iter 265/2650 - loss 0.02347371 - time (sec): 18.51 - samples/sec: 7834.20 - lr: 0.025000 +2023-04-05 19:33:58,754 epoch 150 - iter 530/2650 - loss 0.02398713 - time (sec): 36.86 - samples/sec: 7919.38 - lr: 0.025000 +2023-04-05 19:34:16,630 epoch 150 - iter 795/2650 - loss 0.02438037 - time (sec): 54.74 - samples/sec: 7977.22 - lr: 0.025000 +2023-04-05 19:34:34,610 epoch 150 - iter 1060/2650 - loss 0.02401428 - time (sec): 72.72 - samples/sec: 8049.51 - lr: 0.025000 +2023-04-05 19:34:52,586 epoch 150 - iter 1325/2650 - loss 0.02413249 - time (sec): 90.70 - samples/sec: 8064.24 - lr: 0.025000 +2023-04-05 19:35:10,727 epoch 150 - iter 1590/2650 - loss 0.02403333 - time (sec): 108.84 - samples/sec: 8068.75 - lr: 0.025000 +2023-04-05 19:35:28,366 epoch 150 - iter 1855/2650 - loss 0.02412605 - time (sec): 126.48 - samples/sec: 8096.08 - lr: 0.025000 +2023-04-05 19:35:46,102 epoch 150 - iter 2120/2650 - loss 0.02405604 - time (sec): 144.21 - samples/sec: 8119.56 - lr: 0.025000 +2023-04-05 19:36:04,620 epoch 150 - iter 2385/2650 - loss 0.02408298 - time (sec): 162.73 - samples/sec: 8087.23 - lr: 0.025000 +2023-04-05 19:36:22,702 epoch 150 - iter 2650/2650 - loss 0.02414957 - time (sec): 180.81 - samples/sec: 8087.77 - lr: 0.025000 +2023-04-05 19:36:22,702 ---------------------------------------------------------------------------------------------------- +2023-04-05 19:36:22,702 EPOCH 150 done: loss 0.0241 - lr 0.025000 +2023-04-05 19:36:22,702 BAD EPOCHS (no improvement): 1 +2023-04-05 19:36:28,915 ---------------------------------------------------------------------------------------------------- +2023-04-05 19:36:28,915 Testing using last state of model ... +2023-04-05 19:36:57,391 Evaluating as a multi-label problem: False +2023-04-05 19:36:57,456 0.8903 0.8874 0.8888 0.8192 +2023-04-05 19:36:57,457 +Results: +- F-score (micro) 0.8888 +- F-score (macro) 0.7945 +- Accuracy 0.8192 + +By class: + precision recall f1-score support + + GPE 0.9642 0.9491 0.9566 2240 + PERSON 0.9391 0.9386 0.9389 1988 + ORG 0.8833 0.8897 0.8865 1795 + DATE 0.8519 0.8727 0.8622 1602 + CARDINAL 0.8605 0.8310 0.8455 935 + NORP 0.9318 0.9429 0.9374 841 + PERCENT 0.8879 0.8854 0.8867 349 + MONEY 0.8790 0.8790 0.8790 314 + TIME 0.6484 0.6698 0.6589 212 + ORDINAL 0.7933 0.8462 0.8189 195 + LOC 0.7717 0.7933 0.7824 179 + WORK_OF_ART 0.6323 0.5904 0.6106 166 + FAC 0.7719 0.6519 0.7068 135 + QUANTITY 0.7679 0.8190 0.7926 105 + PRODUCT 0.7246 0.6579 0.6897 76 + EVENT 0.7143 0.6349 0.6723 63 + LAW 0.7097 0.5500 0.6197 40 + LANGUAGE 0.9333 0.6364 0.7568 22 + + micro avg 0.8903 0.8874 0.8888 11257 + macro avg 0.8147 0.7799 0.7945 11257 +weighted avg 0.8901 0.8874 0.8885 11257 + +2023-04-05 19:36:57,457 ----------------------------------------------------------------------------------------------------