diff --git "a/training.log" "b/training.log" --- "a/training.log" +++ "b/training.log" @@ -1,2155 +1,2174 @@ -2019-08-13 18:58:49,095 ---------------------------------------------------------------------------------------------------- -2019-08-13 18:58:49,095 Model: "SequenceTagger( +2023-04-05 22:27:04,698 ---------------------------------------------------------------------------------------------------- +2023-04-05 22:27:04,698 Model: "SequenceTagger( (embeddings): StackedEmbeddings( - (list_embedding_0): WordEmbeddings('fr') + (list_embedding_0): WordEmbeddings( + 'fr' + (embedding): Embedding(1000000, 300) + ) (list_embedding_1): FlairEmbeddings( (lm): LanguageModel( - (drop): Dropout(p=0.5) + (drop): Dropout(p=0.5, inplace=False) (encoder): Embedding(275, 100) (rnn): LSTM(100, 1024) - (decoder): Linear(in_features=1024, out_features=275, bias=True) ) ) (list_embedding_2): FlairEmbeddings( (lm): LanguageModel( - (drop): Dropout(p=0.5) + (drop): Dropout(p=0.5, inplace=False) (encoder): Embedding(275, 100) (rnn): LSTM(100, 1024) - (decoder): Linear(in_features=1024, out_features=275, bias=True) ) ) ) (word_dropout): WordDropout(p=0.05) (locked_dropout): LockedDropout(p=0.5) (embedding2nn): Linear(in_features=2348, out_features=2348, bias=True) - (rnn): LSTM(2348, 256, bidirectional=True) - (linear): Linear(in_features=512, out_features=20, bias=True) + (rnn): LSTM(2348, 256, batch_first=True, bidirectional=True) + (linear): Linear(in_features=512, out_features=19, bias=True) + (loss_function): ViterbiLoss() + (crf): CRF() )" -2019-08-13 18:58:49,096 ---------------------------------------------------------------------------------------------------- -2019-08-13 18:58:49,096 Corpus: "Corpus: 107128 train + 11903 dev + 13226 test sentences" -2019-08-13 18:58:49,096 ---------------------------------------------------------------------------------------------------- -2019-08-13 18:58:49,096 Parameters: -2019-08-13 18:58:49,096 - learning_rate: "0.1" -2019-08-13 18:58:49,096 - mini_batch_size: "32" -2019-08-13 18:58:49,096 - patience: "3" -2019-08-13 18:58:49,096 - anneal_factor: "0.5" -2019-08-13 18:58:49,096 - max_epochs: "150" -2019-08-13 18:58:49,096 - shuffle: "True" -2019-08-13 18:58:49,096 - train_with_dev: "True" -2019-08-13 18:58:49,096 ---------------------------------------------------------------------------------------------------- -2019-08-13 18:58:49,096 Model training base path: "resources/taggers/release-fr-ner-0" -2019-08-13 18:58:49,097 ---------------------------------------------------------------------------------------------------- -2019-08-13 18:58:49,097 Device: cuda:0 -2019-08-13 18:58:49,097 ---------------------------------------------------------------------------------------------------- -2019-08-13 18:58:49,097 Embeddings storage mode: cpu -2019-08-13 18:58:49,097 ---------------------------------------------------------------------------------------------------- -2019-08-13 18:58:50,650 epoch 1 - iter 0/3720 - loss 91.21197510 throughput (samples/sec): 20474.53 -2019-08-13 19:02:13,067 epoch 1 - iter 372/3720 - loss 6.03944552 throughput (samples/sec): 75.52 -2019-08-13 19:04:55,346 epoch 1 - iter 744/3720 - loss 4.35996136 throughput (samples/sec): 76.28 -2019-08-13 19:07:36,816 epoch 1 - iter 1116/3720 - loss 3.65192114 throughput (samples/sec): 77.15 -2019-08-13 19:10:17,432 epoch 1 - iter 1488/3720 - loss 3.24999776 throughput (samples/sec): 77.07 -2019-08-13 19:12:59,942 epoch 1 - iter 1860/3720 - loss 2.96708947 throughput (samples/sec): 76.96 -2019-08-13 19:15:45,799 epoch 1 - iter 2232/3720 - loss 2.77272936 throughput (samples/sec): 74.85 -2019-08-13 19:18:29,554 epoch 1 - iter 2604/3720 - loss 2.61904597 throughput (samples/sec): 75.90 -2019-08-13 19:21:13,223 epoch 1 - iter 2976/3720 - loss 2.50279954 throughput (samples/sec): 76.20 -2019-08-13 19:23:54,459 epoch 1 - iter 3348/3720 - loss 2.40538508 throughput (samples/sec): 77.41 -2019-08-13 19:26:37,785 ---------------------------------------------------------------------------------------------------- -2019-08-13 19:26:37,785 EPOCH 1 done: loss 2.3183 - lr 0.1000 -2019-08-13 19:26:37,785 BAD EPOCHS (no improvement): 0 -2019-08-13 19:26:37,785 ---------------------------------------------------------------------------------------------------- -2019-08-13 19:26:39,528 epoch 2 - iter 0/3720 - loss 1.57799530 throughput (samples/sec): 24435.89 -2019-08-13 19:29:24,873 epoch 2 - iter 372/3720 - loss 1.54384129 throughput (samples/sec): 74.81 -2019-08-13 19:32:08,624 epoch 2 - iter 744/3720 - loss 1.52844398 throughput (samples/sec): 75.15 -2019-08-13 19:34:53,742 epoch 2 - iter 1116/3720 - loss 1.52084822 throughput (samples/sec): 74.42 -2019-08-13 19:37:39,363 epoch 2 - iter 1488/3720 - loss 1.50126231 throughput (samples/sec): 74.77 -2019-08-13 19:40:22,833 epoch 2 - iter 1860/3720 - loss 1.48376010 throughput (samples/sec): 75.50 -2019-08-13 19:43:06,424 epoch 2 - iter 2232/3720 - loss 1.47907364 throughput (samples/sec): 75.96 -2019-08-13 19:45:50,043 epoch 2 - iter 2604/3720 - loss 1.46799953 throughput (samples/sec): 76.40 -2019-08-13 19:48:34,100 epoch 2 - iter 2976/3720 - loss 1.46162405 throughput (samples/sec): 75.66 -2019-08-13 19:51:18,032 epoch 2 - iter 3348/3720 - loss 1.44787336 throughput (samples/sec): 76.20 -2019-08-13 19:54:00,139 ---------------------------------------------------------------------------------------------------- -2019-08-13 19:54:00,139 EPOCH 2 done: loss 1.4398 - lr 0.1000 -2019-08-13 19:54:00,139 BAD EPOCHS (no improvement): 0 -2019-08-13 19:54:00,139 ---------------------------------------------------------------------------------------------------- -2019-08-13 19:54:02,014 epoch 3 - iter 0/3720 - loss 2.14483953 throughput (samples/sec): 18769.78 -2019-08-13 19:56:47,516 epoch 3 - iter 372/3720 - loss 1.34348108 throughput (samples/sec): 74.95 -2019-08-13 19:59:30,155 epoch 3 - iter 744/3720 - loss 1.33043544 throughput (samples/sec): 76.68 -2019-08-13 20:02:13,510 epoch 3 - iter 1116/3720 - loss 1.33131669 throughput (samples/sec): 76.37 -2019-08-13 20:04:53,962 epoch 3 - iter 1488/3720 - loss 1.32399288 throughput (samples/sec): 77.56 -2019-08-13 20:07:38,128 epoch 3 - iter 1860/3720 - loss 1.32004507 throughput (samples/sec): 75.22 -2019-08-13 20:10:22,937 epoch 3 - iter 2232/3720 - loss 1.31486852 throughput (samples/sec): 74.95 -2019-08-13 20:13:05,005 epoch 3 - iter 2604/3720 - loss 1.30578636 throughput (samples/sec): 76.79 -2019-08-13 20:15:45,992 epoch 3 - iter 2976/3720 - loss 1.30191243 throughput (samples/sec): 77.03 -2019-08-13 20:18:28,443 epoch 3 - iter 3348/3720 - loss 1.29604418 throughput (samples/sec): 76.30 -2019-08-13 20:21:10,497 ---------------------------------------------------------------------------------------------------- -2019-08-13 20:21:10,498 EPOCH 3 done: loss 1.2916 - lr 0.1000 -2019-08-13 20:21:10,498 BAD EPOCHS (no improvement): 0 -2019-08-13 20:21:10,498 ---------------------------------------------------------------------------------------------------- -2019-08-13 20:21:13,275 epoch 4 - iter 0/3720 - loss 1.67985451 throughput (samples/sec): 22921.16 -2019-08-13 20:23:56,448 epoch 4 - iter 372/3720 - loss 1.22704571 throughput (samples/sec): 76.44 -2019-08-13 20:26:39,912 epoch 4 - iter 744/3720 - loss 1.22211817 throughput (samples/sec): 76.32 -2019-08-13 20:29:23,470 epoch 4 - iter 1116/3720 - loss 1.22444775 throughput (samples/sec): 76.35 -2019-08-13 20:32:09,139 epoch 4 - iter 1488/3720 - loss 1.22435886 throughput (samples/sec): 75.34 -2019-08-13 20:34:52,409 epoch 4 - iter 1860/3720 - loss 1.21883197 throughput (samples/sec): 75.38 -2019-08-13 20:37:37,735 epoch 4 - iter 2232/3720 - loss 1.21631644 throughput (samples/sec): 74.32 -2019-08-13 20:40:20,773 epoch 4 - iter 2604/3720 - loss 1.21628497 throughput (samples/sec): 75.90 -2019-08-13 20:43:04,562 epoch 4 - iter 2976/3720 - loss 1.21689057 throughput (samples/sec): 75.80 -2019-08-13 20:45:48,537 epoch 4 - iter 3348/3720 - loss 1.21100797 throughput (samples/sec): 75.82 -2019-08-13 20:48:33,835 ---------------------------------------------------------------------------------------------------- -2019-08-13 20:48:33,835 EPOCH 4 done: loss 1.2084 - lr 0.1000 -2019-08-13 20:48:33,835 BAD EPOCHS (no improvement): 0 -2019-08-13 20:48:33,835 ---------------------------------------------------------------------------------------------------- -2019-08-13 20:48:35,733 epoch 5 - iter 0/3720 - loss 0.92300105 throughput (samples/sec): 18594.63 -2019-08-13 20:51:20,801 epoch 5 - iter 372/3720 - loss 1.18752395 throughput (samples/sec): 75.40 -2019-08-13 20:54:02,964 epoch 5 - iter 744/3720 - loss 1.15851272 throughput (samples/sec): 76.19 -2019-08-13 20:56:47,638 epoch 5 - iter 1116/3720 - loss 1.15466104 throughput (samples/sec): 75.26 -2019-08-13 20:59:31,404 epoch 5 - iter 1488/3720 - loss 1.15777809 throughput (samples/sec): 75.49 -2019-08-13 21:02:14,924 epoch 5 - iter 1860/3720 - loss 1.15232521 throughput (samples/sec): 75.65 -2019-08-13 21:04:57,773 epoch 5 - iter 2232/3720 - loss 1.15050962 throughput (samples/sec): 76.78 -2019-08-13 21:07:36,922 epoch 5 - iter 2604/3720 - loss 1.14734927 throughput (samples/sec): 77.63 -2019-08-13 21:10:20,454 epoch 5 - iter 2976/3720 - loss 1.14473413 throughput (samples/sec): 75.25 -2019-08-13 21:13:02,761 epoch 5 - iter 3348/3720 - loss 1.14154578 throughput (samples/sec): 76.05 -2019-08-13 21:15:44,989 ---------------------------------------------------------------------------------------------------- -2019-08-13 21:15:44,990 EPOCH 5 done: loss 1.1411 - lr 0.1000 -2019-08-13 21:15:44,990 BAD EPOCHS (no improvement): 0 -2019-08-13 21:15:44,990 ---------------------------------------------------------------------------------------------------- -2019-08-13 21:15:46,872 epoch 6 - iter 0/3720 - loss 0.59046555 throughput (samples/sec): 19240.05 -2019-08-13 21:18:28,386 epoch 6 - iter 372/3720 - loss 1.12638468 throughput (samples/sec): 76.74 -2019-08-13 21:21:13,916 epoch 6 - iter 744/3720 - loss 1.10906654 throughput (samples/sec): 75.66 -2019-08-13 21:23:58,102 epoch 6 - iter 1116/3720 - loss 1.11341810 throughput (samples/sec): 75.21 -2019-08-13 21:26:41,532 epoch 6 - iter 1488/3720 - loss 1.11075304 throughput (samples/sec): 76.64 -2019-08-13 21:29:25,845 epoch 6 - iter 1860/3720 - loss 1.10595691 throughput (samples/sec): 75.25 -2019-08-13 21:32:07,450 epoch 6 - iter 2232/3720 - loss 1.10704256 throughput (samples/sec): 76.88 -2019-08-13 21:34:52,293 epoch 6 - iter 2604/3720 - loss 1.10595910 throughput (samples/sec): 74.81 -2019-08-13 21:37:34,248 epoch 6 - iter 2976/3720 - loss 1.10244406 throughput (samples/sec): 76.45 -2019-08-13 21:40:14,606 epoch 6 - iter 3348/3720 - loss 1.10025130 throughput (samples/sec): 76.92 -2019-08-13 21:42:55,871 ---------------------------------------------------------------------------------------------------- -2019-08-13 21:42:55,871 EPOCH 6 done: loss 1.0990 - lr 0.1000 -2019-08-13 21:42:55,871 BAD EPOCHS (no improvement): 0 -2019-08-13 21:42:55,871 ---------------------------------------------------------------------------------------------------- -2019-08-13 21:42:57,729 epoch 7 - iter 0/3720 - loss 0.78231239 throughput (samples/sec): 19149.71 -2019-08-13 21:45:43,312 epoch 7 - iter 372/3720 - loss 1.05618075 throughput (samples/sec): 74.86 -2019-08-13 21:48:27,646 epoch 7 - iter 744/3720 - loss 1.03894488 throughput (samples/sec): 75.57 -2019-08-13 21:51:11,909 epoch 7 - iter 1116/3720 - loss 1.04166590 throughput (samples/sec): 75.44 -2019-08-13 21:53:53,932 epoch 7 - iter 1488/3720 - loss 1.04780377 throughput (samples/sec): 76.46 -2019-08-13 21:56:35,515 epoch 7 - iter 1860/3720 - loss 1.05445897 throughput (samples/sec): 76.84 -2019-08-13 21:59:19,479 epoch 7 - iter 2232/3720 - loss 1.05508658 throughput (samples/sec): 75.42 -2019-08-13 22:02:01,314 epoch 7 - iter 2604/3720 - loss 1.05646944 throughput (samples/sec): 76.80 -2019-08-13 22:04:43,146 epoch 7 - iter 2976/3720 - loss 1.05800105 throughput (samples/sec): 75.99 -2019-08-13 22:07:24,923 epoch 7 - iter 3348/3720 - loss 1.06036160 throughput (samples/sec): 76.06 -2019-08-13 22:10:08,274 ---------------------------------------------------------------------------------------------------- -2019-08-13 22:10:08,274 EPOCH 7 done: loss 1.0613 - lr 0.1000 -2019-08-13 22:10:08,274 BAD EPOCHS (no improvement): 0 -2019-08-13 22:10:08,274 ---------------------------------------------------------------------------------------------------- -2019-08-13 22:10:10,151 epoch 8 - iter 0/3720 - loss 0.79907465 throughput (samples/sec): 17828.75 -2019-08-13 22:12:55,889 epoch 8 - iter 372/3720 - loss 1.02021535 throughput (samples/sec): 75.32 -2019-08-13 22:15:39,647 epoch 8 - iter 744/3720 - loss 1.01429406 throughput (samples/sec): 76.41 -2019-08-13 22:18:21,339 epoch 8 - iter 1116/3720 - loss 1.02016154 throughput (samples/sec): 76.92 -2019-08-13 22:21:03,927 epoch 8 - iter 1488/3720 - loss 1.01747553 throughput (samples/sec): 76.47 -2019-08-13 22:23:45,136 epoch 8 - iter 1860/3720 - loss 1.02165423 throughput (samples/sec): 76.83 -2019-08-13 22:26:25,618 epoch 8 - iter 2232/3720 - loss 1.02173991 throughput (samples/sec): 76.87 -2019-08-13 22:29:06,379 epoch 8 - iter 2604/3720 - loss 1.02723906 throughput (samples/sec): 77.06 -2019-08-13 22:31:48,954 epoch 8 - iter 2976/3720 - loss 1.02652237 throughput (samples/sec): 76.15 -2019-08-13 22:34:30,735 epoch 8 - iter 3348/3720 - loss 1.02871312 throughput (samples/sec): 77.06 -2019-08-13 22:37:15,357 ---------------------------------------------------------------------------------------------------- -2019-08-13 22:37:15,358 EPOCH 8 done: loss 1.0287 - lr 0.1000 -2019-08-13 22:37:15,358 BAD EPOCHS (no improvement): 0 -2019-08-13 22:37:15,358 ---------------------------------------------------------------------------------------------------- -2019-08-13 22:37:17,072 epoch 9 - iter 0/3720 - loss 1.54383945 throughput (samples/sec): 23898.30 -2019-08-13 22:40:01,867 epoch 9 - iter 372/3720 - loss 0.99026319 throughput (samples/sec): 75.30 -2019-08-13 22:42:42,095 epoch 9 - iter 744/3720 - loss 0.99275502 throughput (samples/sec): 77.87 -2019-08-13 22:45:23,851 epoch 9 - iter 1116/3720 - loss 0.99986905 throughput (samples/sec): 76.17 -2019-08-13 22:48:07,539 epoch 9 - iter 1488/3720 - loss 0.99818515 throughput (samples/sec): 75.97 -2019-08-13 22:50:50,310 epoch 9 - iter 1860/3720 - loss 1.00212036 throughput (samples/sec): 76.34 -2019-08-13 22:53:32,732 epoch 9 - iter 2232/3720 - loss 1.00791586 throughput (samples/sec): 76.08 -2019-08-13 22:56:15,914 epoch 9 - iter 2604/3720 - loss 1.00602238 throughput (samples/sec): 76.46 -2019-08-13 22:58:57,515 epoch 9 - iter 2976/3720 - loss 1.00890544 throughput (samples/sec): 76.73 -2019-08-13 23:01:38,814 epoch 9 - iter 3348/3720 - loss 1.00935457 throughput (samples/sec): 77.14 -2019-08-13 23:04:18,730 ---------------------------------------------------------------------------------------------------- -2019-08-13 23:04:18,731 EPOCH 9 done: loss 1.0086 - lr 0.1000 -2019-08-13 23:04:18,731 BAD EPOCHS (no improvement): 0 -2019-08-13 23:04:18,731 ---------------------------------------------------------------------------------------------------- -2019-08-13 23:04:20,448 epoch 10 - iter 0/3720 - loss 0.54354835 throughput (samples/sec): 25978.98 -2019-08-13 23:07:06,556 epoch 10 - iter 372/3720 - loss 0.97160648 throughput (samples/sec): 75.59 -2019-08-13 23:09:53,146 epoch 10 - iter 744/3720 - loss 0.97667281 throughput (samples/sec): 74.51 -2019-08-13 23:12:36,864 epoch 10 - iter 1116/3720 - loss 0.97703779 throughput (samples/sec): 75.42 -2019-08-13 23:15:21,497 epoch 10 - iter 1488/3720 - loss 0.97892870 throughput (samples/sec): 75.77 -2019-08-13 23:18:04,692 epoch 10 - iter 1860/3720 - loss 0.98750832 throughput (samples/sec): 76.16 -2019-08-13 23:20:49,036 epoch 10 - iter 2232/3720 - loss 0.98789930 throughput (samples/sec): 75.35 -2019-08-13 23:23:32,339 epoch 10 - iter 2604/3720 - loss 0.98878771 throughput (samples/sec): 75.60 -2019-08-13 23:26:15,360 epoch 10 - iter 2976/3720 - loss 0.98579501 throughput (samples/sec): 76.02 -2019-08-13 23:28:59,022 epoch 10 - iter 3348/3720 - loss 0.98923598 throughput (samples/sec): 75.75 -2019-08-13 23:31:39,949 ---------------------------------------------------------------------------------------------------- -2019-08-13 23:31:39,949 EPOCH 10 done: loss 0.9893 - lr 0.1000 -2019-08-13 23:31:39,949 BAD EPOCHS (no improvement): 0 -2019-08-13 23:31:39,949 ---------------------------------------------------------------------------------------------------- -2019-08-13 23:31:41,758 epoch 11 - iter 0/3720 - loss 1.71541357 throughput (samples/sec): 21404.68 -2019-08-13 23:34:28,043 epoch 11 - iter 372/3720 - loss 0.97309590 throughput (samples/sec): 74.99 -2019-08-13 23:37:13,745 epoch 11 - iter 744/3720 - loss 0.96514806 throughput (samples/sec): 74.98 -2019-08-13 23:39:56,825 epoch 11 - iter 1116/3720 - loss 0.96421487 throughput (samples/sec): 75.66 -2019-08-13 23:42:38,798 epoch 11 - iter 1488/3720 - loss 0.96743654 throughput (samples/sec): 76.94 -2019-08-13 23:45:20,065 epoch 11 - iter 1860/3720 - loss 0.96716123 throughput (samples/sec): 77.00 -2019-08-13 23:48:02,767 epoch 11 - iter 2232/3720 - loss 0.97033008 throughput (samples/sec): 75.58 -2019-08-13 23:50:44,012 epoch 11 - iter 2604/3720 - loss 0.97098882 throughput (samples/sec): 77.06 -2019-08-13 23:53:27,655 epoch 11 - iter 2976/3720 - loss 0.97129229 throughput (samples/sec): 75.68 -2019-08-13 23:56:09,219 epoch 11 - iter 3348/3720 - loss 0.96964412 throughput (samples/sec): 76.98 -2019-08-13 23:58:50,919 ---------------------------------------------------------------------------------------------------- -2019-08-13 23:58:50,919 EPOCH 11 done: loss 0.9717 - lr 0.1000 -2019-08-13 23:58:50,919 BAD EPOCHS (no improvement): 0 -2019-08-13 23:58:50,919 ---------------------------------------------------------------------------------------------------- -2019-08-13 23:58:52,876 epoch 12 - iter 0/3720 - loss 1.19521618 throughput (samples/sec): 17288.35 -2019-08-14 00:01:36,010 epoch 12 - iter 372/3720 - loss 0.98252318 throughput (samples/sec): 75.66 -2019-08-14 00:04:17,750 epoch 12 - iter 744/3720 - loss 0.95471967 throughput (samples/sec): 76.35 -2019-08-14 00:06:59,529 epoch 12 - iter 1116/3720 - loss 0.95255668 throughput (samples/sec): 77.03 -2019-08-14 00:09:43,154 epoch 12 - iter 1488/3720 - loss 0.95419802 throughput (samples/sec): 75.62 -2019-08-14 00:12:23,567 epoch 12 - iter 1860/3720 - loss 0.95946174 throughput (samples/sec): 76.89 -2019-08-14 00:15:04,806 epoch 12 - iter 2232/3720 - loss 0.95893017 throughput (samples/sec): 76.52 -2019-08-14 00:17:46,604 epoch 12 - iter 2604/3720 - loss 0.95535940 throughput (samples/sec): 76.45 -2019-08-14 00:20:26,365 epoch 12 - iter 2976/3720 - loss 0.95355625 throughput (samples/sec): 78.10 -2019-08-14 00:23:07,499 epoch 12 - iter 3348/3720 - loss 0.95700808 throughput (samples/sec): 77.00 -2019-08-14 00:25:49,287 ---------------------------------------------------------------------------------------------------- -2019-08-14 00:25:49,287 EPOCH 12 done: loss 0.9578 - lr 0.1000 -2019-08-14 00:25:49,287 BAD EPOCHS (no improvement): 0 -2019-08-14 00:25:49,288 ---------------------------------------------------------------------------------------------------- -2019-08-14 00:25:51,284 epoch 13 - iter 0/3720 - loss 1.14242172 throughput (samples/sec): 15707.75 -2019-08-14 00:28:34,910 epoch 13 - iter 372/3720 - loss 0.94083283 throughput (samples/sec): 76.02 -2019-08-14 00:31:15,848 epoch 13 - iter 744/3720 - loss 0.94413036 throughput (samples/sec): 76.95 -2019-08-14 00:33:55,764 epoch 13 - iter 1116/3720 - loss 0.94754352 throughput (samples/sec): 77.39 -2019-08-14 00:36:38,196 epoch 13 - iter 1488/3720 - loss 0.94510976 throughput (samples/sec): 75.95 -2019-08-14 00:39:19,227 epoch 13 - iter 1860/3720 - loss 0.94038974 throughput (samples/sec): 77.41 -2019-08-14 00:42:02,024 epoch 13 - iter 2232/3720 - loss 0.94279201 throughput (samples/sec): 76.65 -2019-08-14 00:44:44,512 epoch 13 - iter 2604/3720 - loss 0.93998889 throughput (samples/sec): 76.30 -2019-08-14 00:47:26,558 epoch 13 - iter 2976/3720 - loss 0.94200607 throughput (samples/sec): 76.91 -2019-08-14 00:50:08,640 epoch 13 - iter 3348/3720 - loss 0.94085778 throughput (samples/sec): 76.17 -2019-08-14 00:52:51,654 ---------------------------------------------------------------------------------------------------- -2019-08-14 00:52:51,654 EPOCH 13 done: loss 0.9409 - lr 0.1000 -2019-08-14 00:52:51,654 BAD EPOCHS (no improvement): 0 -2019-08-14 00:52:51,654 ---------------------------------------------------------------------------------------------------- -2019-08-14 00:52:53,378 epoch 14 - iter 0/3720 - loss 0.81392503 throughput (samples/sec): 24579.42 -2019-08-14 00:55:35,287 epoch 14 - iter 372/3720 - loss 0.91903556 throughput (samples/sec): 76.55 -2019-08-14 00:58:16,480 epoch 14 - iter 744/3720 - loss 0.94080189 throughput (samples/sec): 77.06 -2019-08-14 01:01:00,288 epoch 14 - iter 1116/3720 - loss 0.93238526 throughput (samples/sec): 75.34 -2019-08-14 01:03:41,870 epoch 14 - iter 1488/3720 - loss 0.92870163 throughput (samples/sec): 76.62 -2019-08-14 01:06:25,520 epoch 14 - iter 1860/3720 - loss 0.92876025 throughput (samples/sec): 75.63 -2019-08-14 01:09:06,791 epoch 14 - iter 2232/3720 - loss 0.92989168 throughput (samples/sec): 76.78 -2019-08-14 01:11:48,045 epoch 14 - iter 2604/3720 - loss 0.92849175 throughput (samples/sec): 76.99 -2019-08-14 01:14:30,884 epoch 14 - iter 2976/3720 - loss 0.92729899 throughput (samples/sec): 76.24 -2019-08-14 01:17:14,082 epoch 14 - iter 3348/3720 - loss 0.92745444 throughput (samples/sec): 76.30 -2019-08-14 01:19:55,393 ---------------------------------------------------------------------------------------------------- -2019-08-14 01:19:55,393 EPOCH 14 done: loss 0.9293 - lr 0.1000 -2019-08-14 01:19:55,393 BAD EPOCHS (no improvement): 0 -2019-08-14 01:19:55,393 ---------------------------------------------------------------------------------------------------- -2019-08-14 01:19:57,116 epoch 15 - iter 0/3720 - loss 0.69200444 throughput (samples/sec): 24575.21 -2019-08-14 01:22:40,848 epoch 15 - iter 372/3720 - loss 0.87021296 throughput (samples/sec): 76.01 -2019-08-14 01:25:22,036 epoch 15 - iter 744/3720 - loss 0.89341479 throughput (samples/sec): 77.06 -2019-08-14 01:28:05,002 epoch 15 - iter 1116/3720 - loss 0.90486783 throughput (samples/sec): 75.92 -2019-08-14 01:30:50,776 epoch 15 - iter 1488/3720 - loss 0.90281475 throughput (samples/sec): 74.98 -2019-08-14 01:33:33,813 epoch 15 - iter 1860/3720 - loss 0.90388144 throughput (samples/sec): 76.28 -2019-08-14 01:36:17,687 epoch 15 - iter 2232/3720 - loss 0.90626740 throughput (samples/sec): 74.77 -2019-08-14 01:39:02,823 epoch 15 - iter 2604/3720 - loss 0.91288618 throughput (samples/sec): 74.88 -2019-08-14 01:41:46,848 epoch 15 - iter 2976/3720 - loss 0.91322998 throughput (samples/sec): 75.46 -2019-08-14 01:44:29,628 epoch 15 - iter 3348/3720 - loss 0.91679663 throughput (samples/sec): 76.12 -2019-08-14 01:47:12,447 ---------------------------------------------------------------------------------------------------- -2019-08-14 01:47:12,448 EPOCH 15 done: loss 0.9173 - lr 0.1000 -2019-08-14 01:47:12,448 BAD EPOCHS (no improvement): 0 -2019-08-14 01:47:12,448 ---------------------------------------------------------------------------------------------------- -2019-08-14 01:47:14,096 epoch 16 - iter 0/3720 - loss 1.07109630 throughput (samples/sec): 27339.07 -2019-08-14 01:49:58,206 epoch 16 - iter 372/3720 - loss 0.89986635 throughput (samples/sec): 75.54 -2019-08-14 01:52:42,176 epoch 16 - iter 744/3720 - loss 0.91058799 throughput (samples/sec): 75.13 -2019-08-14 01:55:25,576 epoch 16 - iter 1116/3720 - loss 0.91115278 throughput (samples/sec): 75.98 -2019-08-14 01:58:07,971 epoch 16 - iter 1488/3720 - loss 0.90940078 throughput (samples/sec): 76.46 -2019-08-14 02:00:50,598 epoch 16 - iter 1860/3720 - loss 0.91045797 throughput (samples/sec): 75.87 -2019-08-14 02:03:32,212 epoch 16 - iter 2232/3720 - loss 0.90492424 throughput (samples/sec): 76.30 -2019-08-14 02:06:14,025 epoch 16 - iter 2604/3720 - loss 0.90600889 throughput (samples/sec): 76.22 -2019-08-14 02:08:53,848 epoch 16 - iter 2976/3720 - loss 0.90470113 throughput (samples/sec): 77.01 -2019-08-14 02:11:33,193 epoch 16 - iter 3348/3720 - loss 0.90386628 throughput (samples/sec): 77.81 -2019-08-14 02:14:12,175 ---------------------------------------------------------------------------------------------------- -2019-08-14 02:14:12,175 EPOCH 16 done: loss 0.9044 - lr 0.1000 -2019-08-14 02:14:12,175 BAD EPOCHS (no improvement): 0 -2019-08-14 02:14:12,175 ---------------------------------------------------------------------------------------------------- -2019-08-14 02:14:13,939 epoch 17 - iter 0/3720 - loss 1.39257133 throughput (samples/sec): 22867.61 -2019-08-14 02:16:56,948 epoch 17 - iter 372/3720 - loss 0.88840501 throughput (samples/sec): 76.47 -2019-08-14 02:19:39,428 epoch 17 - iter 744/3720 - loss 0.90196937 throughput (samples/sec): 76.52 -2019-08-14 02:22:21,193 epoch 17 - iter 1116/3720 - loss 0.89924286 throughput (samples/sec): 76.29 -2019-08-14 02:25:04,712 epoch 17 - iter 1488/3720 - loss 0.89873712 throughput (samples/sec): 75.67 -2019-08-14 02:27:47,336 epoch 17 - iter 1860/3720 - loss 0.89753252 throughput (samples/sec): 76.07 -2019-08-14 02:30:28,639 epoch 17 - iter 2232/3720 - loss 0.89235412 throughput (samples/sec): 77.01 -2019-08-14 02:33:08,568 epoch 17 - iter 2604/3720 - loss 0.89477245 throughput (samples/sec): 77.70 -2019-08-14 02:35:52,553 epoch 17 - iter 2976/3720 - loss 0.89297815 throughput (samples/sec): 75.31 -2019-08-14 02:38:39,137 epoch 17 - iter 3348/3720 - loss 0.89872619 throughput (samples/sec): 73.87 -2019-08-14 02:41:22,983 ---------------------------------------------------------------------------------------------------- -2019-08-14 02:41:22,984 EPOCH 17 done: loss 0.8985 - lr 0.1000 -2019-08-14 02:41:22,984 BAD EPOCHS (no improvement): 0 -2019-08-14 02:41:22,984 ---------------------------------------------------------------------------------------------------- -2019-08-14 02:41:24,723 epoch 18 - iter 0/3720 - loss 0.77083921 throughput (samples/sec): 22843.28 -2019-08-14 02:44:10,166 epoch 18 - iter 372/3720 - loss 0.89290454 throughput (samples/sec): 75.18 -2019-08-14 02:46:53,299 epoch 18 - iter 744/3720 - loss 0.89591612 throughput (samples/sec): 76.36 -2019-08-14 02:49:35,312 epoch 18 - iter 1116/3720 - loss 0.89517852 throughput (samples/sec): 76.84 -2019-08-14 02:52:17,788 epoch 18 - iter 1488/3720 - loss 0.88962467 throughput (samples/sec): 76.33 -2019-08-14 02:54:59,886 epoch 18 - iter 1860/3720 - loss 0.88495676 throughput (samples/sec): 76.82 -2019-08-14 02:57:41,882 epoch 18 - iter 2232/3720 - loss 0.88084732 throughput (samples/sec): 76.28 -2019-08-14 03:00:23,570 epoch 18 - iter 2604/3720 - loss 0.88222906 throughput (samples/sec): 76.60 -2019-08-14 03:03:06,645 epoch 18 - iter 2976/3720 - loss 0.88234441 throughput (samples/sec): 75.86 -2019-08-14 03:05:50,314 epoch 18 - iter 3348/3720 - loss 0.88361001 throughput (samples/sec): 75.66 -2019-08-14 03:08:35,083 ---------------------------------------------------------------------------------------------------- -2019-08-14 03:08:35,083 EPOCH 18 done: loss 0.8856 - lr 0.1000 -2019-08-14 03:08:35,084 BAD EPOCHS (no improvement): 0 -2019-08-14 03:08:35,084 ---------------------------------------------------------------------------------------------------- -2019-08-14 03:08:36,890 epoch 19 - iter 0/3720 - loss 0.91424394 throughput (samples/sec): 20508.49 -2019-08-14 03:11:20,286 epoch 19 - iter 372/3720 - loss 0.86451226 throughput (samples/sec): 75.58 -2019-08-14 03:14:01,332 epoch 19 - iter 744/3720 - loss 0.85403174 throughput (samples/sec): 76.72 -2019-08-14 03:16:45,912 epoch 19 - iter 1116/3720 - loss 0.86553135 throughput (samples/sec): 75.94 -2019-08-14 03:19:29,309 epoch 19 - iter 1488/3720 - loss 0.86744107 throughput (samples/sec): 76.06 -2019-08-14 03:22:11,726 epoch 19 - iter 1860/3720 - loss 0.87428269 throughput (samples/sec): 76.56 -2019-08-14 03:24:55,159 epoch 19 - iter 2232/3720 - loss 0.87818835 throughput (samples/sec): 75.23 -2019-08-14 03:27:34,668 epoch 19 - iter 2604/3720 - loss 0.87866181 throughput (samples/sec): 77.91 -2019-08-14 03:30:18,231 epoch 19 - iter 2976/3720 - loss 0.87730281 throughput (samples/sec): 76.12 -2019-08-14 03:33:02,211 epoch 19 - iter 3348/3720 - loss 0.87822849 throughput (samples/sec): 75.46 -2019-08-14 03:35:46,107 ---------------------------------------------------------------------------------------------------- -2019-08-14 03:35:46,108 EPOCH 19 done: loss 0.8803 - lr 0.1000 -2019-08-14 03:35:46,108 BAD EPOCHS (no improvement): 0 -2019-08-14 03:35:46,108 ---------------------------------------------------------------------------------------------------- -2019-08-14 03:35:48,788 epoch 20 - iter 0/3720 - loss 0.39194250 throughput (samples/sec): 30157.01 -2019-08-14 03:38:32,787 epoch 20 - iter 372/3720 - loss 0.84449465 throughput (samples/sec): 75.95 -2019-08-14 03:41:15,042 epoch 20 - iter 744/3720 - loss 0.84312846 throughput (samples/sec): 76.87 -2019-08-14 03:43:57,835 epoch 20 - iter 1116/3720 - loss 0.85822877 throughput (samples/sec): 76.88 -2019-08-14 03:46:43,967 epoch 20 - iter 1488/3720 - loss 0.85624258 throughput (samples/sec): 74.26 -2019-08-14 03:49:27,531 epoch 20 - iter 1860/3720 - loss 0.86289753 throughput (samples/sec): 75.72 -2019-08-14 03:52:11,626 epoch 20 - iter 2232/3720 - loss 0.86702543 throughput (samples/sec): 75.19 -2019-08-14 03:54:55,057 epoch 20 - iter 2604/3720 - loss 0.86897013 throughput (samples/sec): 75.75 -2019-08-14 03:57:38,680 epoch 20 - iter 2976/3720 - loss 0.87110366 throughput (samples/sec): 75.89 -2019-08-14 04:00:21,708 epoch 20 - iter 3348/3720 - loss 0.87295055 throughput (samples/sec): 75.89 -2019-08-14 04:03:03,269 ---------------------------------------------------------------------------------------------------- -2019-08-14 04:03:03,270 EPOCH 20 done: loss 0.8728 - lr 0.1000 -2019-08-14 04:03:03,270 BAD EPOCHS (no improvement): 0 -2019-08-14 04:03:03,270 ---------------------------------------------------------------------------------------------------- -2019-08-14 04:03:05,052 epoch 21 - iter 0/3720 - loss 0.92326999 throughput (samples/sec): 23054.58 -2019-08-14 04:05:51,374 epoch 21 - iter 372/3720 - loss 0.85929792 throughput (samples/sec): 74.90 -2019-08-14 04:08:34,985 epoch 21 - iter 744/3720 - loss 0.86683869 throughput (samples/sec): 75.96 -2019-08-14 04:11:17,942 epoch 21 - iter 1116/3720 - loss 0.87321425 throughput (samples/sec): 75.98 -2019-08-14 04:14:02,191 epoch 21 - iter 1488/3720 - loss 0.87296304 throughput (samples/sec): 75.41 -2019-08-14 04:16:47,665 epoch 21 - iter 1860/3720 - loss 0.87275451 throughput (samples/sec): 74.01 -2019-08-14 04:19:30,648 epoch 21 - iter 2232/3720 - loss 0.87325202 throughput (samples/sec): 75.69 -2019-08-14 04:22:14,447 epoch 21 - iter 2604/3720 - loss 0.87591002 throughput (samples/sec): 75.25 -2019-08-14 04:24:55,822 epoch 21 - iter 2976/3720 - loss 0.87187349 throughput (samples/sec): 76.24 -2019-08-14 04:27:35,669 epoch 21 - iter 3348/3720 - loss 0.87025153 throughput (samples/sec): 77.14 -2019-08-14 04:30:16,603 ---------------------------------------------------------------------------------------------------- -2019-08-14 04:30:16,603 EPOCH 21 done: loss 0.8696 - lr 0.1000 -2019-08-14 04:30:16,603 BAD EPOCHS (no improvement): 0 -2019-08-14 04:30:16,603 ---------------------------------------------------------------------------------------------------- -2019-08-14 04:30:18,400 epoch 22 - iter 0/3720 - loss 0.94426948 throughput (samples/sec): 22017.78 -2019-08-14 04:33:02,883 epoch 22 - iter 372/3720 - loss 0.83010669 throughput (samples/sec): 74.85 -2019-08-14 04:35:42,741 epoch 22 - iter 744/3720 - loss 0.83836981 throughput (samples/sec): 77.53 -2019-08-14 04:38:25,784 epoch 22 - iter 1116/3720 - loss 0.84072291 throughput (samples/sec): 75.87 -2019-08-14 04:41:10,545 epoch 22 - iter 1488/3720 - loss 0.83998939 throughput (samples/sec): 74.64 -2019-08-14 04:43:54,130 epoch 22 - iter 1860/3720 - loss 0.84403272 throughput (samples/sec): 76.22 -2019-08-14 04:46:38,536 epoch 22 - iter 2232/3720 - loss 0.84942158 throughput (samples/sec): 74.80 -2019-08-14 04:49:20,588 epoch 22 - iter 2604/3720 - loss 0.84874437 throughput (samples/sec): 76.22 -2019-08-14 04:52:05,792 epoch 22 - iter 2976/3720 - loss 0.85171919 throughput (samples/sec): 75.04 -2019-08-14 04:54:49,210 epoch 22 - iter 3348/3720 - loss 0.85604964 throughput (samples/sec): 75.56 -2019-08-14 04:57:34,840 ---------------------------------------------------------------------------------------------------- -2019-08-14 04:57:34,840 EPOCH 22 done: loss 0.8578 - lr 0.1000 -2019-08-14 04:57:34,840 BAD EPOCHS (no improvement): 0 -2019-08-14 04:57:34,841 ---------------------------------------------------------------------------------------------------- -2019-08-14 04:57:36,662 epoch 23 - iter 0/3720 - loss 1.06055808 throughput (samples/sec): 20889.12 -2019-08-14 05:00:20,555 epoch 23 - iter 372/3720 - loss 0.84467029 throughput (samples/sec): 75.98 -2019-08-14 05:03:03,854 epoch 23 - iter 744/3720 - loss 0.84243446 throughput (samples/sec): 75.57 -2019-08-14 05:05:47,934 epoch 23 - iter 1116/3720 - loss 0.84262237 throughput (samples/sec): 75.97 -2019-08-14 05:08:33,229 epoch 23 - iter 1488/3720 - loss 0.84324205 throughput (samples/sec): 75.35 -2019-08-14 05:11:14,393 epoch 23 - iter 1860/3720 - loss 0.84156106 throughput (samples/sec): 76.96 -2019-08-14 05:13:55,410 epoch 23 - iter 2232/3720 - loss 0.84222028 throughput (samples/sec): 77.25 -2019-08-14 05:16:38,776 epoch 23 - iter 2604/3720 - loss 0.84328615 throughput (samples/sec): 75.54 -2019-08-14 05:19:20,151 epoch 23 - iter 2976/3720 - loss 0.84247815 throughput (samples/sec): 77.02 -2019-08-14 05:22:01,422 epoch 23 - iter 3348/3720 - loss 0.84689841 throughput (samples/sec): 76.29 -2019-08-14 05:24:44,157 ---------------------------------------------------------------------------------------------------- -2019-08-14 05:24:44,157 EPOCH 23 done: loss 0.8486 - lr 0.1000 -2019-08-14 05:24:44,157 BAD EPOCHS (no improvement): 0 -2019-08-14 05:24:44,158 ---------------------------------------------------------------------------------------------------- -2019-08-14 05:24:45,940 epoch 24 - iter 0/3720 - loss 0.65621853 throughput (samples/sec): 21065.63 -2019-08-14 05:27:27,336 epoch 24 - iter 372/3720 - loss 0.83702164 throughput (samples/sec): 76.83 -2019-08-14 05:30:08,605 epoch 24 - iter 744/3720 - loss 0.84950715 throughput (samples/sec): 77.33 -2019-08-14 05:32:50,482 epoch 24 - iter 1116/3720 - loss 0.84206434 throughput (samples/sec): 76.19 -2019-08-14 05:35:36,302 epoch 24 - iter 1488/3720 - loss 0.84671225 throughput (samples/sec): 75.09 -2019-08-14 05:38:17,424 epoch 24 - iter 1860/3720 - loss 0.84413467 throughput (samples/sec): 76.61 -2019-08-14 05:41:01,027 epoch 24 - iter 2232/3720 - loss 0.84923387 throughput (samples/sec): 76.04 -2019-08-14 05:43:43,257 epoch 24 - iter 2604/3720 - loss 0.85330688 throughput (samples/sec): 76.12 -2019-08-14 05:46:27,495 epoch 24 - iter 2976/3720 - loss 0.85167503 throughput (samples/sec): 74.86 -2019-08-14 05:49:08,628 epoch 24 - iter 3348/3720 - loss 0.85018266 throughput (samples/sec): 76.84 -2019-08-14 05:51:50,101 ---------------------------------------------------------------------------------------------------- -2019-08-14 05:51:50,102 EPOCH 24 done: loss 0.8477 - lr 0.1000 -2019-08-14 05:51:50,102 BAD EPOCHS (no improvement): 0 -2019-08-14 05:51:50,102 ---------------------------------------------------------------------------------------------------- -2019-08-14 05:51:51,847 epoch 25 - iter 0/3720 - loss 0.71347618 throughput (samples/sec): 25118.93 -2019-08-14 05:54:36,446 epoch 25 - iter 372/3720 - loss 0.85991709 throughput (samples/sec): 75.75 -2019-08-14 05:57:17,251 epoch 25 - iter 744/3720 - loss 0.83786292 throughput (samples/sec): 76.51 -2019-08-14 06:00:02,116 epoch 25 - iter 1116/3720 - loss 0.83896540 throughput (samples/sec): 75.86 -2019-08-14 06:02:45,841 epoch 25 - iter 1488/3720 - loss 0.83574753 throughput (samples/sec): 75.58 -2019-08-14 06:05:28,015 epoch 25 - iter 1860/3720 - loss 0.83645074 throughput (samples/sec): 76.24 -2019-08-14 06:08:10,178 epoch 25 - iter 2232/3720 - loss 0.83715705 throughput (samples/sec): 76.30 -2019-08-14 06:10:53,945 epoch 25 - iter 2604/3720 - loss 0.83963187 throughput (samples/sec): 75.39 -2019-08-14 06:13:36,254 epoch 25 - iter 2976/3720 - loss 0.84155767 throughput (samples/sec): 76.36 -2019-08-14 06:16:21,337 epoch 25 - iter 3348/3720 - loss 0.84476661 throughput (samples/sec): 75.26 -2019-08-14 06:19:03,859 ---------------------------------------------------------------------------------------------------- -2019-08-14 06:19:03,859 EPOCH 25 done: loss 0.8433 - lr 0.1000 -2019-08-14 06:19:03,859 BAD EPOCHS (no improvement): 0 -2019-08-14 06:19:03,859 ---------------------------------------------------------------------------------------------------- -2019-08-14 06:19:05,666 epoch 26 - iter 0/3720 - loss 0.88023210 throughput (samples/sec): 21552.83 -2019-08-14 06:21:48,810 epoch 26 - iter 372/3720 - loss 0.84433262 throughput (samples/sec): 75.33 -2019-08-14 06:24:31,596 epoch 26 - iter 744/3720 - loss 0.83719320 throughput (samples/sec): 76.31 -2019-08-14 06:27:13,986 epoch 26 - iter 1116/3720 - loss 0.83290649 throughput (samples/sec): 76.02 -2019-08-14 06:29:54,994 epoch 26 - iter 1488/3720 - loss 0.82956030 throughput (samples/sec): 77.52 -2019-08-14 06:32:36,910 epoch 26 - iter 1860/3720 - loss 0.83034662 throughput (samples/sec): 76.45 -2019-08-14 06:35:22,173 epoch 26 - iter 2232/3720 - loss 0.82507626 throughput (samples/sec): 74.52 -2019-08-14 06:38:07,405 epoch 26 - iter 2604/3720 - loss 0.82648450 throughput (samples/sec): 75.51 -2019-08-14 06:40:51,333 epoch 26 - iter 2976/3720 - loss 0.82981519 throughput (samples/sec): 75.30 -2019-08-14 06:43:32,719 epoch 26 - iter 3348/3720 - loss 0.83140997 throughput (samples/sec): 76.46 -2019-08-14 06:46:17,478 ---------------------------------------------------------------------------------------------------- -2019-08-14 06:46:17,478 EPOCH 26 done: loss 0.8352 - lr 0.1000 -2019-08-14 06:46:17,478 BAD EPOCHS (no improvement): 0 -2019-08-14 06:46:17,478 ---------------------------------------------------------------------------------------------------- -2019-08-14 06:46:19,197 epoch 27 - iter 0/3720 - loss 0.95761752 throughput (samples/sec): 24075.10 -2019-08-14 06:49:03,838 epoch 27 - iter 372/3720 - loss 0.83662980 throughput (samples/sec): 75.05 -2019-08-14 06:51:46,611 epoch 27 - iter 744/3720 - loss 0.83097366 throughput (samples/sec): 76.62 -2019-08-14 06:54:28,903 epoch 27 - iter 1116/3720 - loss 0.83039268 throughput (samples/sec): 76.06 -2019-08-14 06:57:12,072 epoch 27 - iter 1488/3720 - loss 0.83309372 throughput (samples/sec): 75.86 -2019-08-14 06:59:54,970 epoch 27 - iter 1860/3720 - loss 0.83198055 throughput (samples/sec): 75.73 -2019-08-14 07:02:38,197 epoch 27 - iter 2232/3720 - loss 0.83196913 throughput (samples/sec): 75.55 -2019-08-14 07:05:20,915 epoch 27 - iter 2604/3720 - loss 0.83084750 throughput (samples/sec): 76.07 -2019-08-14 07:08:03,801 epoch 27 - iter 2976/3720 - loss 0.83090420 throughput (samples/sec): 75.46 -2019-08-14 07:10:46,067 epoch 27 - iter 3348/3720 - loss 0.83443070 throughput (samples/sec): 75.80 -2019-08-14 07:13:28,140 ---------------------------------------------------------------------------------------------------- -2019-08-14 07:13:28,141 EPOCH 27 done: loss 0.8340 - lr 0.1000 -2019-08-14 07:13:28,141 BAD EPOCHS (no improvement): 0 -2019-08-14 07:13:28,141 ---------------------------------------------------------------------------------------------------- -2019-08-14 07:13:29,878 epoch 28 - iter 0/3720 - loss 0.51765800 throughput (samples/sec): 24554.67 -2019-08-14 07:16:12,568 epoch 28 - iter 372/3720 - loss 0.81007848 throughput (samples/sec): 76.31 -2019-08-14 07:18:55,328 epoch 28 - iter 744/3720 - loss 0.82560806 throughput (samples/sec): 76.31 -2019-08-14 07:21:35,191 epoch 28 - iter 1116/3720 - loss 0.82835809 throughput (samples/sec): 77.23 -2019-08-14 07:24:18,629 epoch 28 - iter 1488/3720 - loss 0.82863870 throughput (samples/sec): 75.76 -2019-08-14 07:27:01,390 epoch 28 - iter 1860/3720 - loss 0.82668303 throughput (samples/sec): 76.09 -2019-08-14 07:29:43,626 epoch 28 - iter 2232/3720 - loss 0.82357014 throughput (samples/sec): 76.08 -2019-08-14 07:32:25,667 epoch 28 - iter 2604/3720 - loss 0.82544531 throughput (samples/sec): 76.72 -2019-08-14 07:35:08,241 epoch 28 - iter 2976/3720 - loss 0.82434317 throughput (samples/sec): 76.16 -2019-08-14 07:37:48,847 epoch 28 - iter 3348/3720 - loss 0.82709103 throughput (samples/sec): 77.15 -2019-08-14 07:40:30,475 ---------------------------------------------------------------------------------------------------- -2019-08-14 07:40:30,475 EPOCH 28 done: loss 0.8277 - lr 0.1000 -2019-08-14 07:40:30,475 BAD EPOCHS (no improvement): 0 -2019-08-14 07:40:30,476 ---------------------------------------------------------------------------------------------------- -2019-08-14 07:40:32,213 epoch 29 - iter 0/3720 - loss 1.31668711 throughput (samples/sec): 23044.76 -2019-08-14 07:43:14,658 epoch 29 - iter 372/3720 - loss 0.79486934 throughput (samples/sec): 76.46 -2019-08-14 07:45:56,633 epoch 29 - iter 744/3720 - loss 0.80516469 throughput (samples/sec): 76.35 -2019-08-14 07:48:40,786 epoch 29 - iter 1116/3720 - loss 0.80079043 throughput (samples/sec): 76.06 -2019-08-14 07:51:25,742 epoch 29 - iter 1488/3720 - loss 0.80786399 throughput (samples/sec): 74.92 -2019-08-14 07:54:06,967 epoch 29 - iter 1860/3720 - loss 0.81289379 throughput (samples/sec): 77.25 -2019-08-14 07:56:52,179 epoch 29 - iter 2232/3720 - loss 0.81925074 throughput (samples/sec): 75.05 -2019-08-14 07:59:33,585 epoch 29 - iter 2604/3720 - loss 0.82022979 throughput (samples/sec): 77.24 -2019-08-14 08:02:15,998 epoch 29 - iter 2976/3720 - loss 0.82210416 throughput (samples/sec): 76.28 -2019-08-14 08:04:58,708 epoch 29 - iter 3348/3720 - loss 0.82183504 throughput (samples/sec): 75.83 -2019-08-14 08:07:37,739 ---------------------------------------------------------------------------------------------------- -2019-08-14 08:07:37,739 EPOCH 29 done: loss 0.8233 - lr 0.1000 -2019-08-14 08:07:37,739 BAD EPOCHS (no improvement): 0 -2019-08-14 08:07:37,739 ---------------------------------------------------------------------------------------------------- -2019-08-14 08:07:39,514 epoch 30 - iter 0/3720 - loss 0.81500816 throughput (samples/sec): 20984.86 -2019-08-14 08:10:20,970 epoch 30 - iter 372/3720 - loss 0.81239048 throughput (samples/sec): 76.92 -2019-08-14 08:13:00,303 epoch 30 - iter 744/3720 - loss 0.81347853 throughput (samples/sec): 77.69 -2019-08-14 08:15:41,423 epoch 30 - iter 1116/3720 - loss 0.81150716 throughput (samples/sec): 77.10 -2019-08-14 08:18:23,031 epoch 30 - iter 1488/3720 - loss 0.81471588 throughput (samples/sec): 76.16 -2019-08-14 08:21:05,145 epoch 30 - iter 1860/3720 - loss 0.82097621 throughput (samples/sec): 76.68 -2019-08-14 08:23:46,690 epoch 30 - iter 2232/3720 - loss 0.82189468 throughput (samples/sec): 76.60 -2019-08-14 08:26:30,859 epoch 30 - iter 2604/3720 - loss 0.82199087 throughput (samples/sec): 74.89 -2019-08-14 08:29:16,310 epoch 30 - iter 2976/3720 - loss 0.82379773 throughput (samples/sec): 75.54 -2019-08-14 08:31:58,670 epoch 30 - iter 3348/3720 - loss 0.82254770 throughput (samples/sec): 76.73 -2019-08-14 08:34:39,291 ---------------------------------------------------------------------------------------------------- -2019-08-14 08:34:39,291 EPOCH 30 done: loss 0.8224 - lr 0.1000 -2019-08-14 08:34:39,291 BAD EPOCHS (no improvement): 0 -2019-08-14 08:34:39,291 ---------------------------------------------------------------------------------------------------- -2019-08-14 08:34:40,981 epoch 31 - iter 0/3720 - loss 0.87063098 throughput (samples/sec): 25978.72 -2019-08-14 08:37:24,160 epoch 31 - iter 372/3720 - loss 0.81877115 throughput (samples/sec): 76.62 -2019-08-14 08:40:06,376 epoch 31 - iter 744/3720 - loss 0.80957155 throughput (samples/sec): 76.01 -2019-08-14 08:42:47,552 epoch 31 - iter 1116/3720 - loss 0.81335378 throughput (samples/sec): 76.32 -2019-08-14 08:45:28,929 epoch 31 - iter 1488/3720 - loss 0.81152575 throughput (samples/sec): 76.71 -2019-08-14 08:48:08,944 epoch 31 - iter 1860/3720 - loss 0.81055201 throughput (samples/sec): 76.85 -2019-08-14 08:50:52,340 epoch 31 - iter 2232/3720 - loss 0.81597067 throughput (samples/sec): 75.77 -2019-08-14 08:53:34,379 epoch 31 - iter 2604/3720 - loss 0.81272879 throughput (samples/sec): 76.49 -2019-08-14 08:56:16,484 epoch 31 - iter 2976/3720 - loss 0.81034411 throughput (samples/sec): 76.71 -2019-08-14 08:58:57,677 epoch 31 - iter 3348/3720 - loss 0.81026002 throughput (samples/sec): 77.45 -2019-08-14 09:01:41,002 ---------------------------------------------------------------------------------------------------- -2019-08-14 09:01:41,002 EPOCH 31 done: loss 0.8125 - lr 0.1000 -2019-08-14 09:01:41,002 BAD EPOCHS (no improvement): 0 -2019-08-14 09:01:41,002 ---------------------------------------------------------------------------------------------------- -2019-08-14 09:01:42,852 epoch 32 - iter 0/3720 - loss 0.93556166 throughput (samples/sec): 19410.99 -2019-08-14 09:04:25,829 epoch 32 - iter 372/3720 - loss 0.81481181 throughput (samples/sec): 76.57 -2019-08-14 09:07:07,495 epoch 32 - iter 744/3720 - loss 0.81414005 throughput (samples/sec): 76.68 -2019-08-14 09:09:47,678 epoch 32 - iter 1116/3720 - loss 0.80444633 throughput (samples/sec): 77.64 -2019-08-14 09:12:29,577 epoch 32 - iter 1488/3720 - loss 0.80200519 throughput (samples/sec): 76.19 -2019-08-14 09:15:13,653 epoch 32 - iter 1860/3720 - loss 0.80578624 throughput (samples/sec): 75.43 -2019-08-14 09:17:57,057 epoch 32 - iter 2232/3720 - loss 0.80393197 throughput (samples/sec): 75.53 -2019-08-14 09:20:39,157 epoch 32 - iter 2604/3720 - loss 0.80579875 throughput (samples/sec): 76.64 -2019-08-14 09:23:19,397 epoch 32 - iter 2976/3720 - loss 0.80595655 throughput (samples/sec): 76.80 -2019-08-14 09:26:03,640 epoch 32 - iter 3348/3720 - loss 0.80699840 throughput (samples/sec): 75.44 -2019-08-14 09:28:46,952 ---------------------------------------------------------------------------------------------------- -2019-08-14 09:28:46,952 EPOCH 32 done: loss 0.8078 - lr 0.1000 -2019-08-14 09:28:46,952 BAD EPOCHS (no improvement): 0 -2019-08-14 09:28:46,953 ---------------------------------------------------------------------------------------------------- -2019-08-14 09:28:48,725 epoch 33 - iter 0/3720 - loss 1.14282894 throughput (samples/sec): 22741.75 -2019-08-14 09:31:33,065 epoch 33 - iter 372/3720 - loss 0.79242806 throughput (samples/sec): 75.38 -2019-08-14 09:34:14,938 epoch 33 - iter 744/3720 - loss 0.79153694 throughput (samples/sec): 76.27 -2019-08-14 09:36:57,067 epoch 33 - iter 1116/3720 - loss 0.78445381 throughput (samples/sec): 75.84 -2019-08-14 09:39:37,419 epoch 33 - iter 1488/3720 - loss 0.78898957 throughput (samples/sec): 77.22 -2019-08-14 09:42:18,527 epoch 33 - iter 1860/3720 - loss 0.79201788 throughput (samples/sec): 76.93 -2019-08-14 09:45:01,746 epoch 33 - iter 2232/3720 - loss 0.79793941 throughput (samples/sec): 75.70 -2019-08-14 09:47:44,620 epoch 33 - iter 2604/3720 - loss 0.80225023 throughput (samples/sec): 76.00 -2019-08-14 09:50:29,375 epoch 33 - iter 2976/3720 - loss 0.80390341 throughput (samples/sec): 75.19 -2019-08-14 09:53:13,518 epoch 33 - iter 3348/3720 - loss 0.80712164 throughput (samples/sec): 75.52 -2019-08-14 09:55:57,972 ---------------------------------------------------------------------------------------------------- -2019-08-14 09:55:57,972 EPOCH 33 done: loss 0.8091 - lr 0.1000 -2019-08-14 09:55:57,972 BAD EPOCHS (no improvement): 1 -2019-08-14 09:55:57,973 ---------------------------------------------------------------------------------------------------- -2019-08-14 09:56:01,659 epoch 34 - iter 0/3720 - loss 0.71488857 throughput (samples/sec): 27632.22 -2019-08-14 09:58:44,695 epoch 34 - iter 372/3720 - loss 0.77256594 throughput (samples/sec): 76.32 -2019-08-14 10:01:31,223 epoch 34 - iter 744/3720 - loss 0.78737526 throughput (samples/sec): 74.71 -2019-08-14 10:04:16,290 epoch 34 - iter 1116/3720 - loss 0.79715857 throughput (samples/sec): 75.06 -2019-08-14 10:07:01,248 epoch 34 - iter 1488/3720 - loss 0.79773837 throughput (samples/sec): 75.60 -2019-08-14 10:09:45,316 epoch 34 - iter 1860/3720 - loss 0.79813033 throughput (samples/sec): 75.29 -2019-08-14 10:12:27,569 epoch 34 - iter 2232/3720 - loss 0.79306019 throughput (samples/sec): 76.87 -2019-08-14 10:15:09,252 epoch 34 - iter 2604/3720 - loss 0.79574371 throughput (samples/sec): 76.64 -2019-08-14 10:17:53,436 epoch 34 - iter 2976/3720 - loss 0.79968203 throughput (samples/sec): 75.98 -2019-08-14 10:20:37,716 epoch 34 - iter 3348/3720 - loss 0.80178127 throughput (samples/sec): 75.67 -2019-08-14 10:23:19,623 ---------------------------------------------------------------------------------------------------- -2019-08-14 10:23:19,623 EPOCH 34 done: loss 0.8030 - lr 0.1000 -2019-08-14 10:23:19,623 BAD EPOCHS (no improvement): 0 -2019-08-14 10:23:19,623 ---------------------------------------------------------------------------------------------------- -2019-08-14 10:23:21,470 epoch 35 - iter 0/3720 - loss 0.62424660 throughput (samples/sec): 19489.28 -2019-08-14 10:26:02,607 epoch 35 - iter 372/3720 - loss 0.77490196 throughput (samples/sec): 77.13 -2019-08-14 10:28:47,662 epoch 35 - iter 744/3720 - loss 0.78308644 throughput (samples/sec): 75.51 -2019-08-14 10:31:31,611 epoch 35 - iter 1116/3720 - loss 0.78577719 throughput (samples/sec): 75.46 -2019-08-14 10:34:15,657 epoch 35 - iter 1488/3720 - loss 0.79807413 throughput (samples/sec): 75.70 -2019-08-14 10:36:59,903 epoch 35 - iter 1860/3720 - loss 0.79465278 throughput (samples/sec): 75.49 -2019-08-14 10:39:40,785 epoch 35 - iter 2232/3720 - loss 0.79383296 throughput (samples/sec): 77.22 -2019-08-14 10:42:21,943 epoch 35 - iter 2604/3720 - loss 0.79662813 throughput (samples/sec): 76.58 -2019-08-14 10:45:04,344 epoch 35 - iter 2976/3720 - loss 0.79632612 throughput (samples/sec): 76.49 -2019-08-14 10:47:47,713 epoch 35 - iter 3348/3720 - loss 0.79514678 throughput (samples/sec): 75.64 -2019-08-14 10:50:30,098 ---------------------------------------------------------------------------------------------------- -2019-08-14 10:50:30,098 EPOCH 35 done: loss 0.7968 - lr 0.1000 -2019-08-14 10:50:30,099 BAD EPOCHS (no improvement): 0 -2019-08-14 10:50:30,099 ---------------------------------------------------------------------------------------------------- -2019-08-14 10:50:31,987 epoch 36 - iter 0/3720 - loss 0.43951750 throughput (samples/sec): 18750.66 -2019-08-14 10:53:13,684 epoch 36 - iter 372/3720 - loss 0.79297794 throughput (samples/sec): 77.36 -2019-08-14 10:55:55,635 epoch 36 - iter 744/3720 - loss 0.78561678 throughput (samples/sec): 76.44 -2019-08-14 10:58:39,341 epoch 36 - iter 1116/3720 - loss 0.78337254 throughput (samples/sec): 75.98 -2019-08-14 11:01:21,391 epoch 36 - iter 1488/3720 - loss 0.78491121 throughput (samples/sec): 76.43 -2019-08-14 11:04:02,692 epoch 36 - iter 1860/3720 - loss 0.78543545 throughput (samples/sec): 76.81 -2019-08-14 11:06:45,948 epoch 36 - iter 2232/3720 - loss 0.78986404 throughput (samples/sec): 76.13 -2019-08-14 11:09:27,785 epoch 36 - iter 2604/3720 - loss 0.78871775 throughput (samples/sec): 76.79 -2019-08-14 11:12:10,671 epoch 36 - iter 2976/3720 - loss 0.79089339 throughput (samples/sec): 76.01 -2019-08-14 11:14:55,671 epoch 36 - iter 3348/3720 - loss 0.79021527 throughput (samples/sec): 74.78 -2019-08-14 11:17:40,495 ---------------------------------------------------------------------------------------------------- -2019-08-14 11:17:40,495 EPOCH 36 done: loss 0.7919 - lr 0.1000 -2019-08-14 11:17:40,495 BAD EPOCHS (no improvement): 0 -2019-08-14 11:17:40,496 ---------------------------------------------------------------------------------------------------- -2019-08-14 11:17:42,295 epoch 37 - iter 0/3720 - loss 0.82777739 throughput (samples/sec): 20768.61 -2019-08-14 11:20:28,417 epoch 37 - iter 372/3720 - loss 0.76822207 throughput (samples/sec): 75.23 -2019-08-14 11:23:11,308 epoch 37 - iter 744/3720 - loss 0.77435861 throughput (samples/sec): 76.35 -2019-08-14 11:25:53,236 epoch 37 - iter 1116/3720 - loss 0.76932787 throughput (samples/sec): 77.01 -2019-08-14 11:28:37,105 epoch 37 - iter 1488/3720 - loss 0.77894538 throughput (samples/sec): 75.85 -2019-08-14 11:31:17,366 epoch 37 - iter 1860/3720 - loss 0.77567754 throughput (samples/sec): 77.32 -2019-08-14 11:34:02,681 epoch 37 - iter 2232/3720 - loss 0.78024940 throughput (samples/sec): 75.18 -2019-08-14 11:36:46,301 epoch 37 - iter 2604/3720 - loss 0.78482170 throughput (samples/sec): 75.49 -2019-08-14 11:39:29,204 epoch 37 - iter 2976/3720 - loss 0.78479239 throughput (samples/sec): 76.09 -2019-08-14 11:42:10,412 epoch 37 - iter 3348/3720 - loss 0.78473515 throughput (samples/sec): 77.14 -2019-08-14 11:44:54,426 ---------------------------------------------------------------------------------------------------- -2019-08-14 11:44:54,426 EPOCH 37 done: loss 0.7892 - lr 0.1000 -2019-08-14 11:44:54,426 BAD EPOCHS (no improvement): 0 -2019-08-14 11:44:54,427 ---------------------------------------------------------------------------------------------------- -2019-08-14 11:44:56,216 epoch 38 - iter 0/3720 - loss 0.78023076 throughput (samples/sec): 21793.95 -2019-08-14 11:47:38,692 epoch 38 - iter 372/3720 - loss 0.74851398 throughput (samples/sec): 76.25 -2019-08-14 11:50:22,028 epoch 38 - iter 744/3720 - loss 0.76739986 throughput (samples/sec): 75.30 -2019-08-14 11:53:06,333 epoch 38 - iter 1116/3720 - loss 0.77736667 throughput (samples/sec): 75.70 -2019-08-14 11:55:48,826 epoch 38 - iter 1488/3720 - loss 0.77310367 throughput (samples/sec): 76.72 -2019-08-14 11:58:32,524 epoch 38 - iter 1860/3720 - loss 0.77840089 throughput (samples/sec): 75.46 -2019-08-14 12:01:14,962 epoch 38 - iter 2232/3720 - loss 0.77754011 throughput (samples/sec): 76.57 -2019-08-14 12:04:00,627 epoch 38 - iter 2604/3720 - loss 0.77969866 throughput (samples/sec): 75.07 -2019-08-14 12:06:43,417 epoch 38 - iter 2976/3720 - loss 0.78164577 throughput (samples/sec): 75.34 -2019-08-14 12:09:26,922 epoch 38 - iter 3348/3720 - loss 0.78217429 throughput (samples/sec): 75.74 -2019-08-14 12:12:11,148 ---------------------------------------------------------------------------------------------------- -2019-08-14 12:12:11,148 EPOCH 38 done: loss 0.7863 - lr 0.1000 -2019-08-14 12:12:11,148 BAD EPOCHS (no improvement): 0 -2019-08-14 12:12:11,148 ---------------------------------------------------------------------------------------------------- -2019-08-14 12:12:12,872 epoch 39 - iter 0/3720 - loss 0.23265123 throughput (samples/sec): 24101.04 -2019-08-14 12:14:58,524 epoch 39 - iter 372/3720 - loss 0.77197853 throughput (samples/sec): 74.71 -2019-08-14 12:17:40,433 epoch 39 - iter 744/3720 - loss 0.76961754 throughput (samples/sec): 76.66 -2019-08-14 12:20:25,155 epoch 39 - iter 1116/3720 - loss 0.76871698 throughput (samples/sec): 75.79 -2019-08-14 12:23:08,308 epoch 39 - iter 1488/3720 - loss 0.77651283 throughput (samples/sec): 76.24 -2019-08-14 12:25:49,448 epoch 39 - iter 1860/3720 - loss 0.77813435 throughput (samples/sec): 77.44 -2019-08-14 12:28:33,434 epoch 39 - iter 2232/3720 - loss 0.77693592 throughput (samples/sec): 75.80 -2019-08-14 12:31:15,148 epoch 39 - iter 2604/3720 - loss 0.77788986 throughput (samples/sec): 76.58 -2019-08-14 12:33:59,366 epoch 39 - iter 2976/3720 - loss 0.77861483 throughput (samples/sec): 75.68 -2019-08-14 12:36:39,819 epoch 39 - iter 3348/3720 - loss 0.78346222 throughput (samples/sec): 77.16 -2019-08-14 12:39:24,035 ---------------------------------------------------------------------------------------------------- -2019-08-14 12:39:24,035 EPOCH 39 done: loss 0.7853 - lr 0.1000 -2019-08-14 12:39:24,035 BAD EPOCHS (no improvement): 0 -2019-08-14 12:39:24,036 ---------------------------------------------------------------------------------------------------- -2019-08-14 12:39:25,791 epoch 40 - iter 0/3720 - loss 0.58722878 throughput (samples/sec): 22305.61 -2019-08-14 12:42:11,628 epoch 40 - iter 372/3720 - loss 0.75334743 throughput (samples/sec): 75.15 -2019-08-14 12:44:52,537 epoch 40 - iter 744/3720 - loss 0.76206844 throughput (samples/sec): 76.85 -2019-08-14 12:47:38,250 epoch 40 - iter 1116/3720 - loss 0.76499784 throughput (samples/sec): 74.33 -2019-08-14 12:50:23,460 epoch 40 - iter 1488/3720 - loss 0.77031140 throughput (samples/sec): 75.27 -2019-08-14 12:53:05,762 epoch 40 - iter 1860/3720 - loss 0.77018718 throughput (samples/sec): 76.65 -2019-08-14 12:55:48,750 epoch 40 - iter 2232/3720 - loss 0.76899935 throughput (samples/sec): 76.82 -2019-08-14 12:58:33,228 epoch 40 - iter 2604/3720 - loss 0.77190297 throughput (samples/sec): 75.30 -2019-08-14 13:01:19,377 epoch 40 - iter 2976/3720 - loss 0.77588937 throughput (samples/sec): 74.49 -2019-08-14 13:04:02,816 epoch 40 - iter 3348/3720 - loss 0.77817319 throughput (samples/sec): 75.37 -2019-08-14 13:06:45,763 ---------------------------------------------------------------------------------------------------- -2019-08-14 13:06:45,763 EPOCH 40 done: loss 0.7786 - lr 0.1000 -2019-08-14 13:06:45,763 BAD EPOCHS (no improvement): 0 -2019-08-14 13:06:45,763 ---------------------------------------------------------------------------------------------------- -2019-08-14 13:06:47,609 epoch 41 - iter 0/3720 - loss 0.97850704 throughput (samples/sec): 19867.87 -2019-08-14 13:09:31,086 epoch 41 - iter 372/3720 - loss 0.73826405 throughput (samples/sec): 76.17 -2019-08-14 13:12:11,708 epoch 41 - iter 744/3720 - loss 0.74929938 throughput (samples/sec): 77.55 -2019-08-14 13:14:54,562 epoch 41 - iter 1116/3720 - loss 0.75501634 throughput (samples/sec): 76.18 -2019-08-14 13:17:39,010 epoch 41 - iter 1488/3720 - loss 0.75722281 throughput (samples/sec): 75.95 -2019-08-14 13:20:20,933 epoch 41 - iter 1860/3720 - loss 0.76323961 throughput (samples/sec): 76.59 -2019-08-14 13:23:03,635 epoch 41 - iter 2232/3720 - loss 0.76721491 throughput (samples/sec): 76.39 -2019-08-14 13:25:47,994 epoch 41 - iter 2604/3720 - loss 0.76987636 throughput (samples/sec): 75.63 -2019-08-14 13:28:31,928 epoch 41 - iter 2976/3720 - loss 0.77010349 throughput (samples/sec): 75.27 -2019-08-14 13:31:13,193 epoch 41 - iter 3348/3720 - loss 0.77506491 throughput (samples/sec): 76.25 -2019-08-14 13:33:56,801 ---------------------------------------------------------------------------------------------------- -2019-08-14 13:33:56,802 EPOCH 41 done: loss 0.7786 - lr 0.1000 -2019-08-14 13:33:56,802 BAD EPOCHS (no improvement): 1 -2019-08-14 13:33:56,802 ---------------------------------------------------------------------------------------------------- -2019-08-14 13:33:58,532 epoch 42 - iter 0/3720 - loss 0.63338852 throughput (samples/sec): 24624.43 -2019-08-14 13:36:43,243 epoch 42 - iter 372/3720 - loss 0.75833072 throughput (samples/sec): 75.07 -2019-08-14 13:39:29,491 epoch 42 - iter 744/3720 - loss 0.77199813 throughput (samples/sec): 74.70 -2019-08-14 13:42:12,575 epoch 42 - iter 1116/3720 - loss 0.76894957 throughput (samples/sec): 76.30 -2019-08-14 13:44:56,045 epoch 42 - iter 1488/3720 - loss 0.77433610 throughput (samples/sec): 76.35 -2019-08-14 13:47:38,597 epoch 42 - iter 1860/3720 - loss 0.77794601 throughput (samples/sec): 76.25 -2019-08-14 13:50:22,368 epoch 42 - iter 2232/3720 - loss 0.78012072 throughput (samples/sec): 75.66 -2019-08-14 13:53:05,637 epoch 42 - iter 2604/3720 - loss 0.77964830 throughput (samples/sec): 75.92 -2019-08-14 13:55:49,360 epoch 42 - iter 2976/3720 - loss 0.77911553 throughput (samples/sec): 75.37 -2019-08-14 13:58:32,216 epoch 42 - iter 3348/3720 - loss 0.77941577 throughput (samples/sec): 75.55 -2019-08-14 14:01:15,078 ---------------------------------------------------------------------------------------------------- -2019-08-14 14:01:15,078 EPOCH 42 done: loss 0.7808 - lr 0.1000 -2019-08-14 14:01:15,078 BAD EPOCHS (no improvement): 2 -2019-08-14 14:01:15,079 ---------------------------------------------------------------------------------------------------- -2019-08-14 14:01:16,847 epoch 43 - iter 0/3720 - loss 0.68872690 throughput (samples/sec): 21838.42 -2019-08-14 14:04:00,625 epoch 43 - iter 372/3720 - loss 0.75214343 throughput (samples/sec): 76.07 -2019-08-14 14:06:43,941 epoch 43 - iter 744/3720 - loss 0.75778252 throughput (samples/sec): 76.17 -2019-08-14 14:09:27,845 epoch 43 - iter 1116/3720 - loss 0.76318982 throughput (samples/sec): 75.50 -2019-08-14 14:12:12,722 epoch 43 - iter 1488/3720 - loss 0.76836184 throughput (samples/sec): 75.05 -2019-08-14 14:14:55,965 epoch 43 - iter 1860/3720 - loss 0.77165607 throughput (samples/sec): 75.36 -2019-08-14 14:17:38,509 epoch 43 - iter 2232/3720 - loss 0.77207611 throughput (samples/sec): 75.71 -2019-08-14 14:20:21,869 epoch 43 - iter 2604/3720 - loss 0.76942012 throughput (samples/sec): 75.53 -2019-08-14 14:23:06,544 epoch 43 - iter 2976/3720 - loss 0.77072708 throughput (samples/sec): 75.16 -2019-08-14 14:25:51,156 epoch 43 - iter 3348/3720 - loss 0.77207772 throughput (samples/sec): 75.18 -2019-08-14 14:28:34,213 ---------------------------------------------------------------------------------------------------- -2019-08-14 14:28:34,213 EPOCH 43 done: loss 0.7747 - lr 0.1000 -2019-08-14 14:28:34,214 BAD EPOCHS (no improvement): 0 -2019-08-14 14:28:34,214 ---------------------------------------------------------------------------------------------------- -2019-08-14 14:28:35,986 epoch 44 - iter 0/3720 - loss 0.52772236 throughput (samples/sec): 22012.20 -2019-08-14 14:31:21,351 epoch 44 - iter 372/3720 - loss 0.73875834 throughput (samples/sec): 75.84 -2019-08-14 14:34:06,207 epoch 44 - iter 744/3720 - loss 0.74805818 throughput (samples/sec): 74.57 -2019-08-14 14:36:49,277 epoch 44 - iter 1116/3720 - loss 0.75838701 throughput (samples/sec): 76.39 -2019-08-14 14:39:32,521 epoch 44 - iter 1488/3720 - loss 0.75730461 throughput (samples/sec): 75.86 -2019-08-14 14:42:16,650 epoch 44 - iter 1860/3720 - loss 0.76060845 throughput (samples/sec): 75.37 -2019-08-14 14:44:58,867 epoch 44 - iter 2232/3720 - loss 0.75957031 throughput (samples/sec): 76.91 -2019-08-14 14:47:42,941 epoch 44 - iter 2604/3720 - loss 0.76498333 throughput (samples/sec): 75.28 -2019-08-14 14:50:25,547 epoch 44 - iter 2976/3720 - loss 0.76810558 throughput (samples/sec): 76.21 -2019-08-14 14:53:09,664 epoch 44 - iter 3348/3720 - loss 0.76843397 throughput (samples/sec): 76.13 -2019-08-14 14:55:52,688 ---------------------------------------------------------------------------------------------------- -2019-08-14 14:55:52,688 EPOCH 44 done: loss 0.7691 - lr 0.1000 -2019-08-14 14:55:52,689 BAD EPOCHS (no improvement): 0 -2019-08-14 14:55:52,689 ---------------------------------------------------------------------------------------------------- -2019-08-14 14:55:54,464 epoch 45 - iter 0/3720 - loss 1.43560195 throughput (samples/sec): 21068.02 -2019-08-14 14:58:38,510 epoch 45 - iter 372/3720 - loss 0.75508251 throughput (samples/sec): 75.95 -2019-08-14 15:01:21,132 epoch 45 - iter 744/3720 - loss 0.75836405 throughput (samples/sec): 75.97 -2019-08-14 15:04:01,105 epoch 45 - iter 1116/3720 - loss 0.76174958 throughput (samples/sec): 77.73 -2019-08-14 15:06:45,460 epoch 45 - iter 1488/3720 - loss 0.76080358 throughput (samples/sec): 75.89 -2019-08-14 15:09:29,688 epoch 45 - iter 1860/3720 - loss 0.76239873 throughput (samples/sec): 75.14 -2019-08-14 15:12:14,355 epoch 45 - iter 2232/3720 - loss 0.76074233 throughput (samples/sec): 75.69 -2019-08-14 15:14:56,725 epoch 45 - iter 2604/3720 - loss 0.76325412 throughput (samples/sec): 76.23 -2019-08-14 15:17:39,240 epoch 45 - iter 2976/3720 - loss 0.76365826 throughput (samples/sec): 75.82 -2019-08-14 15:20:23,125 epoch 45 - iter 3348/3720 - loss 0.76250980 throughput (samples/sec): 75.32 -2019-08-14 15:23:04,597 ---------------------------------------------------------------------------------------------------- -2019-08-14 15:23:04,597 EPOCH 45 done: loss 0.7651 - lr 0.1000 -2019-08-14 15:23:04,598 BAD EPOCHS (no improvement): 0 -2019-08-14 15:23:04,598 ---------------------------------------------------------------------------------------------------- -2019-08-14 15:23:06,328 epoch 46 - iter 0/3720 - loss 0.66252160 throughput (samples/sec): 23615.82 -2019-08-14 15:25:50,731 epoch 46 - iter 372/3720 - loss 0.75483485 throughput (samples/sec): 76.14 -2019-08-14 15:28:34,759 epoch 46 - iter 744/3720 - loss 0.74682368 throughput (samples/sec): 76.02 -2019-08-14 15:31:18,392 epoch 46 - iter 1116/3720 - loss 0.74561189 throughput (samples/sec): 75.77 -2019-08-14 15:33:59,985 epoch 46 - iter 1488/3720 - loss 0.75195894 throughput (samples/sec): 76.76 -2019-08-14 15:36:40,737 epoch 46 - iter 1860/3720 - loss 0.75655869 throughput (samples/sec): 76.26 -2019-08-14 15:39:24,545 epoch 46 - iter 2232/3720 - loss 0.75808917 throughput (samples/sec): 75.55 -2019-08-14 15:42:06,487 epoch 46 - iter 2604/3720 - loss 0.75924938 throughput (samples/sec): 76.33 -2019-08-14 15:44:48,150 epoch 46 - iter 2976/3720 - loss 0.76166353 throughput (samples/sec): 76.84 -2019-08-14 15:47:32,873 epoch 46 - iter 3348/3720 - loss 0.76376207 throughput (samples/sec): 75.20 -2019-08-14 15:50:16,533 ---------------------------------------------------------------------------------------------------- -2019-08-14 15:50:16,533 EPOCH 46 done: loss 0.7661 - lr 0.1000 -2019-08-14 15:50:16,533 BAD EPOCHS (no improvement): 1 -2019-08-14 15:50:16,533 ---------------------------------------------------------------------------------------------------- -2019-08-14 15:50:18,272 epoch 47 - iter 0/3720 - loss 0.39304829 throughput (samples/sec): 26489.37 -2019-08-14 15:53:02,730 epoch 47 - iter 372/3720 - loss 0.75428493 throughput (samples/sec): 75.68 -2019-08-14 15:55:47,310 epoch 47 - iter 744/3720 - loss 0.75820539 throughput (samples/sec): 75.31 -2019-08-14 15:58:30,958 epoch 47 - iter 1116/3720 - loss 0.74474148 throughput (samples/sec): 75.72 -2019-08-14 16:01:13,856 epoch 47 - iter 1488/3720 - loss 0.74930580 throughput (samples/sec): 75.58 -2019-08-14 16:04:00,001 epoch 47 - iter 1860/3720 - loss 0.75403889 throughput (samples/sec): 74.31 -2019-08-14 16:06:43,629 epoch 47 - iter 2232/3720 - loss 0.75405451 throughput (samples/sec): 76.32 -2019-08-14 16:09:28,623 epoch 47 - iter 2604/3720 - loss 0.75480857 throughput (samples/sec): 74.68 -2019-08-14 16:12:09,788 epoch 47 - iter 2976/3720 - loss 0.75980352 throughput (samples/sec): 76.79 -2019-08-14 16:14:52,904 epoch 47 - iter 3348/3720 - loss 0.75951706 throughput (samples/sec): 75.63 -2019-08-14 16:17:34,869 ---------------------------------------------------------------------------------------------------- -2019-08-14 16:17:34,869 EPOCH 47 done: loss 0.7607 - lr 0.1000 -2019-08-14 16:17:34,869 BAD EPOCHS (no improvement): 0 -2019-08-14 16:17:34,869 ---------------------------------------------------------------------------------------------------- -2019-08-14 16:17:36,701 epoch 48 - iter 0/3720 - loss 0.82291818 throughput (samples/sec): 20135.50 -2019-08-14 16:20:20,470 epoch 48 - iter 372/3720 - loss 0.77038898 throughput (samples/sec): 76.16 -2019-08-14 16:23:02,814 epoch 48 - iter 744/3720 - loss 0.76223179 throughput (samples/sec): 75.98 -2019-08-14 16:25:45,443 epoch 48 - iter 1116/3720 - loss 0.75885424 throughput (samples/sec): 76.18 -2019-08-14 16:28:27,667 epoch 48 - iter 1488/3720 - loss 0.75248719 throughput (samples/sec): 76.84 -2019-08-14 16:31:12,653 epoch 48 - iter 1860/3720 - loss 0.75099416 throughput (samples/sec): 74.57 -2019-08-14 16:33:53,844 epoch 48 - iter 2232/3720 - loss 0.75536231 throughput (samples/sec): 76.66 -2019-08-14 16:36:37,276 epoch 48 - iter 2604/3720 - loss 0.75770054 throughput (samples/sec): 76.06 -2019-08-14 16:39:19,486 epoch 48 - iter 2976/3720 - loss 0.75838775 throughput (samples/sec): 76.60 -2019-08-14 16:42:03,465 epoch 48 - iter 3348/3720 - loss 0.75958379 throughput (samples/sec): 75.55 -2019-08-14 16:44:48,637 ---------------------------------------------------------------------------------------------------- -2019-08-14 16:44:48,637 EPOCH 48 done: loss 0.7617 - lr 0.1000 -2019-08-14 16:44:48,638 BAD EPOCHS (no improvement): 1 -2019-08-14 16:44:48,638 ---------------------------------------------------------------------------------------------------- -2019-08-14 16:44:50,554 epoch 49 - iter 0/3720 - loss 1.34337878 throughput (samples/sec): 18654.33 -2019-08-14 16:47:34,761 epoch 49 - iter 372/3720 - loss 0.76156030 throughput (samples/sec): 74.94 -2019-08-14 16:50:19,841 epoch 49 - iter 744/3720 - loss 0.74941096 throughput (samples/sec): 74.69 -2019-08-14 16:53:03,839 epoch 49 - iter 1116/3720 - loss 0.75317018 throughput (samples/sec): 75.50 -2019-08-14 16:55:51,005 epoch 49 - iter 1488/3720 - loss 0.75337798 throughput (samples/sec): 74.28 -2019-08-14 16:58:34,530 epoch 49 - iter 1860/3720 - loss 0.75602612 throughput (samples/sec): 76.03 -2019-08-14 17:01:17,519 epoch 49 - iter 2232/3720 - loss 0.75180339 throughput (samples/sec): 75.61 -2019-08-14 17:04:00,090 epoch 49 - iter 2604/3720 - loss 0.75593186 throughput (samples/sec): 76.10 -2019-08-14 17:06:43,295 epoch 49 - iter 2976/3720 - loss 0.75534409 throughput (samples/sec): 75.83 -2019-08-14 17:09:26,002 epoch 49 - iter 3348/3720 - loss 0.75667819 throughput (samples/sec): 76.40 -2019-08-14 17:12:07,259 ---------------------------------------------------------------------------------------------------- -2019-08-14 17:12:07,259 EPOCH 49 done: loss 0.7601 - lr 0.1000 -2019-08-14 17:12:07,260 BAD EPOCHS (no improvement): 0 -2019-08-14 17:12:07,260 ---------------------------------------------------------------------------------------------------- -2019-08-14 17:12:09,042 epoch 50 - iter 0/3720 - loss 0.97927094 throughput (samples/sec): 21647.09 -2019-08-14 17:14:50,590 epoch 50 - iter 372/3720 - loss 0.73899130 throughput (samples/sec): 76.31 -2019-08-14 17:17:34,742 epoch 50 - iter 744/3720 - loss 0.75342126 throughput (samples/sec): 76.36 -2019-08-14 17:20:17,444 epoch 50 - iter 1116/3720 - loss 0.75718372 throughput (samples/sec): 76.44 -2019-08-14 17:22:59,231 epoch 50 - iter 1488/3720 - loss 0.76254187 throughput (samples/sec): 76.33 -2019-08-14 17:25:39,668 epoch 50 - iter 1860/3720 - loss 0.75906314 throughput (samples/sec): 77.44 -2019-08-14 17:28:22,556 epoch 50 - iter 2232/3720 - loss 0.75757680 throughput (samples/sec): 76.01 -2019-08-14 17:31:04,874 epoch 50 - iter 2604/3720 - loss 0.75783715 throughput (samples/sec): 75.98 -2019-08-14 17:33:48,252 epoch 50 - iter 2976/3720 - loss 0.75714920 throughput (samples/sec): 76.04 -2019-08-14 17:36:33,231 epoch 50 - iter 3348/3720 - loss 0.76068452 throughput (samples/sec): 75.13 -2019-08-14 17:39:16,121 ---------------------------------------------------------------------------------------------------- -2019-08-14 17:39:16,121 EPOCH 50 done: loss 0.7618 - lr 0.1000 -2019-08-14 17:39:16,121 BAD EPOCHS (no improvement): 1 -2019-08-14 17:39:16,122 ---------------------------------------------------------------------------------------------------- -2019-08-14 17:39:17,972 epoch 51 - iter 0/3720 - loss 1.26759529 throughput (samples/sec): 19009.72 -2019-08-14 17:42:03,535 epoch 51 - iter 372/3720 - loss 0.74237626 throughput (samples/sec): 74.69 -2019-08-14 17:44:46,059 epoch 51 - iter 744/3720 - loss 0.75311880 throughput (samples/sec): 75.38 -2019-08-14 17:47:27,270 epoch 51 - iter 1116/3720 - loss 0.75263479 throughput (samples/sec): 76.89 -2019-08-14 17:50:10,566 epoch 51 - iter 1488/3720 - loss 0.75039430 throughput (samples/sec): 75.87 -2019-08-14 17:52:54,928 epoch 51 - iter 1860/3720 - loss 0.75403713 throughput (samples/sec): 75.59 -2019-08-14 17:55:37,342 epoch 51 - iter 2232/3720 - loss 0.75930934 throughput (samples/sec): 76.54 -2019-08-14 17:58:20,705 epoch 51 - iter 2604/3720 - loss 0.76284662 throughput (samples/sec): 76.02 -2019-08-14 18:01:02,786 epoch 51 - iter 2976/3720 - loss 0.76178079 throughput (samples/sec): 76.42 -2019-08-14 18:03:44,865 epoch 51 - iter 3348/3720 - loss 0.76144413 throughput (samples/sec): 76.11 -2019-08-14 18:06:27,781 ---------------------------------------------------------------------------------------------------- -2019-08-14 18:06:27,781 EPOCH 51 done: loss 0.7619 - lr 0.1000 -2019-08-14 18:06:27,782 BAD EPOCHS (no improvement): 2 -2019-08-14 18:06:27,782 ---------------------------------------------------------------------------------------------------- -2019-08-14 18:06:29,458 epoch 52 - iter 0/3720 - loss 0.57871222 throughput (samples/sec): 26728.36 -2019-08-14 18:09:12,148 epoch 52 - iter 372/3720 - loss 0.73084527 throughput (samples/sec): 76.79 -2019-08-14 18:11:52,715 epoch 52 - iter 744/3720 - loss 0.73365897 throughput (samples/sec): 77.24 -2019-08-14 18:14:36,675 epoch 52 - iter 1116/3720 - loss 0.73434769 throughput (samples/sec): 75.17 -2019-08-14 18:17:20,420 epoch 52 - iter 1488/3720 - loss 0.74055205 throughput (samples/sec): 75.79 -2019-08-14 18:20:01,495 epoch 52 - iter 1860/3720 - loss 0.74339731 throughput (samples/sec): 76.39 -2019-08-14 18:22:44,949 epoch 52 - iter 2232/3720 - loss 0.74755466 throughput (samples/sec): 75.76 -2019-08-14 18:25:26,574 epoch 52 - iter 2604/3720 - loss 0.74820550 throughput (samples/sec): 76.57 -2019-08-14 18:28:09,429 epoch 52 - iter 2976/3720 - loss 0.75173387 throughput (samples/sec): 76.06 -2019-08-14 18:30:53,253 epoch 52 - iter 3348/3720 - loss 0.75201545 throughput (samples/sec): 75.82 -2019-08-14 18:33:35,457 ---------------------------------------------------------------------------------------------------- -2019-08-14 18:33:35,458 EPOCH 52 done: loss 0.7543 - lr 0.1000 -2019-08-14 18:33:35,458 BAD EPOCHS (no improvement): 0 -2019-08-14 18:33:35,458 ---------------------------------------------------------------------------------------------------- -2019-08-14 18:33:37,166 epoch 53 - iter 0/3720 - loss 0.61249542 throughput (samples/sec): 25208.06 -2019-08-14 18:36:21,613 epoch 53 - iter 372/3720 - loss 0.74805649 throughput (samples/sec): 75.41 -2019-08-14 18:39:03,272 epoch 53 - iter 744/3720 - loss 0.75072114 throughput (samples/sec): 77.14 -2019-08-14 18:41:45,956 epoch 53 - iter 1116/3720 - loss 0.75108793 throughput (samples/sec): 76.32 -2019-08-14 18:44:29,766 epoch 53 - iter 1488/3720 - loss 0.75391734 throughput (samples/sec): 75.66 -2019-08-14 18:47:12,592 epoch 53 - iter 1860/3720 - loss 0.74764612 throughput (samples/sec): 76.07 -2019-08-14 18:49:57,318 epoch 53 - iter 2232/3720 - loss 0.74757328 throughput (samples/sec): 75.73 -2019-08-14 18:52:40,159 epoch 53 - iter 2604/3720 - loss 0.74952306 throughput (samples/sec): 76.39 -2019-08-14 18:55:24,083 epoch 53 - iter 2976/3720 - loss 0.75313432 throughput (samples/sec): 76.14 -2019-08-14 18:58:06,199 epoch 53 - iter 3348/3720 - loss 0.75308205 throughput (samples/sec): 76.81 -2019-08-14 19:00:47,100 ---------------------------------------------------------------------------------------------------- -2019-08-14 19:00:47,100 EPOCH 53 done: loss 0.7549 - lr 0.1000 -2019-08-14 19:00:47,101 BAD EPOCHS (no improvement): 1 -2019-08-14 19:00:47,101 ---------------------------------------------------------------------------------------------------- -2019-08-14 19:00:48,951 epoch 54 - iter 0/3720 - loss 0.67171741 throughput (samples/sec): 19161.77 -2019-08-14 19:03:32,920 epoch 54 - iter 372/3720 - loss 0.74230660 throughput (samples/sec): 75.75 -2019-08-14 19:06:15,827 epoch 54 - iter 744/3720 - loss 0.74685144 throughput (samples/sec): 76.25 -2019-08-14 19:08:56,069 epoch 54 - iter 1116/3720 - loss 0.74700704 throughput (samples/sec): 77.52 -2019-08-14 19:11:38,544 epoch 54 - iter 1488/3720 - loss 0.75306211 throughput (samples/sec): 75.96 -2019-08-14 19:14:18,157 epoch 54 - iter 1860/3720 - loss 0.74918223 throughput (samples/sec): 77.93 -2019-08-14 19:17:00,573 epoch 54 - iter 2232/3720 - loss 0.74933947 throughput (samples/sec): 75.74 -2019-08-14 19:19:44,474 epoch 54 - iter 2604/3720 - loss 0.74663575 throughput (samples/sec): 75.33 -2019-08-14 19:22:29,900 epoch 54 - iter 2976/3720 - loss 0.75019036 throughput (samples/sec): 75.45 -2019-08-14 19:25:12,543 epoch 54 - iter 3348/3720 - loss 0.74980327 throughput (samples/sec): 76.71 -2019-08-14 19:27:54,033 ---------------------------------------------------------------------------------------------------- -2019-08-14 19:27:54,034 EPOCH 54 done: loss 0.7506 - lr 0.1000 -2019-08-14 19:27:54,034 BAD EPOCHS (no improvement): 0 -2019-08-14 19:27:54,034 ---------------------------------------------------------------------------------------------------- -2019-08-14 19:27:55,738 epoch 55 - iter 0/3720 - loss 0.97331429 throughput (samples/sec): 24427.91 -2019-08-14 19:30:40,109 epoch 55 - iter 372/3720 - loss 0.74853712 throughput (samples/sec): 75.99 -2019-08-14 19:33:24,213 epoch 55 - iter 744/3720 - loss 0.74421961 throughput (samples/sec): 76.03 -2019-08-14 19:36:05,022 epoch 55 - iter 1116/3720 - loss 0.74577684 throughput (samples/sec): 77.32 -2019-08-14 19:38:47,992 epoch 55 - iter 1488/3720 - loss 0.73921052 throughput (samples/sec): 76.25 -2019-08-14 19:41:29,736 epoch 55 - iter 1860/3720 - loss 0.73542538 throughput (samples/sec): 76.68 -2019-08-14 19:44:13,233 epoch 55 - iter 2232/3720 - loss 0.73635269 throughput (samples/sec): 76.21 -2019-08-14 19:46:55,509 epoch 55 - iter 2604/3720 - loss 0.74106540 throughput (samples/sec): 76.10 -2019-08-14 19:49:36,958 epoch 55 - iter 2976/3720 - loss 0.74200035 throughput (samples/sec): 76.16 -2019-08-14 19:52:18,341 epoch 55 - iter 3348/3720 - loss 0.74679479 throughput (samples/sec): 77.29 -2019-08-14 19:55:01,598 ---------------------------------------------------------------------------------------------------- -2019-08-14 19:55:01,598 EPOCH 55 done: loss 0.7470 - lr 0.1000 -2019-08-14 19:55:01,598 BAD EPOCHS (no improvement): 0 -2019-08-14 19:55:01,598 ---------------------------------------------------------------------------------------------------- -2019-08-14 19:55:04,348 epoch 56 - iter 0/3720 - loss 0.71890688 throughput (samples/sec): 26169.36 -2019-08-14 19:57:46,757 epoch 56 - iter 372/3720 - loss 0.73207588 throughput (samples/sec): 76.13 -2019-08-14 20:00:31,072 epoch 56 - iter 744/3720 - loss 0.73348572 throughput (samples/sec): 75.57 -2019-08-14 20:03:14,341 epoch 56 - iter 1116/3720 - loss 0.73629637 throughput (samples/sec): 75.59 -2019-08-14 20:05:58,793 epoch 56 - iter 1488/3720 - loss 0.73891543 throughput (samples/sec): 75.60 -2019-08-14 20:08:42,905 epoch 56 - iter 1860/3720 - loss 0.73834341 throughput (samples/sec): 75.46 -2019-08-14 20:11:26,841 epoch 56 - iter 2232/3720 - loss 0.74414507 throughput (samples/sec): 75.58 -2019-08-14 20:14:10,118 epoch 56 - iter 2604/3720 - loss 0.74336110 throughput (samples/sec): 75.92 -2019-08-14 20:16:53,154 epoch 56 - iter 2976/3720 - loss 0.74796666 throughput (samples/sec): 76.31 -2019-08-14 20:19:37,163 epoch 56 - iter 3348/3720 - loss 0.74692581 throughput (samples/sec): 75.53 -2019-08-14 20:22:19,883 ---------------------------------------------------------------------------------------------------- -2019-08-14 20:22:19,883 EPOCH 56 done: loss 0.7478 - lr 0.1000 -2019-08-14 20:22:19,883 BAD EPOCHS (no improvement): 1 -2019-08-14 20:22:19,883 ---------------------------------------------------------------------------------------------------- -2019-08-14 20:22:21,648 epoch 57 - iter 0/3720 - loss 0.85472202 throughput (samples/sec): 23897.78 -2019-08-14 20:25:04,667 epoch 57 - iter 372/3720 - loss 0.74693981 throughput (samples/sec): 76.14 -2019-08-14 20:27:46,998 epoch 57 - iter 744/3720 - loss 0.73994685 throughput (samples/sec): 76.06 -2019-08-14 20:30:31,197 epoch 57 - iter 1116/3720 - loss 0.74037492 throughput (samples/sec): 75.43 -2019-08-14 20:33:14,800 epoch 57 - iter 1488/3720 - loss 0.74129951 throughput (samples/sec): 75.93 -2019-08-14 20:35:57,416 epoch 57 - iter 1860/3720 - loss 0.73970720 throughput (samples/sec): 76.50 -2019-08-14 20:38:42,450 epoch 57 - iter 2232/3720 - loss 0.74059481 throughput (samples/sec): 75.31 -2019-08-14 20:41:24,561 epoch 57 - iter 2604/3720 - loss 0.74169771 throughput (samples/sec): 75.89 -2019-08-14 20:44:07,375 epoch 57 - iter 2976/3720 - loss 0.74399671 throughput (samples/sec): 76.10 -2019-08-14 20:46:48,123 epoch 57 - iter 3348/3720 - loss 0.74345626 throughput (samples/sec): 77.02 -2019-08-14 20:49:30,093 ---------------------------------------------------------------------------------------------------- -2019-08-14 20:49:30,093 EPOCH 57 done: loss 0.7457 - lr 0.1000 -2019-08-14 20:49:30,093 BAD EPOCHS (no improvement): 0 -2019-08-14 20:49:30,093 ---------------------------------------------------------------------------------------------------- -2019-08-14 20:49:31,806 epoch 58 - iter 0/3720 - loss 0.45362616 throughput (samples/sec): 24082.73 -2019-08-14 20:52:12,699 epoch 58 - iter 372/3720 - loss 0.71354575 throughput (samples/sec): 77.09 -2019-08-14 20:54:55,703 epoch 58 - iter 744/3720 - loss 0.73145597 throughput (samples/sec): 76.00 -2019-08-14 20:57:39,064 epoch 58 - iter 1116/3720 - loss 0.73658571 throughput (samples/sec): 75.80 -2019-08-14 21:00:24,993 epoch 58 - iter 1488/3720 - loss 0.74017712 throughput (samples/sec): 74.09 -2019-08-14 21:03:11,005 epoch 58 - iter 1860/3720 - loss 0.74260920 throughput (samples/sec): 75.10 -2019-08-14 21:05:56,837 epoch 58 - iter 2232/3720 - loss 0.74577490 throughput (samples/sec): 74.64 -2019-08-14 21:08:41,970 epoch 58 - iter 2604/3720 - loss 0.74515352 throughput (samples/sec): 74.53 -2019-08-14 21:11:24,564 epoch 58 - iter 2976/3720 - loss 0.74174200 throughput (samples/sec): 76.23 -2019-08-14 21:14:06,955 epoch 58 - iter 3348/3720 - loss 0.74376989 throughput (samples/sec): 76.31 -2019-08-14 21:16:48,132 ---------------------------------------------------------------------------------------------------- -2019-08-14 21:16:48,132 EPOCH 58 done: loss 0.7435 - lr 0.1000 -2019-08-14 21:16:48,132 BAD EPOCHS (no improvement): 0 -2019-08-14 21:16:48,132 ---------------------------------------------------------------------------------------------------- -2019-08-14 21:16:49,917 epoch 59 - iter 0/3720 - loss 0.77027607 throughput (samples/sec): 20987.49 -2019-08-14 21:19:33,135 epoch 59 - iter 372/3720 - loss 0.72925466 throughput (samples/sec): 76.27 -2019-08-14 21:22:17,906 epoch 59 - iter 744/3720 - loss 0.72926642 throughput (samples/sec): 75.43 -2019-08-14 21:25:01,002 epoch 59 - iter 1116/3720 - loss 0.73202464 throughput (samples/sec): 75.72 -2019-08-14 21:27:43,015 epoch 59 - iter 1488/3720 - loss 0.73810149 throughput (samples/sec): 76.94 -2019-08-14 21:30:24,864 epoch 59 - iter 1860/3720 - loss 0.73238014 throughput (samples/sec): 76.48 -2019-08-14 21:33:08,055 epoch 59 - iter 2232/3720 - loss 0.73436774 throughput (samples/sec): 75.09 -2019-08-14 21:35:49,184 epoch 59 - iter 2604/3720 - loss 0.73559569 throughput (samples/sec): 76.78 -2019-08-14 21:38:29,149 epoch 59 - iter 2976/3720 - loss 0.73635392 throughput (samples/sec): 77.17 -2019-08-14 21:41:10,739 epoch 59 - iter 3348/3720 - loss 0.73718110 throughput (samples/sec): 76.35 -2019-08-14 21:43:52,881 ---------------------------------------------------------------------------------------------------- -2019-08-14 21:43:52,881 EPOCH 59 done: loss 0.7408 - lr 0.1000 -2019-08-14 21:43:52,882 BAD EPOCHS (no improvement): 0 -2019-08-14 21:43:52,882 ---------------------------------------------------------------------------------------------------- -2019-08-14 21:43:54,645 epoch 60 - iter 0/3720 - loss 0.98191810 throughput (samples/sec): 24219.36 -2019-08-14 21:46:39,021 epoch 60 - iter 372/3720 - loss 0.72176144 throughput (samples/sec): 75.11 -2019-08-14 21:49:22,117 epoch 60 - iter 744/3720 - loss 0.71403301 throughput (samples/sec): 76.32 -2019-08-14 21:52:08,652 epoch 60 - iter 1116/3720 - loss 0.72868535 throughput (samples/sec): 74.50 -2019-08-14 21:54:50,475 epoch 60 - iter 1488/3720 - loss 0.72737240 throughput (samples/sec): 76.78 -2019-08-14 21:57:31,210 epoch 60 - iter 1860/3720 - loss 0.72907355 throughput (samples/sec): 77.56 -2019-08-14 22:00:15,489 epoch 60 - iter 2232/3720 - loss 0.73434055 throughput (samples/sec): 75.60 -2019-08-14 22:02:58,923 epoch 60 - iter 2604/3720 - loss 0.73681225 throughput (samples/sec): 75.67 -2019-08-14 22:05:40,964 epoch 60 - iter 2976/3720 - loss 0.73618339 throughput (samples/sec): 76.16 -2019-08-14 22:08:24,714 epoch 60 - iter 3348/3720 - loss 0.73901849 throughput (samples/sec): 75.85 -2019-08-14 22:11:05,914 ---------------------------------------------------------------------------------------------------- -2019-08-14 22:11:05,914 EPOCH 60 done: loss 0.7396 - lr 0.1000 -2019-08-14 22:11:05,914 BAD EPOCHS (no improvement): 0 -2019-08-14 22:11:05,915 ---------------------------------------------------------------------------------------------------- -2019-08-14 22:11:07,721 epoch 61 - iter 0/3720 - loss 0.68382168 throughput (samples/sec): 20916.51 -2019-08-14 22:13:53,808 epoch 61 - iter 372/3720 - loss 0.72449317 throughput (samples/sec): 74.61 -2019-08-14 22:16:34,307 epoch 61 - iter 744/3720 - loss 0.72894727 throughput (samples/sec): 77.55 -2019-08-14 22:19:18,381 epoch 61 - iter 1116/3720 - loss 0.72805352 throughput (samples/sec): 75.28 -2019-08-14 22:22:00,195 epoch 61 - iter 1488/3720 - loss 0.72741397 throughput (samples/sec): 76.37 -2019-08-14 22:24:46,291 epoch 61 - iter 1860/3720 - loss 0.73107531 throughput (samples/sec): 74.55 -2019-08-14 22:27:31,773 epoch 61 - iter 2232/3720 - loss 0.73336004 throughput (samples/sec): 74.84 -2019-08-14 22:30:14,513 epoch 61 - iter 2604/3720 - loss 0.73496273 throughput (samples/sec): 76.09 -2019-08-14 22:32:56,866 epoch 61 - iter 2976/3720 - loss 0.73693016 throughput (samples/sec): 76.55 -2019-08-14 22:35:41,443 epoch 61 - iter 3348/3720 - loss 0.73819449 throughput (samples/sec): 75.50 -2019-08-14 22:38:25,650 ---------------------------------------------------------------------------------------------------- -2019-08-14 22:38:25,651 EPOCH 61 done: loss 0.7396 - lr 0.1000 -2019-08-14 22:38:25,651 BAD EPOCHS (no improvement): 1 -2019-08-14 22:38:25,651 ---------------------------------------------------------------------------------------------------- -2019-08-14 22:38:27,327 epoch 62 - iter 0/3720 - loss 0.83497143 throughput (samples/sec): 26690.88 -2019-08-14 22:41:10,801 epoch 62 - iter 372/3720 - loss 0.69928461 throughput (samples/sec): 75.24 -2019-08-14 22:43:54,445 epoch 62 - iter 744/3720 - loss 0.71689739 throughput (samples/sec): 76.03 -2019-08-14 22:46:36,484 epoch 62 - iter 1116/3720 - loss 0.72613737 throughput (samples/sec): 76.55 -2019-08-14 22:49:17,903 epoch 62 - iter 1488/3720 - loss 0.73413796 throughput (samples/sec): 76.33 -2019-08-14 22:52:00,843 epoch 62 - iter 1860/3720 - loss 0.73513153 throughput (samples/sec): 76.06 -2019-08-14 22:54:42,384 epoch 62 - iter 2232/3720 - loss 0.73457161 throughput (samples/sec): 76.71 -2019-08-14 22:57:25,245 epoch 62 - iter 2604/3720 - loss 0.73525830 throughput (samples/sec): 75.84 -2019-08-14 23:00:10,382 epoch 62 - iter 2976/3720 - loss 0.73539528 throughput (samples/sec): 74.49 -2019-08-14 23:02:54,673 epoch 62 - iter 3348/3720 - loss 0.73383654 throughput (samples/sec): 75.92 -2019-08-14 23:05:34,924 ---------------------------------------------------------------------------------------------------- -2019-08-14 23:05:34,924 EPOCH 62 done: loss 0.7342 - lr 0.1000 -2019-08-14 23:05:34,924 BAD EPOCHS (no improvement): 0 -2019-08-14 23:05:34,924 ---------------------------------------------------------------------------------------------------- -2019-08-14 23:05:36,841 epoch 63 - iter 0/3720 - loss 1.00062656 throughput (samples/sec): 18842.43 -2019-08-14 23:08:20,041 epoch 63 - iter 372/3720 - loss 0.69916077 throughput (samples/sec): 76.12 -2019-08-14 23:11:02,950 epoch 63 - iter 744/3720 - loss 0.72681805 throughput (samples/sec): 75.80 -2019-08-14 23:13:44,788 epoch 63 - iter 1116/3720 - loss 0.72989547 throughput (samples/sec): 76.79 -2019-08-14 23:16:26,209 epoch 63 - iter 1488/3720 - loss 0.72719493 throughput (samples/sec): 76.23 -2019-08-14 23:19:09,212 epoch 63 - iter 1860/3720 - loss 0.72988845 throughput (samples/sec): 75.72 -2019-08-14 23:21:50,108 epoch 63 - iter 2232/3720 - loss 0.72970043 throughput (samples/sec): 77.64 -2019-08-14 23:24:33,016 epoch 63 - iter 2604/3720 - loss 0.73382251 throughput (samples/sec): 76.58 -2019-08-14 23:27:15,137 epoch 63 - iter 2976/3720 - loss 0.73717136 throughput (samples/sec): 76.45 -2019-08-14 23:30:00,155 epoch 63 - iter 3348/3720 - loss 0.73925103 throughput (samples/sec): 75.52 -2019-08-14 23:32:45,883 ---------------------------------------------------------------------------------------------------- -2019-08-14 23:32:45,883 EPOCH 63 done: loss 0.7375 - lr 0.1000 -2019-08-14 23:32:45,884 BAD EPOCHS (no improvement): 1 -2019-08-14 23:32:45,884 ---------------------------------------------------------------------------------------------------- -2019-08-14 23:32:47,718 epoch 64 - iter 0/3720 - loss 0.91116095 throughput (samples/sec): 20787.57 -2019-08-14 23:35:30,844 epoch 64 - iter 372/3720 - loss 0.70937026 throughput (samples/sec): 76.14 -2019-08-14 23:38:12,954 epoch 64 - iter 744/3720 - loss 0.71416915 throughput (samples/sec): 76.25 -2019-08-14 23:40:56,537 epoch 64 - iter 1116/3720 - loss 0.72306656 throughput (samples/sec): 75.73 -2019-08-14 23:43:38,795 epoch 64 - iter 1488/3720 - loss 0.72950350 throughput (samples/sec): 76.38 -2019-08-14 23:46:22,240 epoch 64 - iter 1860/3720 - loss 0.73023188 throughput (samples/sec): 75.55 -2019-08-14 23:49:07,508 epoch 64 - iter 2232/3720 - loss 0.73991050 throughput (samples/sec): 75.24 -2019-08-14 23:51:50,472 epoch 64 - iter 2604/3720 - loss 0.73558476 throughput (samples/sec): 75.55 -2019-08-14 23:54:34,035 epoch 64 - iter 2976/3720 - loss 0.73780724 throughput (samples/sec): 75.39 -2019-08-14 23:57:17,902 epoch 64 - iter 3348/3720 - loss 0.73830823 throughput (samples/sec): 75.54 -2019-08-15 00:00:00,770 ---------------------------------------------------------------------------------------------------- -2019-08-15 00:00:00,771 EPOCH 64 done: loss 0.7381 - lr 0.1000 -2019-08-15 00:00:00,771 BAD EPOCHS (no improvement): 2 -2019-08-15 00:00:00,771 ---------------------------------------------------------------------------------------------------- -2019-08-15 00:00:02,584 epoch 65 - iter 0/3720 - loss 0.32693148 throughput (samples/sec): 22815.08 -2019-08-15 00:02:47,795 epoch 65 - iter 372/3720 - loss 0.72546808 throughput (samples/sec): 75.18 -2019-08-15 00:05:30,832 epoch 65 - iter 744/3720 - loss 0.71997078 throughput (samples/sec): 76.18 -2019-08-15 00:08:13,133 epoch 65 - iter 1116/3720 - loss 0.72379885 throughput (samples/sec): 76.64 -2019-08-15 00:10:55,748 epoch 65 - iter 1488/3720 - loss 0.73026003 throughput (samples/sec): 75.58 -2019-08-15 00:13:38,831 epoch 65 - iter 1860/3720 - loss 0.72866729 throughput (samples/sec): 76.15 -2019-08-15 00:16:23,230 epoch 65 - iter 2232/3720 - loss 0.73193202 throughput (samples/sec): 75.80 -2019-08-15 00:19:05,811 epoch 65 - iter 2604/3720 - loss 0.73488588 throughput (samples/sec): 76.17 -2019-08-15 00:21:47,458 epoch 65 - iter 2976/3720 - loss 0.73342155 throughput (samples/sec): 76.66 -2019-08-15 00:24:30,573 epoch 65 - iter 3348/3720 - loss 0.73317977 throughput (samples/sec): 76.68 -2019-08-15 00:27:11,098 ---------------------------------------------------------------------------------------------------- -2019-08-15 00:27:11,098 EPOCH 65 done: loss 0.7337 - lr 0.1000 -2019-08-15 00:27:11,098 BAD EPOCHS (no improvement): 0 -2019-08-15 00:27:11,098 ---------------------------------------------------------------------------------------------------- -2019-08-15 00:27:12,805 epoch 66 - iter 0/3720 - loss 1.38492656 throughput (samples/sec): 24216.29 -2019-08-15 00:29:57,474 epoch 66 - iter 372/3720 - loss 0.71938262 throughput (samples/sec): 75.01 -2019-08-15 00:32:40,660 epoch 66 - iter 744/3720 - loss 0.72769710 throughput (samples/sec): 76.13 -2019-08-15 00:35:22,466 epoch 66 - iter 1116/3720 - loss 0.72472734 throughput (samples/sec): 76.03 -2019-08-15 00:38:06,013 epoch 66 - iter 1488/3720 - loss 0.72307139 throughput (samples/sec): 75.42 -2019-08-15 00:40:50,079 epoch 66 - iter 1860/3720 - loss 0.72180992 throughput (samples/sec): 75.22 -2019-08-15 00:43:33,965 epoch 66 - iter 2232/3720 - loss 0.72316565 throughput (samples/sec): 75.38 -2019-08-15 00:46:16,414 epoch 66 - iter 2604/3720 - loss 0.72457269 throughput (samples/sec): 76.39 -2019-08-15 00:48:56,521 epoch 66 - iter 2976/3720 - loss 0.72574739 throughput (samples/sec): 78.13 -2019-08-15 00:51:37,662 epoch 66 - iter 3348/3720 - loss 0.72776009 throughput (samples/sec): 77.15 -2019-08-15 00:54:19,066 ---------------------------------------------------------------------------------------------------- -2019-08-15 00:54:19,066 EPOCH 66 done: loss 0.7284 - lr 0.1000 -2019-08-15 00:54:19,067 BAD EPOCHS (no improvement): 0 -2019-08-15 00:54:19,067 ---------------------------------------------------------------------------------------------------- -2019-08-15 00:54:20,778 epoch 67 - iter 0/3720 - loss 0.29524422 throughput (samples/sec): 23902.01 -2019-08-15 00:57:03,137 epoch 67 - iter 372/3720 - loss 0.72741403 throughput (samples/sec): 76.22 -2019-08-15 00:59:46,280 epoch 67 - iter 744/3720 - loss 0.73207031 throughput (samples/sec): 75.99 -2019-08-15 01:02:30,298 epoch 67 - iter 1116/3720 - loss 0.72823694 throughput (samples/sec): 75.11 -2019-08-15 01:05:13,201 epoch 67 - iter 1488/3720 - loss 0.72249613 throughput (samples/sec): 76.04 -2019-08-15 01:07:57,837 epoch 67 - iter 1860/3720 - loss 0.72294863 throughput (samples/sec): 75.16 -2019-08-15 01:10:39,856 epoch 67 - iter 2232/3720 - loss 0.72870617 throughput (samples/sec): 76.78 -2019-08-15 01:13:26,215 epoch 67 - iter 2604/3720 - loss 0.72928314 throughput (samples/sec): 74.99 -2019-08-15 01:16:08,614 epoch 67 - iter 2976/3720 - loss 0.72970321 throughput (samples/sec): 76.23 -2019-08-15 01:18:50,806 epoch 67 - iter 3348/3720 - loss 0.73397555 throughput (samples/sec): 77.01 -2019-08-15 01:21:31,706 ---------------------------------------------------------------------------------------------------- -2019-08-15 01:21:31,706 EPOCH 67 done: loss 0.7338 - lr 0.1000 -2019-08-15 01:21:31,706 BAD EPOCHS (no improvement): 1 -2019-08-15 01:21:31,706 ---------------------------------------------------------------------------------------------------- -2019-08-15 01:21:33,410 epoch 68 - iter 0/3720 - loss 0.67003703 throughput (samples/sec): 24858.96 -2019-08-15 01:24:17,204 epoch 68 - iter 372/3720 - loss 0.73624984 throughput (samples/sec): 76.25 -2019-08-15 01:26:58,749 epoch 68 - iter 744/3720 - loss 0.72983033 throughput (samples/sec): 77.27 -2019-08-15 01:29:44,311 epoch 68 - iter 1116/3720 - loss 0.73069375 throughput (samples/sec): 74.94 -2019-08-15 01:32:27,170 epoch 68 - iter 1488/3720 - loss 0.73006510 throughput (samples/sec): 75.58 -2019-08-15 01:35:08,281 epoch 68 - iter 1860/3720 - loss 0.73174060 throughput (samples/sec): 76.45 -2019-08-15 01:37:49,065 epoch 68 - iter 2232/3720 - loss 0.73429225 throughput (samples/sec): 77.10 -2019-08-15 01:40:32,401 epoch 68 - iter 2604/3720 - loss 0.73327953 throughput (samples/sec): 76.05 -2019-08-15 01:43:16,714 epoch 68 - iter 2976/3720 - loss 0.73036007 throughput (samples/sec): 75.14 -2019-08-15 01:45:59,292 epoch 68 - iter 3348/3720 - loss 0.73032353 throughput (samples/sec): 75.96 -2019-08-15 01:48:42,887 ---------------------------------------------------------------------------------------------------- -2019-08-15 01:48:42,887 EPOCH 68 done: loss 0.7318 - lr 0.1000 -2019-08-15 01:48:42,888 BAD EPOCHS (no improvement): 2 -2019-08-15 01:48:42,888 ---------------------------------------------------------------------------------------------------- -2019-08-15 01:48:44,721 epoch 69 - iter 0/3720 - loss 0.57055688 throughput (samples/sec): 20567.90 -2019-08-15 01:51:31,678 epoch 69 - iter 372/3720 - loss 0.72734542 throughput (samples/sec): 74.45 -2019-08-15 01:54:15,084 epoch 69 - iter 744/3720 - loss 0.71460183 throughput (samples/sec): 75.57 -2019-08-15 01:57:00,147 epoch 69 - iter 1116/3720 - loss 0.72294163 throughput (samples/sec): 75.02 -2019-08-15 01:59:43,995 epoch 69 - iter 1488/3720 - loss 0.72427458 throughput (samples/sec): 75.80 -2019-08-15 02:02:29,087 epoch 69 - iter 1860/3720 - loss 0.72531735 throughput (samples/sec): 75.63 -2019-08-15 02:05:12,095 epoch 69 - iter 2232/3720 - loss 0.72807255 throughput (samples/sec): 75.89 -2019-08-15 02:07:53,268 epoch 69 - iter 2604/3720 - loss 0.72898052 throughput (samples/sec): 77.13 -2019-08-15 02:10:34,126 epoch 69 - iter 2976/3720 - loss 0.72987105 throughput (samples/sec): 76.51 -2019-08-15 02:13:17,368 epoch 69 - iter 3348/3720 - loss 0.73000897 throughput (samples/sec): 76.12 -2019-08-15 02:16:01,888 ---------------------------------------------------------------------------------------------------- -2019-08-15 02:16:01,889 EPOCH 69 done: loss 0.7306 - lr 0.1000 -2019-08-15 02:16:01,889 BAD EPOCHS (no improvement): 3 -2019-08-15 02:16:01,889 ---------------------------------------------------------------------------------------------------- -2019-08-15 02:16:03,814 epoch 70 - iter 0/3720 - loss 0.97699761 throughput (samples/sec): 18425.36 -2019-08-15 02:18:46,478 epoch 70 - iter 372/3720 - loss 0.70845860 throughput (samples/sec): 75.86 -2019-08-15 02:21:28,715 epoch 70 - iter 744/3720 - loss 0.71032953 throughput (samples/sec): 75.87 -2019-08-15 02:24:10,744 epoch 70 - iter 1116/3720 - loss 0.71447943 throughput (samples/sec): 76.43 -2019-08-15 02:26:55,204 epoch 70 - iter 1488/3720 - loss 0.71618417 throughput (samples/sec): 75.94 -2019-08-15 02:29:41,116 epoch 70 - iter 1860/3720 - loss 0.72085057 throughput (samples/sec): 75.03 -2019-08-15 02:32:25,554 epoch 70 - iter 2232/3720 - loss 0.71992998 throughput (samples/sec): 75.38 -2019-08-15 02:35:10,529 epoch 70 - iter 2604/3720 - loss 0.72028464 throughput (samples/sec): 75.42 -2019-08-15 02:37:52,344 epoch 70 - iter 2976/3720 - loss 0.72268211 throughput (samples/sec): 77.17 -2019-08-15 02:40:36,752 epoch 70 - iter 3348/3720 - loss 0.72653488 throughput (samples/sec): 75.34 -2019-08-15 02:43:19,012 ---------------------------------------------------------------------------------------------------- -2019-08-15 02:43:19,012 EPOCH 70 done: loss 0.7278 - lr 0.1000 -2019-08-15 02:43:19,012 BAD EPOCHS (no improvement): 0 -2019-08-15 02:43:19,012 ---------------------------------------------------------------------------------------------------- -2019-08-15 02:43:20,862 epoch 71 - iter 0/3720 - loss 0.53312159 throughput (samples/sec): 19862.51 -2019-08-15 02:46:03,991 epoch 71 - iter 372/3720 - loss 0.68086883 throughput (samples/sec): 76.58 -2019-08-15 02:48:48,128 epoch 71 - iter 744/3720 - loss 0.69431109 throughput (samples/sec): 75.90 -2019-08-15 02:51:32,226 epoch 71 - iter 1116/3720 - loss 0.71224295 throughput (samples/sec): 75.00 -2019-08-15 02:54:14,881 epoch 71 - iter 1488/3720 - loss 0.71512592 throughput (samples/sec): 75.38 -2019-08-15 02:56:55,867 epoch 71 - iter 1860/3720 - loss 0.72039237 throughput (samples/sec): 76.90 -2019-08-15 02:59:37,478 epoch 71 - iter 2232/3720 - loss 0.71872483 throughput (samples/sec): 76.40 -2019-08-15 03:02:21,129 epoch 71 - iter 2604/3720 - loss 0.72429349 throughput (samples/sec): 75.36 -2019-08-15 03:05:03,392 epoch 71 - iter 2976/3720 - loss 0.72168151 throughput (samples/sec): 76.56 -2019-08-15 03:07:50,560 epoch 71 - iter 3348/3720 - loss 0.72144655 throughput (samples/sec): 73.08 -2019-08-15 03:10:33,438 ---------------------------------------------------------------------------------------------------- -2019-08-15 03:10:33,439 EPOCH 71 done: loss 0.7229 - lr 0.1000 -2019-08-15 03:10:33,439 BAD EPOCHS (no improvement): 0 -2019-08-15 03:10:33,439 ---------------------------------------------------------------------------------------------------- -2019-08-15 03:10:35,178 epoch 72 - iter 0/3720 - loss 0.40853429 throughput (samples/sec): 23554.41 -2019-08-15 03:13:21,397 epoch 72 - iter 372/3720 - loss 0.71296803 throughput (samples/sec): 75.05 -2019-08-15 03:16:02,433 epoch 72 - iter 744/3720 - loss 0.71170126 throughput (samples/sec): 76.84 -2019-08-15 03:18:45,983 epoch 72 - iter 1116/3720 - loss 0.71463712 throughput (samples/sec): 76.57 -2019-08-15 03:21:28,359 epoch 72 - iter 1488/3720 - loss 0.71537863 throughput (samples/sec): 75.28 -2019-08-15 03:24:11,358 epoch 72 - iter 1860/3720 - loss 0.71696821 throughput (samples/sec): 76.23 -2019-08-15 03:26:55,292 epoch 72 - iter 2232/3720 - loss 0.71599127 throughput (samples/sec): 75.48 -2019-08-15 03:29:39,591 epoch 72 - iter 2604/3720 - loss 0.72146313 throughput (samples/sec): 75.11 -2019-08-15 03:32:21,803 epoch 72 - iter 2976/3720 - loss 0.72167216 throughput (samples/sec): 77.15 -2019-08-15 03:35:04,416 epoch 72 - iter 3348/3720 - loss 0.72258994 throughput (samples/sec): 76.43 -2019-08-15 03:37:47,613 ---------------------------------------------------------------------------------------------------- -2019-08-15 03:37:47,613 EPOCH 72 done: loss 0.7245 - lr 0.1000 -2019-08-15 03:37:47,613 BAD EPOCHS (no improvement): 1 -2019-08-15 03:37:47,614 ---------------------------------------------------------------------------------------------------- -2019-08-15 03:37:49,294 epoch 73 - iter 0/3720 - loss 1.01668167 throughput (samples/sec): 26542.08 -2019-08-15 03:40:34,891 epoch 73 - iter 372/3720 - loss 0.70263460 throughput (samples/sec): 74.77 -2019-08-15 03:43:21,047 epoch 73 - iter 744/3720 - loss 0.71070209 throughput (samples/sec): 74.39 -2019-08-15 03:46:02,782 epoch 73 - iter 1116/3720 - loss 0.72047758 throughput (samples/sec): 77.23 -2019-08-15 03:48:45,799 epoch 73 - iter 1488/3720 - loss 0.71563202 throughput (samples/sec): 76.31 -2019-08-15 03:51:27,011 epoch 73 - iter 1860/3720 - loss 0.71693005 throughput (samples/sec): 76.35 -2019-08-15 03:54:10,802 epoch 73 - iter 2232/3720 - loss 0.71710801 throughput (samples/sec): 76.37 -2019-08-15 03:56:55,901 epoch 73 - iter 2604/3720 - loss 0.71896015 throughput (samples/sec): 75.14 -2019-08-15 03:59:40,831 epoch 73 - iter 2976/3720 - loss 0.72367945 throughput (samples/sec): 75.10 -2019-08-15 04:02:23,487 epoch 73 - iter 3348/3720 - loss 0.72534895 throughput (samples/sec): 76.15 -2019-08-15 04:05:05,349 ---------------------------------------------------------------------------------------------------- -2019-08-15 04:05:05,349 EPOCH 73 done: loss 0.7245 - lr 0.1000 -2019-08-15 04:05:05,349 BAD EPOCHS (no improvement): 2 -2019-08-15 04:05:05,349 ---------------------------------------------------------------------------------------------------- -2019-08-15 04:05:07,114 epoch 74 - iter 0/3720 - loss 0.67168379 throughput (samples/sec): 21854.29 -2019-08-15 04:07:51,709 epoch 74 - iter 372/3720 - loss 0.70502705 throughput (samples/sec): 76.11 -2019-08-15 04:10:31,758 epoch 74 - iter 744/3720 - loss 0.70284704 throughput (samples/sec): 77.43 -2019-08-15 04:13:13,650 epoch 74 - iter 1116/3720 - loss 0.71386810 throughput (samples/sec): 76.77 -2019-08-15 04:15:55,467 epoch 74 - iter 1488/3720 - loss 0.72145716 throughput (samples/sec): 76.34 -2019-08-15 04:18:39,745 epoch 74 - iter 1860/3720 - loss 0.72396943 throughput (samples/sec): 75.41 -2019-08-15 04:21:24,043 epoch 74 - iter 2232/3720 - loss 0.72395768 throughput (samples/sec): 75.12 -2019-08-15 04:24:08,149 epoch 74 - iter 2604/3720 - loss 0.72496868 throughput (samples/sec): 75.51 -2019-08-15 04:26:49,271 epoch 74 - iter 2976/3720 - loss 0.72165204 throughput (samples/sec): 77.56 -2019-08-15 04:29:31,617 epoch 74 - iter 3348/3720 - loss 0.72267190 throughput (samples/sec): 76.39 -2019-08-15 04:32:13,662 ---------------------------------------------------------------------------------------------------- -2019-08-15 04:32:13,663 EPOCH 74 done: loss 0.7221 - lr 0.1000 -2019-08-15 04:32:13,663 BAD EPOCHS (no improvement): 0 -2019-08-15 04:32:13,663 ---------------------------------------------------------------------------------------------------- -2019-08-15 04:32:15,322 epoch 75 - iter 0/3720 - loss 0.84960723 throughput (samples/sec): 26459.01 -2019-08-15 04:34:59,521 epoch 75 - iter 372/3720 - loss 0.71652927 throughput (samples/sec): 75.41 -2019-08-15 04:37:41,936 epoch 75 - iter 744/3720 - loss 0.71393114 throughput (samples/sec): 76.44 -2019-08-15 04:40:24,954 epoch 75 - iter 1116/3720 - loss 0.71468260 throughput (samples/sec): 75.65 -2019-08-15 04:43:09,205 epoch 75 - iter 1488/3720 - loss 0.71450697 throughput (samples/sec): 74.88 -2019-08-15 04:45:53,382 epoch 75 - iter 1860/3720 - loss 0.71734949 throughput (samples/sec): 75.98 -2019-08-15 04:48:34,921 epoch 75 - iter 2232/3720 - loss 0.71510473 throughput (samples/sec): 76.60 -2019-08-15 04:51:16,729 epoch 75 - iter 2604/3720 - loss 0.71423974 throughput (samples/sec): 76.49 -2019-08-15 04:53:59,035 epoch 75 - iter 2976/3720 - loss 0.71413269 throughput (samples/sec): 75.74 -2019-08-15 04:56:41,420 epoch 75 - iter 3348/3720 - loss 0.71801581 throughput (samples/sec): 75.96 -2019-08-15 04:59:20,344 ---------------------------------------------------------------------------------------------------- -2019-08-15 04:59:20,344 EPOCH 75 done: loss 0.7187 - lr 0.1000 -2019-08-15 04:59:20,344 BAD EPOCHS (no improvement): 0 -2019-08-15 04:59:20,344 ---------------------------------------------------------------------------------------------------- -2019-08-15 04:59:22,183 epoch 76 - iter 0/3720 - loss 0.87450647 throughput (samples/sec): 19539.75 -2019-08-15 05:02:07,392 epoch 76 - iter 372/3720 - loss 0.68854967 throughput (samples/sec): 75.68 -2019-08-15 05:04:50,287 epoch 76 - iter 744/3720 - loss 0.70348101 throughput (samples/sec): 76.63 -2019-08-15 05:07:30,853 epoch 76 - iter 1116/3720 - loss 0.70430096 throughput (samples/sec): 77.89 -2019-08-15 05:10:11,753 epoch 76 - iter 1488/3720 - loss 0.70855042 throughput (samples/sec): 77.07 -2019-08-15 05:12:54,191 epoch 76 - iter 1860/3720 - loss 0.71257842 throughput (samples/sec): 76.36 -2019-08-15 05:15:37,557 epoch 76 - iter 2232/3720 - loss 0.71623783 throughput (samples/sec): 75.93 -2019-08-15 05:18:22,732 epoch 76 - iter 2604/3720 - loss 0.72027613 throughput (samples/sec): 75.08 -2019-08-15 05:21:08,796 epoch 76 - iter 2976/3720 - loss 0.72262447 throughput (samples/sec): 74.79 -2019-08-15 05:23:52,011 epoch 76 - iter 3348/3720 - loss 0.72023026 throughput (samples/sec): 76.23 -2019-08-15 05:26:37,511 ---------------------------------------------------------------------------------------------------- -2019-08-15 05:26:37,511 EPOCH 76 done: loss 0.7230 - lr 0.1000 -2019-08-15 05:26:37,511 BAD EPOCHS (no improvement): 1 -2019-08-15 05:26:37,512 ---------------------------------------------------------------------------------------------------- -2019-08-15 05:26:39,232 epoch 77 - iter 0/3720 - loss 0.52319741 throughput (samples/sec): 23352.40 -2019-08-15 05:29:21,675 epoch 77 - iter 372/3720 - loss 0.71583633 throughput (samples/sec): 76.16 -2019-08-15 05:32:05,303 epoch 77 - iter 744/3720 - loss 0.71254326 throughput (samples/sec): 76.31 -2019-08-15 05:34:47,816 epoch 77 - iter 1116/3720 - loss 0.71629789 throughput (samples/sec): 75.95 -2019-08-15 05:37:32,859 epoch 77 - iter 1488/3720 - loss 0.71531216 throughput (samples/sec): 75.25 -2019-08-15 05:40:15,170 epoch 77 - iter 1860/3720 - loss 0.71335654 throughput (samples/sec): 75.75 -2019-08-15 05:42:57,713 epoch 77 - iter 2232/3720 - loss 0.71539711 throughput (samples/sec): 76.37 -2019-08-15 05:45:39,956 epoch 77 - iter 2604/3720 - loss 0.71539725 throughput (samples/sec): 76.54 -2019-08-15 05:48:22,430 epoch 77 - iter 2976/3720 - loss 0.71572561 throughput (samples/sec): 75.67 -2019-08-15 05:51:04,496 epoch 77 - iter 3348/3720 - loss 0.71707533 throughput (samples/sec): 75.88 -2019-08-15 05:53:49,131 ---------------------------------------------------------------------------------------------------- -2019-08-15 05:53:49,131 EPOCH 77 done: loss 0.7192 - lr 0.1000 -2019-08-15 05:53:49,131 BAD EPOCHS (no improvement): 2 -2019-08-15 05:53:49,132 ---------------------------------------------------------------------------------------------------- -2019-08-15 05:53:50,962 epoch 78 - iter 0/3720 - loss 0.97095966 throughput (samples/sec): 20609.26 -2019-08-15 05:56:35,608 epoch 78 - iter 372/3720 - loss 0.73151890 throughput (samples/sec): 75.82 -2019-08-15 05:59:18,956 epoch 78 - iter 744/3720 - loss 0.72853587 throughput (samples/sec): 76.37 -2019-08-15 06:02:03,159 epoch 78 - iter 1116/3720 - loss 0.73047497 throughput (samples/sec): 74.92 -2019-08-15 06:04:45,146 epoch 78 - iter 1488/3720 - loss 0.72710424 throughput (samples/sec): 75.74 -2019-08-15 06:07:28,599 epoch 78 - iter 1860/3720 - loss 0.72542390 throughput (samples/sec): 75.55 -2019-08-15 06:10:10,266 epoch 78 - iter 2232/3720 - loss 0.72400651 throughput (samples/sec): 77.07 -2019-08-15 06:12:52,101 epoch 78 - iter 2604/3720 - loss 0.72071700 throughput (samples/sec): 76.22 -2019-08-15 06:15:33,194 epoch 78 - iter 2976/3720 - loss 0.71757029 throughput (samples/sec): 76.34 -2019-08-15 06:18:16,394 epoch 78 - iter 3348/3720 - loss 0.71722795 throughput (samples/sec): 75.63 -2019-08-15 06:20:59,860 ---------------------------------------------------------------------------------------------------- -2019-08-15 06:20:59,860 EPOCH 78 done: loss 0.7190 - lr 0.1000 -2019-08-15 06:20:59,860 BAD EPOCHS (no improvement): 3 -2019-08-15 06:20:59,860 ---------------------------------------------------------------------------------------------------- -2019-08-15 06:21:01,656 epoch 79 - iter 0/3720 - loss 0.54581165 throughput (samples/sec): 21264.34 -2019-08-15 06:23:44,914 epoch 79 - iter 372/3720 - loss 0.68827411 throughput (samples/sec): 75.96 -2019-08-15 06:26:30,442 epoch 79 - iter 744/3720 - loss 0.69388890 throughput (samples/sec): 74.95 -2019-08-15 06:29:11,896 epoch 79 - iter 1116/3720 - loss 0.70319973 throughput (samples/sec): 77.26 -2019-08-15 06:31:57,059 epoch 79 - iter 1488/3720 - loss 0.70832690 throughput (samples/sec): 75.16 -2019-08-15 06:34:40,432 epoch 79 - iter 1860/3720 - loss 0.70641430 throughput (samples/sec): 76.10 -2019-08-15 06:37:26,014 epoch 79 - iter 2232/3720 - loss 0.70745979 throughput (samples/sec): 75.01 -2019-08-15 06:40:09,389 epoch 79 - iter 2604/3720 - loss 0.70879405 throughput (samples/sec): 75.90 -2019-08-15 06:42:51,843 epoch 79 - iter 2976/3720 - loss 0.71328096 throughput (samples/sec): 76.05 -2019-08-15 06:45:35,117 epoch 79 - iter 3348/3720 - loss 0.71352927 throughput (samples/sec): 76.16 -2019-08-15 06:48:18,389 ---------------------------------------------------------------------------------------------------- -2019-08-15 06:48:18,390 EPOCH 79 done: loss 0.7167 - lr 0.1000 -2019-08-15 06:48:18,390 BAD EPOCHS (no improvement): 0 -2019-08-15 06:48:18,390 ---------------------------------------------------------------------------------------------------- -2019-08-15 06:48:20,204 epoch 80 - iter 0/3720 - loss 1.34681654 throughput (samples/sec): 20757.17 -2019-08-15 06:51:01,871 epoch 80 - iter 372/3720 - loss 0.71983846 throughput (samples/sec): 77.08 -2019-08-15 06:53:44,055 epoch 80 - iter 744/3720 - loss 0.71534590 throughput (samples/sec): 76.99 -2019-08-15 06:56:24,785 epoch 80 - iter 1116/3720 - loss 0.71601787 throughput (samples/sec): 77.18 -2019-08-15 06:59:04,403 epoch 80 - iter 1488/3720 - loss 0.71458852 throughput (samples/sec): 78.54 -2019-08-15 07:01:46,283 epoch 80 - iter 1860/3720 - loss 0.72151747 throughput (samples/sec): 76.75 -2019-08-15 07:04:31,175 epoch 80 - iter 2232/3720 - loss 0.71984675 throughput (samples/sec): 75.51 -2019-08-15 07:07:14,738 epoch 80 - iter 2604/3720 - loss 0.71869264 throughput (samples/sec): 75.61 -2019-08-15 07:09:56,980 epoch 80 - iter 2976/3720 - loss 0.71889504 throughput (samples/sec): 75.77 -2019-08-15 07:12:39,419 epoch 80 - iter 3348/3720 - loss 0.71922591 throughput (samples/sec): 76.74 -2019-08-15 07:15:22,799 ---------------------------------------------------------------------------------------------------- -2019-08-15 07:15:22,800 EPOCH 80 done: loss 0.7171 - lr 0.1000 -2019-08-15 07:15:22,800 BAD EPOCHS (no improvement): 1 -2019-08-15 07:15:22,800 ---------------------------------------------------------------------------------------------------- -2019-08-15 07:15:24,513 epoch 81 - iter 0/3720 - loss 0.39379978 throughput (samples/sec): 24755.38 -2019-08-15 07:18:07,050 epoch 81 - iter 372/3720 - loss 0.74374821 throughput (samples/sec): 76.82 -2019-08-15 07:20:49,091 epoch 81 - iter 744/3720 - loss 0.72158863 throughput (samples/sec): 76.70 -2019-08-15 07:23:33,651 epoch 81 - iter 1116/3720 - loss 0.72504865 throughput (samples/sec): 75.01 -2019-08-15 07:26:17,674 epoch 81 - iter 1488/3720 - loss 0.71647176 throughput (samples/sec): 75.51 -2019-08-15 07:29:02,835 epoch 81 - iter 1860/3720 - loss 0.71379372 throughput (samples/sec): 75.25 -2019-08-15 07:31:47,124 epoch 81 - iter 2232/3720 - loss 0.71409927 throughput (samples/sec): 75.30 -2019-08-15 07:34:30,674 epoch 81 - iter 2604/3720 - loss 0.71473264 throughput (samples/sec): 75.41 -2019-08-15 07:37:14,612 epoch 81 - iter 2976/3720 - loss 0.71694004 throughput (samples/sec): 75.91 -2019-08-15 07:39:58,013 epoch 81 - iter 3348/3720 - loss 0.71819758 throughput (samples/sec): 75.95 -2019-08-15 07:42:42,442 ---------------------------------------------------------------------------------------------------- -2019-08-15 07:42:42,443 EPOCH 81 done: loss 0.7201 - lr 0.1000 -2019-08-15 07:42:42,443 BAD EPOCHS (no improvement): 2 -2019-08-15 07:42:42,443 ---------------------------------------------------------------------------------------------------- -2019-08-15 07:42:44,431 epoch 82 - iter 0/3720 - loss 1.17524791 throughput (samples/sec): 15472.25 -2019-08-15 07:45:27,863 epoch 82 - iter 372/3720 - loss 0.70881768 throughput (samples/sec): 76.34 -2019-08-15 07:48:10,445 epoch 82 - iter 744/3720 - loss 0.71449206 throughput (samples/sec): 76.47 -2019-08-15 07:50:52,159 epoch 82 - iter 1116/3720 - loss 0.71133143 throughput (samples/sec): 76.31 -2019-08-15 07:53:37,238 epoch 82 - iter 1488/3720 - loss 0.71113557 throughput (samples/sec): 75.28 -2019-08-15 07:56:19,905 epoch 82 - iter 1860/3720 - loss 0.71583577 throughput (samples/sec): 76.38 -2019-08-15 07:59:02,293 epoch 82 - iter 2232/3720 - loss 0.71294326 throughput (samples/sec): 76.54 -2019-08-15 08:01:46,967 epoch 82 - iter 2604/3720 - loss 0.71000824 throughput (samples/sec): 75.17 -2019-08-15 08:04:30,774 epoch 82 - iter 2976/3720 - loss 0.71203944 throughput (samples/sec): 75.60 -2019-08-15 08:07:13,887 epoch 82 - iter 3348/3720 - loss 0.71309405 throughput (samples/sec): 75.71 -2019-08-15 08:09:56,305 ---------------------------------------------------------------------------------------------------- -2019-08-15 08:09:56,305 EPOCH 82 done: loss 0.7161 - lr 0.1000 -2019-08-15 08:09:56,305 BAD EPOCHS (no improvement): 0 -2019-08-15 08:09:56,306 ---------------------------------------------------------------------------------------------------- -2019-08-15 08:09:58,063 epoch 83 - iter 0/3720 - loss 0.47900760 throughput (samples/sec): 22416.92 -2019-08-15 08:12:43,439 epoch 83 - iter 372/3720 - loss 0.69056693 throughput (samples/sec): 75.38 -2019-08-15 08:15:26,418 epoch 83 - iter 744/3720 - loss 0.68401196 throughput (samples/sec): 76.36 -2019-08-15 08:18:13,124 epoch 83 - iter 1116/3720 - loss 0.69711455 throughput (samples/sec): 74.64 -2019-08-15 08:20:55,299 epoch 83 - iter 1488/3720 - loss 0.69848398 throughput (samples/sec): 75.48 -2019-08-15 08:23:38,996 epoch 83 - iter 1860/3720 - loss 0.70625398 throughput (samples/sec): 76.01 -2019-08-15 08:26:21,621 epoch 83 - iter 2232/3720 - loss 0.71175847 throughput (samples/sec): 76.52 -2019-08-15 08:29:06,650 epoch 83 - iter 2604/3720 - loss 0.71315146 throughput (samples/sec): 75.52 -2019-08-15 08:31:49,028 epoch 83 - iter 2976/3720 - loss 0.71186003 throughput (samples/sec): 76.06 -2019-08-15 08:34:31,404 epoch 83 - iter 3348/3720 - loss 0.71244067 throughput (samples/sec): 76.30 -2019-08-15 08:37:12,221 ---------------------------------------------------------------------------------------------------- -2019-08-15 08:37:12,221 EPOCH 83 done: loss 0.7155 - lr 0.1000 -2019-08-15 08:37:12,221 BAD EPOCHS (no improvement): 0 -2019-08-15 08:37:12,221 ---------------------------------------------------------------------------------------------------- -2019-08-15 08:37:14,859 epoch 84 - iter 0/3720 - loss 0.79604387 throughput (samples/sec): 26615.75 -2019-08-15 08:39:57,170 epoch 84 - iter 372/3720 - loss 0.69947158 throughput (samples/sec): 76.89 -2019-08-15 08:42:39,447 epoch 84 - iter 744/3720 - loss 0.68920619 throughput (samples/sec): 76.38 -2019-08-15 08:45:24,778 epoch 84 - iter 1116/3720 - loss 0.69616719 throughput (samples/sec): 74.80 -2019-08-15 08:48:07,320 epoch 84 - iter 1488/3720 - loss 0.69967011 throughput (samples/sec): 75.88 -2019-08-15 08:50:48,332 epoch 84 - iter 1860/3720 - loss 0.70326130 throughput (samples/sec): 76.90 -2019-08-15 08:53:32,567 epoch 84 - iter 2232/3720 - loss 0.70575530 throughput (samples/sec): 75.69 -2019-08-15 08:56:18,199 epoch 84 - iter 2604/3720 - loss 0.70827250 throughput (samples/sec): 74.72 -2019-08-15 08:58:59,678 epoch 84 - iter 2976/3720 - loss 0.70836913 throughput (samples/sec): 77.00 -2019-08-15 09:01:46,405 epoch 84 - iter 3348/3720 - loss 0.70765945 throughput (samples/sec): 74.55 -2019-08-15 09:04:30,003 ---------------------------------------------------------------------------------------------------- -2019-08-15 09:04:30,004 EPOCH 84 done: loss 0.7102 - lr 0.1000 -2019-08-15 09:04:30,004 BAD EPOCHS (no improvement): 0 -2019-08-15 09:04:30,004 ---------------------------------------------------------------------------------------------------- -2019-08-15 09:04:31,760 epoch 85 - iter 0/3720 - loss 1.04851484 throughput (samples/sec): 21752.62 -2019-08-15 09:07:16,977 epoch 85 - iter 372/3720 - loss 0.68933940 throughput (samples/sec): 75.44 -2019-08-15 09:10:00,302 epoch 85 - iter 744/3720 - loss 0.68677650 throughput (samples/sec): 75.84 -2019-08-15 09:12:41,129 epoch 85 - iter 1116/3720 - loss 0.69379703 throughput (samples/sec): 77.26 -2019-08-15 09:15:26,305 epoch 85 - iter 1488/3720 - loss 0.69705130 throughput (samples/sec): 74.71 -2019-08-15 09:18:06,181 epoch 85 - iter 1860/3720 - loss 0.70090496 throughput (samples/sec): 76.94 -2019-08-15 09:20:46,179 epoch 85 - iter 2232/3720 - loss 0.70292175 throughput (samples/sec): 77.44 -2019-08-15 09:23:28,857 epoch 85 - iter 2604/3720 - loss 0.70599916 throughput (samples/sec): 75.89 -2019-08-15 09:26:11,513 epoch 85 - iter 2976/3720 - loss 0.70623089 throughput (samples/sec): 76.13 -2019-08-15 09:28:54,064 epoch 85 - iter 3348/3720 - loss 0.70744431 throughput (samples/sec): 76.13 -2019-08-15 09:31:35,233 ---------------------------------------------------------------------------------------------------- -2019-08-15 09:31:35,233 EPOCH 85 done: loss 0.7111 - lr 0.1000 -2019-08-15 09:31:35,233 BAD EPOCHS (no improvement): 1 -2019-08-15 09:31:35,233 ---------------------------------------------------------------------------------------------------- -2019-08-15 09:31:36,970 epoch 86 - iter 0/3720 - loss 0.59926081 throughput (samples/sec): 23991.90 -2019-08-15 09:34:24,464 epoch 86 - iter 372/3720 - loss 0.67925644 throughput (samples/sec): 74.58 -2019-08-15 09:37:06,840 epoch 86 - iter 744/3720 - loss 0.69237543 throughput (samples/sec): 76.98 -2019-08-15 09:39:49,809 epoch 86 - iter 1116/3720 - loss 0.70589843 throughput (samples/sec): 75.27 -2019-08-15 09:42:33,734 epoch 86 - iter 1488/3720 - loss 0.70206745 throughput (samples/sec): 76.08 -2019-08-15 09:45:16,693 epoch 86 - iter 1860/3720 - loss 0.69944569 throughput (samples/sec): 76.30 -2019-08-15 09:47:59,208 epoch 86 - iter 2232/3720 - loss 0.70114293 throughput (samples/sec): 76.79 -2019-08-15 09:50:43,378 epoch 86 - iter 2604/3720 - loss 0.70259871 throughput (samples/sec): 75.73 -2019-08-15 09:53:25,082 epoch 86 - iter 2976/3720 - loss 0.70381558 throughput (samples/sec): 76.59 -2019-08-15 09:56:10,321 epoch 86 - iter 3348/3720 - loss 0.70828687 throughput (samples/sec): 74.86 -2019-08-15 09:58:51,895 ---------------------------------------------------------------------------------------------------- -2019-08-15 09:58:51,895 EPOCH 86 done: loss 0.7095 - lr 0.1000 -2019-08-15 09:58:51,895 BAD EPOCHS (no improvement): 0 -2019-08-15 09:58:51,896 ---------------------------------------------------------------------------------------------------- -2019-08-15 09:58:53,809 epoch 87 - iter 0/3720 - loss 0.64586198 throughput (samples/sec): 17257.59 -2019-08-15 10:01:39,109 epoch 87 - iter 372/3720 - loss 0.72373479 throughput (samples/sec): 75.08 -2019-08-15 10:04:24,280 epoch 87 - iter 744/3720 - loss 0.71417689 throughput (samples/sec): 74.62 -2019-08-15 10:07:10,359 epoch 87 - iter 1116/3720 - loss 0.71381881 throughput (samples/sec): 75.46 -2019-08-15 10:09:55,066 epoch 87 - iter 1488/3720 - loss 0.71484314 throughput (samples/sec): 75.28 -2019-08-15 10:12:38,177 epoch 87 - iter 1860/3720 - loss 0.71553585 throughput (samples/sec): 76.02 -2019-08-15 10:15:23,093 epoch 87 - iter 2232/3720 - loss 0.71716088 throughput (samples/sec): 74.94 -2019-08-15 10:18:08,134 epoch 87 - iter 2604/3720 - loss 0.71587155 throughput (samples/sec): 75.60 -2019-08-15 10:20:54,701 epoch 87 - iter 2976/3720 - loss 0.71455893 throughput (samples/sec): 74.11 -2019-08-15 10:23:37,852 epoch 87 - iter 3348/3720 - loss 0.71655961 throughput (samples/sec): 75.75 -2019-08-15 10:26:24,409 ---------------------------------------------------------------------------------------------------- -2019-08-15 10:26:24,410 EPOCH 87 done: loss 0.7139 - lr 0.1000 -2019-08-15 10:26:24,410 BAD EPOCHS (no improvement): 1 -2019-08-15 10:26:24,410 ---------------------------------------------------------------------------------------------------- -2019-08-15 10:26:27,111 epoch 88 - iter 0/3720 - loss 0.49761629 throughput (samples/sec): 25767.01 -2019-08-15 10:29:10,743 epoch 88 - iter 372/3720 - loss 0.70082877 throughput (samples/sec): 75.66 -2019-08-15 10:31:53,139 epoch 88 - iter 744/3720 - loss 0.70259585 throughput (samples/sec): 75.82 -2019-08-15 10:34:37,683 epoch 88 - iter 1116/3720 - loss 0.71057055 throughput (samples/sec): 75.59 -2019-08-15 10:37:18,805 epoch 88 - iter 1488/3720 - loss 0.71126708 throughput (samples/sec): 76.53 -2019-08-15 10:40:03,781 epoch 88 - iter 1860/3720 - loss 0.71237696 throughput (samples/sec): 75.01 -2019-08-15 10:42:46,044 epoch 88 - iter 2232/3720 - loss 0.71301907 throughput (samples/sec): 76.09 -2019-08-15 10:45:29,130 epoch 88 - iter 2604/3720 - loss 0.71401924 throughput (samples/sec): 76.35 -2019-08-15 10:48:13,363 epoch 88 - iter 2976/3720 - loss 0.71401680 throughput (samples/sec): 75.38 -2019-08-15 10:50:55,740 epoch 88 - iter 3348/3720 - loss 0.71652158 throughput (samples/sec): 76.53 -2019-08-15 10:53:37,522 ---------------------------------------------------------------------------------------------------- -2019-08-15 10:53:37,522 EPOCH 88 done: loss 0.7165 - lr 0.1000 -2019-08-15 10:53:37,522 BAD EPOCHS (no improvement): 2 -2019-08-15 10:53:37,522 ---------------------------------------------------------------------------------------------------- -2019-08-15 10:53:39,283 epoch 89 - iter 0/3720 - loss 1.21095634 throughput (samples/sec): 22379.86 -2019-08-15 10:56:25,124 epoch 89 - iter 372/3720 - loss 0.69631875 throughput (samples/sec): 75.58 -2019-08-15 10:59:05,971 epoch 89 - iter 744/3720 - loss 0.69787559 throughput (samples/sec): 76.83 -2019-08-15 11:01:47,429 epoch 89 - iter 1116/3720 - loss 0.70622424 throughput (samples/sec): 77.46 -2019-08-15 11:04:30,693 epoch 89 - iter 1488/3720 - loss 0.70424365 throughput (samples/sec): 76.07 -2019-08-15 11:07:13,966 epoch 89 - iter 1860/3720 - loss 0.70365037 throughput (samples/sec): 76.09 -2019-08-15 11:09:56,968 epoch 89 - iter 2232/3720 - loss 0.70647564 throughput (samples/sec): 76.29 -2019-08-15 11:12:38,676 epoch 89 - iter 2604/3720 - loss 0.71037065 throughput (samples/sec): 76.02 -2019-08-15 11:15:22,715 epoch 89 - iter 2976/3720 - loss 0.70962950 throughput (samples/sec): 75.73 -2019-08-15 11:18:07,655 epoch 89 - iter 3348/3720 - loss 0.71011431 throughput (samples/sec): 74.79 -2019-08-15 11:20:48,510 ---------------------------------------------------------------------------------------------------- -2019-08-15 11:20:48,510 EPOCH 89 done: loss 0.7107 - lr 0.1000 -2019-08-15 11:20:48,510 BAD EPOCHS (no improvement): 3 -2019-08-15 11:20:48,510 ---------------------------------------------------------------------------------------------------- -2019-08-15 11:20:50,252 epoch 90 - iter 0/3720 - loss 0.63048029 throughput (samples/sec): 23207.70 -2019-08-15 11:23:31,574 epoch 90 - iter 372/3720 - loss 0.69213680 throughput (samples/sec): 77.01 -2019-08-15 11:26:16,566 epoch 90 - iter 744/3720 - loss 0.69593750 throughput (samples/sec): 74.86 -2019-08-15 11:29:00,168 epoch 90 - iter 1116/3720 - loss 0.69884459 throughput (samples/sec): 76.32 -2019-08-15 11:31:43,980 epoch 90 - iter 1488/3720 - loss 0.70703582 throughput (samples/sec): 76.28 -2019-08-15 11:34:29,153 epoch 90 - iter 1860/3720 - loss 0.71135421 throughput (samples/sec): 75.39 -2019-08-15 11:37:12,852 epoch 90 - iter 2232/3720 - loss 0.71268124 throughput (samples/sec): 76.08 -2019-08-15 11:39:54,687 epoch 90 - iter 2604/3720 - loss 0.71307644 throughput (samples/sec): 77.02 -2019-08-15 11:42:38,448 epoch 90 - iter 2976/3720 - loss 0.71470457 throughput (samples/sec): 75.74 -2019-08-15 11:45:21,089 epoch 90 - iter 3348/3720 - loss 0.71586859 throughput (samples/sec): 76.84 -2019-08-15 11:48:04,454 ---------------------------------------------------------------------------------------------------- -2019-08-15 11:48:04,455 EPOCH 90 done: loss 0.7134 - lr 0.1000 -2019-08-15 11:48:04,455 BAD EPOCHS (no improvement): 4 -2019-08-15 11:48:04,455 ---------------------------------------------------------------------------------------------------- -2019-08-15 11:48:06,214 epoch 91 - iter 0/3720 - loss 0.49616086 throughput (samples/sec): 24371.09 -2019-08-15 11:50:48,683 epoch 91 - iter 372/3720 - loss 0.67276427 throughput (samples/sec): 76.58 -2019-08-15 11:53:29,991 epoch 91 - iter 744/3720 - loss 0.66631579 throughput (samples/sec): 77.74 -2019-08-15 11:56:11,923 epoch 91 - iter 1116/3720 - loss 0.67888678 throughput (samples/sec): 76.50 -2019-08-15 11:58:55,536 epoch 91 - iter 1488/3720 - loss 0.67353506 throughput (samples/sec): 75.46 -2019-08-15 12:01:38,144 epoch 91 - iter 1860/3720 - loss 0.67393512 throughput (samples/sec): 75.51 -2019-08-15 12:04:20,108 epoch 91 - iter 2232/3720 - loss 0.67502196 throughput (samples/sec): 76.60 -2019-08-15 12:07:01,377 epoch 91 - iter 2604/3720 - loss 0.67667188 throughput (samples/sec): 76.90 -2019-08-15 12:09:43,721 epoch 91 - iter 2976/3720 - loss 0.67674436 throughput (samples/sec): 76.65 -2019-08-15 12:12:24,817 epoch 91 - iter 3348/3720 - loss 0.67568441 throughput (samples/sec): 77.26 -2019-08-15 12:15:04,909 ---------------------------------------------------------------------------------------------------- -2019-08-15 12:15:04,910 EPOCH 91 done: loss 0.6728 - lr 0.0500 -2019-08-15 12:15:04,910 BAD EPOCHS (no improvement): 0 -2019-08-15 12:15:04,910 ---------------------------------------------------------------------------------------------------- -2019-08-15 12:15:06,782 epoch 92 - iter 0/3720 - loss 0.39718634 throughput (samples/sec): 18577.93 -2019-08-15 12:17:49,964 epoch 92 - iter 372/3720 - loss 0.67530175 throughput (samples/sec): 75.83 -2019-08-15 12:20:34,174 epoch 92 - iter 744/3720 - loss 0.66614103 throughput (samples/sec): 75.84 -2019-08-15 12:23:16,239 epoch 92 - iter 1116/3720 - loss 0.66604268 throughput (samples/sec): 76.48 -2019-08-15 12:26:00,173 epoch 92 - iter 1488/3720 - loss 0.66534981 throughput (samples/sec): 75.50 -2019-08-15 12:28:43,583 epoch 92 - iter 1860/3720 - loss 0.65883827 throughput (samples/sec): 75.48 -2019-08-15 12:31:24,738 epoch 92 - iter 2232/3720 - loss 0.65952887 throughput (samples/sec): 77.31 -2019-08-15 12:34:07,118 epoch 92 - iter 2604/3720 - loss 0.65772248 throughput (samples/sec): 76.54 -2019-08-15 12:36:49,730 epoch 92 - iter 2976/3720 - loss 0.66022477 throughput (samples/sec): 76.48 -2019-08-15 12:39:31,805 epoch 92 - iter 3348/3720 - loss 0.65835097 throughput (samples/sec): 76.71 -2019-08-15 12:42:15,465 ---------------------------------------------------------------------------------------------------- -2019-08-15 12:42:15,465 EPOCH 92 done: loss 0.6581 - lr 0.0500 -2019-08-15 12:42:15,465 BAD EPOCHS (no improvement): 0 -2019-08-15 12:42:15,465 ---------------------------------------------------------------------------------------------------- -2019-08-15 12:42:17,439 epoch 93 - iter 0/3720 - loss 1.09071684 throughput (samples/sec): 15992.46 -2019-08-15 12:45:01,882 epoch 93 - iter 372/3720 - loss 0.65859486 throughput (samples/sec): 75.53 -2019-08-15 12:47:44,055 epoch 93 - iter 744/3720 - loss 0.66256201 throughput (samples/sec): 76.67 -2019-08-15 12:50:27,783 epoch 93 - iter 1116/3720 - loss 0.65954278 throughput (samples/sec): 75.63 -2019-08-15 12:53:13,470 epoch 93 - iter 1488/3720 - loss 0.65372360 throughput (samples/sec): 74.81 -2019-08-15 12:55:58,808 epoch 93 - iter 1860/3720 - loss 0.65663737 throughput (samples/sec): 75.13 -2019-08-15 12:58:42,249 epoch 93 - iter 2232/3720 - loss 0.65242910 throughput (samples/sec): 76.19 -2019-08-15 13:01:26,385 epoch 93 - iter 2604/3720 - loss 0.65140102 throughput (samples/sec): 75.87 -2019-08-15 13:04:11,148 epoch 93 - iter 2976/3720 - loss 0.64991429 throughput (samples/sec): 75.35 -2019-08-15 13:06:58,390 epoch 93 - iter 3348/3720 - loss 0.65157121 throughput (samples/sec): 74.22 -2019-08-15 13:09:39,492 ---------------------------------------------------------------------------------------------------- -2019-08-15 13:09:39,493 EPOCH 93 done: loss 0.6506 - lr 0.0500 -2019-08-15 13:09:39,493 BAD EPOCHS (no improvement): 0 -2019-08-15 13:09:39,493 ---------------------------------------------------------------------------------------------------- -2019-08-15 13:09:41,329 epoch 94 - iter 0/3720 - loss 1.00084543 throughput (samples/sec): 19950.96 -2019-08-15 13:12:25,957 epoch 94 - iter 372/3720 - loss 0.62551682 throughput (samples/sec): 75.26 -2019-08-15 13:15:08,102 epoch 94 - iter 744/3720 - loss 0.63496570 throughput (samples/sec): 76.99 -2019-08-15 13:17:51,914 epoch 94 - iter 1116/3720 - loss 0.63428354 throughput (samples/sec): 75.37 -2019-08-15 13:20:35,855 epoch 94 - iter 1488/3720 - loss 0.64017830 throughput (samples/sec): 75.76 -2019-08-15 13:23:20,396 epoch 94 - iter 1860/3720 - loss 0.64151697 throughput (samples/sec): 75.48 -2019-08-15 13:26:02,019 epoch 94 - iter 2232/3720 - loss 0.64507035 throughput (samples/sec): 77.18 -2019-08-15 13:28:44,792 epoch 94 - iter 2604/3720 - loss 0.64439664 throughput (samples/sec): 76.40 -2019-08-15 13:31:28,265 epoch 94 - iter 2976/3720 - loss 0.64545096 throughput (samples/sec): 76.30 -2019-08-15 13:34:10,181 epoch 94 - iter 3348/3720 - loss 0.64639107 throughput (samples/sec): 76.21 -2019-08-15 13:36:55,423 ---------------------------------------------------------------------------------------------------- -2019-08-15 13:36:55,424 EPOCH 94 done: loss 0.6460 - lr 0.0500 -2019-08-15 13:36:55,424 BAD EPOCHS (no improvement): 0 -2019-08-15 13:36:55,424 ---------------------------------------------------------------------------------------------------- -2019-08-15 13:36:57,213 epoch 95 - iter 0/3720 - loss 0.55233073 throughput (samples/sec): 21130.19 -2019-08-15 13:39:39,636 epoch 95 - iter 372/3720 - loss 0.63800182 throughput (samples/sec): 76.55 -2019-08-15 13:42:21,745 epoch 95 - iter 744/3720 - loss 0.64091769 throughput (samples/sec): 77.03 -2019-08-15 13:45:01,542 epoch 95 - iter 1116/3720 - loss 0.64148922 throughput (samples/sec): 76.96 -2019-08-15 13:47:44,375 epoch 95 - iter 1488/3720 - loss 0.63801494 throughput (samples/sec): 76.56 -2019-08-15 13:50:25,981 epoch 95 - iter 1860/3720 - loss 0.63944375 throughput (samples/sec): 76.72 -2019-08-15 13:53:08,050 epoch 95 - iter 2232/3720 - loss 0.63940173 throughput (samples/sec): 77.15 -2019-08-15 13:55:47,989 epoch 95 - iter 2604/3720 - loss 0.64117580 throughput (samples/sec): 77.23 -2019-08-15 13:58:28,924 epoch 95 - iter 2976/3720 - loss 0.64273247 throughput (samples/sec): 77.52 -2019-08-15 14:01:10,735 epoch 95 - iter 3348/3720 - loss 0.64274266 throughput (samples/sec): 77.24 -2019-08-15 14:03:53,994 ---------------------------------------------------------------------------------------------------- -2019-08-15 14:03:53,995 EPOCH 95 done: loss 0.6413 - lr 0.0500 -2019-08-15 14:03:53,995 BAD EPOCHS (no improvement): 0 -2019-08-15 14:03:53,995 ---------------------------------------------------------------------------------------------------- -2019-08-15 14:03:55,709 epoch 96 - iter 0/3720 - loss 0.42119169 throughput (samples/sec): 23783.91 -2019-08-15 14:06:38,565 epoch 96 - iter 372/3720 - loss 0.62577714 throughput (samples/sec): 76.23 -2019-08-15 14:09:24,091 epoch 96 - iter 744/3720 - loss 0.61780517 throughput (samples/sec): 75.22 -2019-08-15 14:12:09,219 epoch 96 - iter 1116/3720 - loss 0.62529063 throughput (samples/sec): 75.08 -2019-08-15 14:14:54,769 epoch 96 - iter 1488/3720 - loss 0.62640795 throughput (samples/sec): 75.12 -2019-08-15 14:17:37,138 epoch 96 - iter 1860/3720 - loss 0.62769568 throughput (samples/sec): 75.64 -2019-08-15 14:20:21,747 epoch 96 - iter 2232/3720 - loss 0.62664363 throughput (samples/sec): 74.83 -2019-08-15 14:23:08,783 epoch 96 - iter 2604/3720 - loss 0.62868551 throughput (samples/sec): 74.46 -2019-08-15 14:25:54,262 epoch 96 - iter 2976/3720 - loss 0.63070080 throughput (samples/sec): 74.96 -2019-08-15 14:28:38,192 epoch 96 - iter 3348/3720 - loss 0.63070599 throughput (samples/sec): 75.82 -2019-08-15 14:31:18,711 ---------------------------------------------------------------------------------------------------- -2019-08-15 14:31:18,711 EPOCH 96 done: loss 0.6308 - lr 0.0500 -2019-08-15 14:31:18,711 BAD EPOCHS (no improvement): 0 -2019-08-15 14:31:18,711 ---------------------------------------------------------------------------------------------------- -2019-08-15 14:31:20,445 epoch 97 - iter 0/3720 - loss 0.45479202 throughput (samples/sec): 22924.22 -2019-08-15 14:34:05,063 epoch 97 - iter 372/3720 - loss 0.64063845 throughput (samples/sec): 75.57 -2019-08-15 14:36:47,516 epoch 97 - iter 744/3720 - loss 0.63489159 throughput (samples/sec): 75.72 -2019-08-15 14:39:30,298 epoch 97 - iter 1116/3720 - loss 0.63447781 throughput (samples/sec): 75.77 -2019-08-15 14:42:12,896 epoch 97 - iter 1488/3720 - loss 0.63035372 throughput (samples/sec): 76.11 -2019-08-15 14:44:54,645 epoch 97 - iter 1860/3720 - loss 0.63191040 throughput (samples/sec): 76.81 -2019-08-15 14:47:38,361 epoch 97 - iter 2232/3720 - loss 0.63127765 throughput (samples/sec): 76.18 -2019-08-15 14:50:22,852 epoch 97 - iter 2604/3720 - loss 0.63028821 throughput (samples/sec): 75.23 -2019-08-15 14:53:07,120 epoch 97 - iter 2976/3720 - loss 0.62950294 throughput (samples/sec): 75.62 -2019-08-15 14:55:48,840 epoch 97 - iter 3348/3720 - loss 0.62849805 throughput (samples/sec): 76.77 -2019-08-15 14:58:28,719 ---------------------------------------------------------------------------------------------------- -2019-08-15 14:58:28,720 EPOCH 97 done: loss 0.6308 - lr 0.0500 -2019-08-15 14:58:28,720 BAD EPOCHS (no improvement): 1 -2019-08-15 14:58:28,720 ---------------------------------------------------------------------------------------------------- -2019-08-15 14:58:30,447 epoch 98 - iter 0/3720 - loss 0.62233019 throughput (samples/sec): 24589.70 -2019-08-15 15:01:11,944 epoch 98 - iter 372/3720 - loss 0.64372592 throughput (samples/sec): 77.07 -2019-08-15 15:03:53,559 epoch 98 - iter 744/3720 - loss 0.62826146 throughput (samples/sec): 76.66 -2019-08-15 15:06:37,710 epoch 98 - iter 1116/3720 - loss 0.61668310 throughput (samples/sec): 75.62 -2019-08-15 15:09:19,776 epoch 98 - iter 1488/3720 - loss 0.62476347 throughput (samples/sec): 76.67 -2019-08-15 15:12:03,552 epoch 98 - iter 1860/3720 - loss 0.62283315 throughput (samples/sec): 75.81 -2019-08-15 15:14:49,447 epoch 98 - iter 2232/3720 - loss 0.62418568 throughput (samples/sec): 74.87 -2019-08-15 15:17:31,210 epoch 98 - iter 2604/3720 - loss 0.62312362 throughput (samples/sec): 76.54 -2019-08-15 15:20:13,858 epoch 98 - iter 2976/3720 - loss 0.62438885 throughput (samples/sec): 75.86 -2019-08-15 15:22:54,700 epoch 98 - iter 3348/3720 - loss 0.62598018 throughput (samples/sec): 77.00 -2019-08-15 15:25:36,170 ---------------------------------------------------------------------------------------------------- -2019-08-15 15:25:36,170 EPOCH 98 done: loss 0.6290 - lr 0.0500 -2019-08-15 15:25:36,170 BAD EPOCHS (no improvement): 0 -2019-08-15 15:25:36,171 ---------------------------------------------------------------------------------------------------- -2019-08-15 15:25:37,944 epoch 99 - iter 0/3720 - loss 1.45279622 throughput (samples/sec): 21265.61 -2019-08-15 15:28:21,393 epoch 99 - iter 372/3720 - loss 0.61880012 throughput (samples/sec): 75.98 -2019-08-15 15:31:02,832 epoch 99 - iter 744/3720 - loss 0.61726374 throughput (samples/sec): 77.19 -2019-08-15 15:33:47,652 epoch 99 - iter 1116/3720 - loss 0.61193990 throughput (samples/sec): 75.35 -2019-08-15 15:36:31,796 epoch 99 - iter 1488/3720 - loss 0.61393909 throughput (samples/sec): 75.52 -2019-08-15 15:39:13,994 epoch 99 - iter 1860/3720 - loss 0.61321433 throughput (samples/sec): 76.36 -2019-08-15 15:41:55,607 epoch 99 - iter 2232/3720 - loss 0.61665175 throughput (samples/sec): 76.34 -2019-08-15 15:44:37,373 epoch 99 - iter 2604/3720 - loss 0.61896207 throughput (samples/sec): 76.52 -2019-08-15 15:47:19,209 epoch 99 - iter 2976/3720 - loss 0.61902363 throughput (samples/sec): 76.24 -2019-08-15 15:50:01,877 epoch 99 - iter 3348/3720 - loss 0.61904724 throughput (samples/sec): 75.59 -2019-08-15 15:52:47,679 ---------------------------------------------------------------------------------------------------- -2019-08-15 15:52:47,680 EPOCH 99 done: loss 0.6215 - lr 0.0500 -2019-08-15 15:52:47,680 BAD EPOCHS (no improvement): 0 -2019-08-15 15:52:47,680 ---------------------------------------------------------------------------------------------------- -2019-08-15 15:52:49,443 epoch 100 - iter 0/3720 - loss 0.54642630 throughput (samples/sec): 24541.17 -2019-08-15 15:55:32,568 epoch 100 - iter 372/3720 - loss 0.61056836 throughput (samples/sec): 76.29 -2019-08-15 15:58:15,024 epoch 100 - iter 744/3720 - loss 0.61241410 throughput (samples/sec): 76.08 -2019-08-15 16:00:57,834 epoch 100 - iter 1116/3720 - loss 0.61404895 throughput (samples/sec): 76.41 -2019-08-15 16:03:39,600 epoch 100 - iter 1488/3720 - loss 0.61525729 throughput (samples/sec): 76.77 -2019-08-15 16:06:21,514 epoch 100 - iter 1860/3720 - loss 0.61654127 throughput (samples/sec): 76.91 -2019-08-15 16:09:02,986 epoch 100 - iter 2232/3720 - loss 0.61950030 throughput (samples/sec): 76.81 -2019-08-15 16:11:45,323 epoch 100 - iter 2604/3720 - loss 0.62108938 throughput (samples/sec): 76.37 -2019-08-15 16:14:26,196 epoch 100 - iter 2976/3720 - loss 0.62416983 throughput (samples/sec): 77.40 -2019-08-15 16:17:07,905 epoch 100 - iter 3348/3720 - loss 0.62407691 throughput (samples/sec): 76.99 -2019-08-15 16:19:49,657 ---------------------------------------------------------------------------------------------------- -2019-08-15 16:19:49,657 EPOCH 100 done: loss 0.6227 - lr 0.0500 -2019-08-15 16:19:49,658 BAD EPOCHS (no improvement): 1 -2019-08-15 16:19:49,658 ---------------------------------------------------------------------------------------------------- -2019-08-15 16:19:51,424 epoch 101 - iter 0/3720 - loss 0.65780997 throughput (samples/sec): 22230.39 -2019-08-15 16:22:38,072 epoch 101 - iter 372/3720 - loss 0.61123396 throughput (samples/sec): 75.12 -2019-08-15 16:25:18,765 epoch 101 - iter 744/3720 - loss 0.61567542 throughput (samples/sec): 77.92 -2019-08-15 16:28:00,441 epoch 101 - iter 1116/3720 - loss 0.62212683 throughput (samples/sec): 77.45 -2019-08-15 16:30:41,605 epoch 101 - iter 1488/3720 - loss 0.62188442 throughput (samples/sec): 76.94 -2019-08-15 16:33:23,290 epoch 101 - iter 1860/3720 - loss 0.61791660 throughput (samples/sec): 77.40 -2019-08-15 16:36:07,277 epoch 101 - iter 2232/3720 - loss 0.61719855 throughput (samples/sec): 75.55 -2019-08-15 16:38:49,841 epoch 101 - iter 2604/3720 - loss 0.61359046 throughput (samples/sec): 76.77 -2019-08-15 16:41:32,382 epoch 101 - iter 2976/3720 - loss 0.61565532 throughput (samples/sec): 76.75 -2019-08-15 16:44:15,543 epoch 101 - iter 3348/3720 - loss 0.61401280 throughput (samples/sec): 76.73 -2019-08-15 16:46:56,225 ---------------------------------------------------------------------------------------------------- -2019-08-15 16:46:56,225 EPOCH 101 done: loss 0.6151 - lr 0.0500 -2019-08-15 16:46:56,225 BAD EPOCHS (no improvement): 0 -2019-08-15 16:46:56,226 ---------------------------------------------------------------------------------------------------- -2019-08-15 16:46:57,930 epoch 102 - iter 0/3720 - loss 0.42971063 throughput (samples/sec): 24247.62 -2019-08-15 16:49:44,117 epoch 102 - iter 372/3720 - loss 0.61023064 throughput (samples/sec): 74.98 -2019-08-15 16:52:27,577 epoch 102 - iter 744/3720 - loss 0.60729476 throughput (samples/sec): 76.10 -2019-08-15 16:55:09,070 epoch 102 - iter 1116/3720 - loss 0.61372550 throughput (samples/sec): 77.29 -2019-08-15 16:57:52,679 epoch 102 - iter 1488/3720 - loss 0.61079615 throughput (samples/sec): 75.92 -2019-08-15 17:00:35,804 epoch 102 - iter 1860/3720 - loss 0.61463909 throughput (samples/sec): 75.86 -2019-08-15 17:03:19,998 epoch 102 - iter 2232/3720 - loss 0.61448224 throughput (samples/sec): 75.60 -2019-08-15 17:06:03,352 epoch 102 - iter 2604/3720 - loss 0.61627213 throughput (samples/sec): 75.25 -2019-08-15 17:08:45,467 epoch 102 - iter 2976/3720 - loss 0.61430747 throughput (samples/sec): 76.35 -2019-08-15 17:11:30,621 epoch 102 - iter 3348/3720 - loss 0.61617906 throughput (samples/sec): 75.19 -2019-08-15 17:14:15,251 ---------------------------------------------------------------------------------------------------- -2019-08-15 17:14:15,251 EPOCH 102 done: loss 0.6159 - lr 0.0500 -2019-08-15 17:14:15,251 BAD EPOCHS (no improvement): 1 -2019-08-15 17:14:15,251 ---------------------------------------------------------------------------------------------------- -2019-08-15 17:14:17,030 epoch 103 - iter 0/3720 - loss 0.67080927 throughput (samples/sec): 21136.46 -2019-08-15 17:17:01,361 epoch 103 - iter 372/3720 - loss 0.59975937 throughput (samples/sec): 75.37 -2019-08-15 17:19:43,823 epoch 103 - iter 744/3720 - loss 0.60953414 throughput (samples/sec): 76.35 -2019-08-15 17:22:27,348 epoch 103 - iter 1116/3720 - loss 0.60603285 throughput (samples/sec): 75.99 -2019-08-15 17:25:13,320 epoch 103 - iter 1488/3720 - loss 0.61922883 throughput (samples/sec): 74.32 -2019-08-15 17:27:58,382 epoch 103 - iter 1860/3720 - loss 0.62008388 throughput (samples/sec): 75.20 -2019-08-15 17:30:44,846 epoch 103 - iter 2232/3720 - loss 0.61872820 throughput (samples/sec): 74.60 -2019-08-15 17:33:28,352 epoch 103 - iter 2604/3720 - loss 0.61705110 throughput (samples/sec): 74.99 -2019-08-15 17:36:12,301 epoch 103 - iter 2976/3720 - loss 0.61775754 throughput (samples/sec): 75.32 -2019-08-15 17:38:54,702 epoch 103 - iter 3348/3720 - loss 0.61733405 throughput (samples/sec): 76.77 -2019-08-15 17:41:38,421 ---------------------------------------------------------------------------------------------------- -2019-08-15 17:41:38,421 EPOCH 103 done: loss 0.6192 - lr 0.0500 -2019-08-15 17:41:38,421 BAD EPOCHS (no improvement): 2 -2019-08-15 17:41:38,421 ---------------------------------------------------------------------------------------------------- -2019-08-15 17:41:40,113 epoch 104 - iter 0/3720 - loss 0.27204943 throughput (samples/sec): 25208.92 -2019-08-15 17:44:23,826 epoch 104 - iter 372/3720 - loss 0.62765215 throughput (samples/sec): 75.53 -2019-08-15 17:47:08,884 epoch 104 - iter 744/3720 - loss 0.61095222 throughput (samples/sec): 75.11 -2019-08-15 17:49:51,049 epoch 104 - iter 1116/3720 - loss 0.61002849 throughput (samples/sec): 76.33 -2019-08-15 17:52:33,684 epoch 104 - iter 1488/3720 - loss 0.61629461 throughput (samples/sec): 76.20 -2019-08-15 17:55:16,152 epoch 104 - iter 1860/3720 - loss 0.61757004 throughput (samples/sec): 75.80 -2019-08-15 17:57:56,628 epoch 104 - iter 2232/3720 - loss 0.61756313 throughput (samples/sec): 77.50 -2019-08-15 18:00:42,952 epoch 104 - iter 2604/3720 - loss 0.61514988 throughput (samples/sec): 74.66 -2019-08-15 18:03:26,669 epoch 104 - iter 2976/3720 - loss 0.61333382 throughput (samples/sec): 75.35 -2019-08-15 18:06:09,296 epoch 104 - iter 3348/3720 - loss 0.61346646 throughput (samples/sec): 76.68 -2019-08-15 18:08:52,374 ---------------------------------------------------------------------------------------------------- -2019-08-15 18:08:52,374 EPOCH 104 done: loss 0.6121 - lr 0.0500 -2019-08-15 18:08:52,375 BAD EPOCHS (no improvement): 0 -2019-08-15 18:08:52,375 ---------------------------------------------------------------------------------------------------- -2019-08-15 18:08:54,161 epoch 105 - iter 0/3720 - loss 0.68123388 throughput (samples/sec): 21915.36 -2019-08-15 18:11:36,989 epoch 105 - iter 372/3720 - loss 0.62446579 throughput (samples/sec): 76.15 -2019-08-15 18:14:19,808 epoch 105 - iter 744/3720 - loss 0.61425018 throughput (samples/sec): 75.82 -2019-08-15 18:17:01,434 epoch 105 - iter 1116/3720 - loss 0.61481906 throughput (samples/sec): 77.20 -2019-08-15 18:19:42,983 epoch 105 - iter 1488/3720 - loss 0.60925369 throughput (samples/sec): 76.35 -2019-08-15 18:22:25,549 epoch 105 - iter 1860/3720 - loss 0.61138140 throughput (samples/sec): 76.15 -2019-08-15 18:25:08,114 epoch 105 - iter 2232/3720 - loss 0.61135585 throughput (samples/sec): 76.14 -2019-08-15 18:27:49,104 epoch 105 - iter 2604/3720 - loss 0.61108508 throughput (samples/sec): 77.26 -2019-08-15 18:30:31,354 epoch 105 - iter 2976/3720 - loss 0.60951046 throughput (samples/sec): 76.34 -2019-08-15 18:33:14,419 epoch 105 - iter 3348/3720 - loss 0.60904241 throughput (samples/sec): 75.43 -2019-08-15 18:35:57,037 ---------------------------------------------------------------------------------------------------- -2019-08-15 18:35:57,038 EPOCH 105 done: loss 0.6113 - lr 0.0500 -2019-08-15 18:35:57,038 BAD EPOCHS (no improvement): 0 -2019-08-15 18:35:57,038 ---------------------------------------------------------------------------------------------------- -2019-08-15 18:35:58,867 epoch 106 - iter 0/3720 - loss 0.62008142 throughput (samples/sec): 21646.67 -2019-08-15 18:38:42,708 epoch 106 - iter 372/3720 - loss 0.60260119 throughput (samples/sec): 75.94 -2019-08-15 18:41:24,726 epoch 106 - iter 744/3720 - loss 0.60465597 throughput (samples/sec): 76.84 -2019-08-15 18:44:05,261 epoch 106 - iter 1116/3720 - loss 0.60509169 throughput (samples/sec): 77.22 -2019-08-15 18:46:48,298 epoch 106 - iter 1488/3720 - loss 0.60674448 throughput (samples/sec): 75.46 -2019-08-15 18:49:33,420 epoch 106 - iter 1860/3720 - loss 0.60638386 throughput (samples/sec): 75.53 -2019-08-15 18:52:16,975 epoch 106 - iter 2232/3720 - loss 0.60688622 throughput (samples/sec): 76.05 -2019-08-15 18:54:57,681 epoch 106 - iter 2604/3720 - loss 0.60534770 throughput (samples/sec): 77.82 -2019-08-15 18:57:43,540 epoch 106 - iter 2976/3720 - loss 0.60630924 throughput (samples/sec): 75.31 -2019-08-15 19:01:04,432 epoch 106 - iter 3348/3720 - loss 0.60565243 throughput (samples/sec): 61.66 -2019-08-15 19:05:12,598 ---------------------------------------------------------------------------------------------------- -2019-08-15 19:05:12,599 EPOCH 106 done: loss 0.6053 - lr 0.0500 -2019-08-15 19:05:12,599 BAD EPOCHS (no improvement): 0 -2019-08-15 19:05:12,599 ---------------------------------------------------------------------------------------------------- -2019-08-15 19:05:14,615 epoch 107 - iter 0/3720 - loss 0.71445060 throughput (samples/sec): 15840.57 -2019-08-15 19:08:47,842 epoch 107 - iter 372/3720 - loss 0.60664396 throughput (samples/sec): 57.92 -2019-08-15 19:12:19,641 epoch 107 - iter 744/3720 - loss 0.60306316 throughput (samples/sec): 57.67 -2019-08-15 19:15:49,627 epoch 107 - iter 1116/3720 - loss 0.61462703 throughput (samples/sec): 58.33 -2019-08-15 19:19:22,435 epoch 107 - iter 1488/3720 - loss 0.61029595 throughput (samples/sec): 57.69 -2019-08-15 19:22:53,519 epoch 107 - iter 1860/3720 - loss 0.60924841 throughput (samples/sec): 58.20 -2019-08-15 19:26:27,644 epoch 107 - iter 2232/3720 - loss 0.61053323 throughput (samples/sec): 57.41 -2019-08-15 19:30:00,627 epoch 107 - iter 2604/3720 - loss 0.61071950 throughput (samples/sec): 57.49 -2019-08-15 19:33:34,416 epoch 107 - iter 2976/3720 - loss 0.60977944 throughput (samples/sec): 57.27 -2019-08-15 19:37:04,844 epoch 107 - iter 3348/3720 - loss 0.60928349 throughput (samples/sec): 58.37 -2019-08-15 19:40:35,598 ---------------------------------------------------------------------------------------------------- -2019-08-15 19:40:35,598 EPOCH 107 done: loss 0.6075 - lr 0.0500 -2019-08-15 19:40:35,598 BAD EPOCHS (no improvement): 1 -2019-08-15 19:40:35,599 ---------------------------------------------------------------------------------------------------- -2019-08-15 19:40:37,542 epoch 108 - iter 0/3720 - loss 0.48963618 throughput (samples/sec): 20426.45 -2019-08-15 19:44:08,945 epoch 108 - iter 372/3720 - loss 0.60048250 throughput (samples/sec): 58.19 -2019-08-15 19:47:37,388 epoch 108 - iter 744/3720 - loss 0.60919600 throughput (samples/sec): 58.50 -2019-08-15 19:51:08,243 epoch 108 - iter 1116/3720 - loss 0.61194809 throughput (samples/sec): 58.65 -2019-08-15 19:54:46,574 epoch 108 - iter 1488/3720 - loss 0.61508866 throughput (samples/sec): 56.16 -2019-08-15 19:58:17,471 epoch 108 - iter 1860/3720 - loss 0.61112373 throughput (samples/sec): 58.50 -2019-08-15 20:01:48,740 epoch 108 - iter 2232/3720 - loss 0.60941393 throughput (samples/sec): 58.05 -2019-08-15 20:05:17,998 epoch 108 - iter 2604/3720 - loss 0.61006349 throughput (samples/sec): 59.09 -2019-08-15 20:08:49,878 epoch 108 - iter 2976/3720 - loss 0.61159763 throughput (samples/sec): 58.09 -2019-08-15 20:12:23,001 epoch 108 - iter 3348/3720 - loss 0.61223164 throughput (samples/sec): 57.72 -2019-08-15 20:15:53,950 ---------------------------------------------------------------------------------------------------- -2019-08-15 20:15:53,950 EPOCH 108 done: loss 0.6124 - lr 0.0500 -2019-08-15 20:15:53,950 BAD EPOCHS (no improvement): 2 -2019-08-15 20:15:53,951 ---------------------------------------------------------------------------------------------------- -2019-08-15 20:15:55,846 epoch 109 - iter 0/3720 - loss 0.72649646 throughput (samples/sec): 17940.69 -2019-08-15 20:19:27,841 epoch 109 - iter 372/3720 - loss 0.59107875 throughput (samples/sec): 58.07 -2019-08-15 20:22:58,459 epoch 109 - iter 744/3720 - loss 0.59994461 throughput (samples/sec): 58.46 -2019-08-15 20:26:31,063 epoch 109 - iter 1116/3720 - loss 0.59782128 throughput (samples/sec): 58.09 -2019-08-15 20:30:04,268 epoch 109 - iter 1488/3720 - loss 0.59496026 throughput (samples/sec): 57.55 -2019-08-15 20:33:36,080 epoch 109 - iter 1860/3720 - loss 0.60085362 throughput (samples/sec): 57.72 -2019-08-15 20:37:07,035 epoch 109 - iter 2232/3720 - loss 0.60059297 throughput (samples/sec): 58.37 -2019-08-15 20:40:41,995 epoch 109 - iter 2604/3720 - loss 0.60027673 throughput (samples/sec): 57.21 -2019-08-15 20:44:13,355 epoch 109 - iter 2976/3720 - loss 0.59948289 throughput (samples/sec): 57.96 -2019-08-15 20:47:42,575 epoch 109 - iter 3348/3720 - loss 0.60185795 throughput (samples/sec): 58.89 -2019-08-15 20:51:14,168 ---------------------------------------------------------------------------------------------------- -2019-08-15 20:51:14,169 EPOCH 109 done: loss 0.6022 - lr 0.0500 -2019-08-15 20:51:14,169 BAD EPOCHS (no improvement): 0 -2019-08-15 20:51:14,169 ---------------------------------------------------------------------------------------------------- -2019-08-15 20:51:16,135 epoch 110 - iter 0/3720 - loss 0.87439907 throughput (samples/sec): 17278.50 -2019-08-15 20:54:47,274 epoch 110 - iter 372/3720 - loss 0.58362177 throughput (samples/sec): 58.92 -2019-08-15 20:58:21,468 epoch 110 - iter 744/3720 - loss 0.59336081 throughput (samples/sec): 57.08 -2019-08-15 21:01:52,850 epoch 110 - iter 1116/3720 - loss 0.59067641 throughput (samples/sec): 58.44 -2019-08-15 21:05:20,694 epoch 110 - iter 1488/3720 - loss 0.58923213 throughput (samples/sec): 59.23 -2019-08-15 21:08:54,917 epoch 110 - iter 1860/3720 - loss 0.59166240 throughput (samples/sec): 57.28 -2019-08-15 21:12:25,823 epoch 110 - iter 2232/3720 - loss 0.59461911 throughput (samples/sec): 58.21 -2019-08-15 21:15:56,443 epoch 110 - iter 2604/3720 - loss 0.59645312 throughput (samples/sec): 58.75 -2019-08-15 21:19:24,992 epoch 110 - iter 2976/3720 - loss 0.59799170 throughput (samples/sec): 59.01 -2019-08-15 21:23:01,028 epoch 110 - iter 3348/3720 - loss 0.59922152 throughput (samples/sec): 56.53 -2019-08-15 21:26:30,216 ---------------------------------------------------------------------------------------------------- -2019-08-15 21:26:30,216 EPOCH 110 done: loss 0.6012 - lr 0.0500 -2019-08-15 21:26:30,216 BAD EPOCHS (no improvement): 0 -2019-08-15 21:26:30,217 ---------------------------------------------------------------------------------------------------- -2019-08-15 21:26:32,157 epoch 111 - iter 0/3720 - loss 0.69870114 throughput (samples/sec): 16973.91 -2019-08-15 21:30:00,337 epoch 111 - iter 372/3720 - loss 0.60781592 throughput (samples/sec): 59.05 -2019-08-15 21:33:30,073 epoch 111 - iter 744/3720 - loss 0.59957324 throughput (samples/sec): 58.27 -2019-08-15 21:37:02,569 epoch 111 - iter 1116/3720 - loss 0.60380243 throughput (samples/sec): 58.12 -2019-08-15 21:40:31,856 epoch 111 - iter 1488/3720 - loss 0.60436290 throughput (samples/sec): 58.81 -2019-08-15 21:44:03,929 epoch 111 - iter 1860/3720 - loss 0.60221944 throughput (samples/sec): 57.93 -2019-08-15 21:47:35,926 epoch 111 - iter 2232/3720 - loss 0.60074389 throughput (samples/sec): 57.98 -2019-08-15 21:51:09,504 epoch 111 - iter 2604/3720 - loss 0.59895805 throughput (samples/sec): 57.53 -2019-08-15 21:54:40,527 epoch 111 - iter 2976/3720 - loss 0.59816125 throughput (samples/sec): 57.88 -2019-08-15 21:58:11,718 epoch 111 - iter 3348/3720 - loss 0.60199199 throughput (samples/sec): 58.36 -2019-08-15 22:01:42,670 ---------------------------------------------------------------------------------------------------- -2019-08-15 22:01:42,671 EPOCH 111 done: loss 0.6025 - lr 0.0500 -2019-08-15 22:01:42,671 BAD EPOCHS (no improvement): 1 -2019-08-15 22:01:42,671 ---------------------------------------------------------------------------------------------------- -2019-08-15 22:01:44,413 epoch 112 - iter 0/3720 - loss 0.51906109 throughput (samples/sec): 22587.04 -2019-08-15 22:05:16,377 epoch 112 - iter 372/3720 - loss 0.61510789 throughput (samples/sec): 57.83 -2019-08-15 22:08:45,628 epoch 112 - iter 744/3720 - loss 0.59874256 throughput (samples/sec): 58.66 -2019-08-15 22:12:18,939 epoch 112 - iter 1116/3720 - loss 0.60495522 throughput (samples/sec): 57.71 -2019-08-15 22:15:51,966 epoch 112 - iter 1488/3720 - loss 0.60260079 throughput (samples/sec): 57.78 -2019-08-15 22:19:29,426 epoch 112 - iter 1860/3720 - loss 0.59668091 throughput (samples/sec): 56.55 -2019-08-15 22:23:00,420 epoch 112 - iter 2232/3720 - loss 0.59595975 throughput (samples/sec): 58.06 -2019-08-15 22:26:32,414 epoch 112 - iter 2604/3720 - loss 0.59589281 throughput (samples/sec): 58.10 -2019-08-15 22:30:03,589 epoch 112 - iter 2976/3720 - loss 0.59935996 throughput (samples/sec): 58.31 -2019-08-15 22:33:33,970 epoch 112 - iter 3348/3720 - loss 0.59971808 throughput (samples/sec): 58.51 -2019-08-15 22:37:06,130 ---------------------------------------------------------------------------------------------------- -2019-08-15 22:37:06,131 EPOCH 112 done: loss 0.5994 - lr 0.0500 -2019-08-15 22:37:06,131 BAD EPOCHS (no improvement): 0 -2019-08-15 22:37:06,131 ---------------------------------------------------------------------------------------------------- -2019-08-15 22:37:07,887 epoch 113 - iter 0/3720 - loss 0.79381442 throughput (samples/sec): 23108.67 -2019-08-15 22:40:40,839 epoch 113 - iter 372/3720 - loss 0.58832858 throughput (samples/sec): 57.56 -2019-08-15 22:44:15,246 epoch 113 - iter 744/3720 - loss 0.59491492 throughput (samples/sec): 57.58 -2019-08-15 22:47:48,314 epoch 113 - iter 1116/3720 - loss 0.58867298 throughput (samples/sec): 57.81 -2019-08-15 22:51:18,257 epoch 113 - iter 1488/3720 - loss 0.59123104 throughput (samples/sec): 58.06 -2019-08-15 22:54:50,736 epoch 113 - iter 1860/3720 - loss 0.59420772 throughput (samples/sec): 58.08 -2019-08-15 22:58:22,365 epoch 113 - iter 2232/3720 - loss 0.59578527 throughput (samples/sec): 58.20 -2019-08-15 23:01:53,448 epoch 113 - iter 2604/3720 - loss 0.59661703 throughput (samples/sec): 58.08 -2019-08-15 23:05:25,208 epoch 113 - iter 2976/3720 - loss 0.59753241 throughput (samples/sec): 58.18 -2019-08-15 23:08:54,722 epoch 113 - iter 3348/3720 - loss 0.59621738 throughput (samples/sec): 59.01 -2019-08-15 23:12:26,792 ---------------------------------------------------------------------------------------------------- -2019-08-15 23:12:26,792 EPOCH 113 done: loss 0.5977 - lr 0.0500 -2019-08-15 23:12:26,792 BAD EPOCHS (no improvement): 0 -2019-08-15 23:12:26,792 ---------------------------------------------------------------------------------------------------- -2019-08-15 23:12:28,963 epoch 114 - iter 0/3720 - loss 0.44020462 throughput (samples/sec): 13328.63 -2019-08-15 23:15:59,855 epoch 114 - iter 372/3720 - loss 0.60498466 throughput (samples/sec): 58.62 -2019-08-15 23:19:31,646 epoch 114 - iter 744/3720 - loss 0.60049461 throughput (samples/sec): 57.99 -2019-08-15 23:23:01,018 epoch 114 - iter 1116/3720 - loss 0.60048319 throughput (samples/sec): 59.01 -2019-08-15 23:26:34,159 epoch 114 - iter 1488/3720 - loss 0.59521566 throughput (samples/sec): 57.66 -2019-08-15 23:30:00,767 epoch 114 - iter 1860/3720 - loss 0.59132477 throughput (samples/sec): 59.56 -2019-08-15 23:33:30,973 epoch 114 - iter 2232/3720 - loss 0.59224300 throughput (samples/sec): 58.50 -2019-08-15 23:36:59,338 epoch 114 - iter 2604/3720 - loss 0.59297217 throughput (samples/sec): 58.84 -2019-08-15 23:40:28,979 epoch 114 - iter 2976/3720 - loss 0.59424697 throughput (samples/sec): 58.76 -2019-08-15 23:44:02,089 epoch 114 - iter 3348/3720 - loss 0.59695058 throughput (samples/sec): 57.50 -2019-08-15 23:47:29,427 ---------------------------------------------------------------------------------------------------- -2019-08-15 23:47:29,427 EPOCH 114 done: loss 0.5972 - lr 0.0500 -2019-08-15 23:47:29,428 BAD EPOCHS (no improvement): 0 -2019-08-15 23:47:29,428 ---------------------------------------------------------------------------------------------------- -2019-08-15 23:47:31,434 epoch 115 - iter 0/3720 - loss 0.97544169 throughput (samples/sec): 15924.48 -2019-08-15 23:51:03,535 epoch 115 - iter 372/3720 - loss 0.58414099 throughput (samples/sec): 57.62 -2019-08-15 23:54:33,747 epoch 115 - iter 744/3720 - loss 0.58193530 throughput (samples/sec): 58.76 -2019-08-15 23:58:04,817 epoch 115 - iter 1116/3720 - loss 0.59084904 throughput (samples/sec): 58.37 -2019-08-16 00:01:36,881 epoch 115 - iter 1488/3720 - loss 0.59764592 throughput (samples/sec): 58.38 -2019-08-16 00:05:06,003 epoch 115 - iter 1860/3720 - loss 0.59529739 throughput (samples/sec): 58.25 -2019-08-16 00:08:35,223 epoch 115 - iter 2232/3720 - loss 0.59698760 throughput (samples/sec): 58.76 -2019-08-16 00:12:06,203 epoch 115 - iter 2604/3720 - loss 0.59775992 throughput (samples/sec): 58.50 -2019-08-16 00:15:37,324 epoch 115 - iter 2976/3720 - loss 0.59571867 throughput (samples/sec): 58.18 -2019-08-16 00:19:08,555 epoch 115 - iter 3348/3720 - loss 0.59520768 throughput (samples/sec): 58.04 -2019-08-16 00:22:36,381 ---------------------------------------------------------------------------------------------------- -2019-08-16 00:22:36,381 EPOCH 115 done: loss 0.5954 - lr 0.0500 -2019-08-16 00:22:36,381 BAD EPOCHS (no improvement): 0 -2019-08-16 00:22:36,381 ---------------------------------------------------------------------------------------------------- -2019-08-16 00:22:38,359 epoch 116 - iter 0/3720 - loss 0.59288645 throughput (samples/sec): 16458.81 -2019-08-16 00:26:08,819 epoch 116 - iter 372/3720 - loss 0.60542850 throughput (samples/sec): 58.22 -2019-08-16 00:29:40,845 epoch 116 - iter 744/3720 - loss 0.60701289 throughput (samples/sec): 58.11 -2019-08-16 00:33:11,786 epoch 116 - iter 1116/3720 - loss 0.59363126 throughput (samples/sec): 58.39 -2019-08-16 00:36:43,968 epoch 116 - iter 1488/3720 - loss 0.59582190 throughput (samples/sec): 57.98 -2019-08-16 00:40:16,466 epoch 116 - iter 1860/3720 - loss 0.59733874 throughput (samples/sec): 58.20 -2019-08-16 00:43:46,425 epoch 116 - iter 2232/3720 - loss 0.59626696 throughput (samples/sec): 58.54 -2019-08-16 00:47:16,524 epoch 116 - iter 2604/3720 - loss 0.59534390 throughput (samples/sec): 58.61 -2019-08-16 00:50:46,371 epoch 116 - iter 2976/3720 - loss 0.59540787 throughput (samples/sec): 58.83 -2019-08-16 00:54:19,132 epoch 116 - iter 3348/3720 - loss 0.59477717 throughput (samples/sec): 57.72 -2019-08-16 00:57:45,574 ---------------------------------------------------------------------------------------------------- -2019-08-16 00:57:45,575 EPOCH 116 done: loss 0.5940 - lr 0.0500 -2019-08-16 00:57:45,575 BAD EPOCHS (no improvement): 0 -2019-08-16 00:57:45,575 ---------------------------------------------------------------------------------------------------- -2019-08-16 00:57:47,563 epoch 117 - iter 0/3720 - loss 0.47679782 throughput (samples/sec): 17009.00 -2019-08-16 01:01:15,913 epoch 117 - iter 372/3720 - loss 0.58075638 throughput (samples/sec): 59.03 -2019-08-16 01:04:43,890 epoch 117 - iter 744/3720 - loss 0.58662185 throughput (samples/sec): 59.09 -2019-08-16 01:08:17,343 epoch 117 - iter 1116/3720 - loss 0.58428279 throughput (samples/sec): 57.66 -2019-08-16 01:11:48,330 epoch 117 - iter 1488/3720 - loss 0.59216672 throughput (samples/sec): 58.38 -2019-08-16 01:15:18,264 epoch 117 - iter 1860/3720 - loss 0.58883462 throughput (samples/sec): 58.68 -2019-08-16 01:18:48,676 epoch 117 - iter 2232/3720 - loss 0.59325335 throughput (samples/sec): 58.54 -2019-08-16 01:22:19,702 epoch 117 - iter 2604/3720 - loss 0.59182810 throughput (samples/sec): 58.41 -2019-08-16 01:25:52,066 epoch 117 - iter 2976/3720 - loss 0.59188577 throughput (samples/sec): 58.15 -2019-08-16 01:29:25,013 epoch 117 - iter 3348/3720 - loss 0.59390123 throughput (samples/sec): 57.53 -2019-08-16 01:32:57,349 ---------------------------------------------------------------------------------------------------- -2019-08-16 01:32:57,350 EPOCH 117 done: loss 0.5965 - lr 0.0500 -2019-08-16 01:32:57,350 BAD EPOCHS (no improvement): 1 -2019-08-16 01:32:57,350 ---------------------------------------------------------------------------------------------------- -2019-08-16 01:32:59,253 epoch 118 - iter 0/3720 - loss 0.58392191 throughput (samples/sec): 18582.23 -2019-08-16 01:36:30,965 epoch 118 - iter 372/3720 - loss 0.58285341 throughput (samples/sec): 58.39 -2019-08-16 01:40:03,465 epoch 118 - iter 744/3720 - loss 0.58091630 throughput (samples/sec): 57.46 -2019-08-16 01:43:38,280 epoch 118 - iter 1116/3720 - loss 0.57738529 throughput (samples/sec): 57.45 -2019-08-16 01:47:11,523 epoch 118 - iter 1488/3720 - loss 0.57851708 throughput (samples/sec): 57.62 -2019-08-16 01:50:40,526 epoch 118 - iter 1860/3720 - loss 0.58084901 throughput (samples/sec): 58.79 -2019-08-16 01:54:14,222 epoch 118 - iter 2232/3720 - loss 0.58253899 throughput (samples/sec): 57.94 -2019-08-16 01:57:45,140 epoch 118 - iter 2604/3720 - loss 0.58257910 throughput (samples/sec): 58.38 -2019-08-16 02:01:18,856 epoch 118 - iter 2976/3720 - loss 0.58437297 throughput (samples/sec): 57.64 -2019-08-16 02:04:52,171 epoch 118 - iter 3348/3720 - loss 0.58545966 throughput (samples/sec): 57.93 -2019-08-16 02:08:25,413 ---------------------------------------------------------------------------------------------------- -2019-08-16 02:08:25,413 EPOCH 118 done: loss 0.5879 - lr 0.0500 -2019-08-16 02:08:25,413 BAD EPOCHS (no improvement): 0 -2019-08-16 02:08:25,413 ---------------------------------------------------------------------------------------------------- -2019-08-16 02:08:27,368 epoch 119 - iter 0/3720 - loss 0.76026368 throughput (samples/sec): 17369.08 -2019-08-16 02:11:58,279 epoch 119 - iter 372/3720 - loss 0.58422249 throughput (samples/sec): 58.32 -2019-08-16 02:15:30,743 epoch 119 - iter 744/3720 - loss 0.58165900 throughput (samples/sec): 58.03 -2019-08-16 02:19:00,802 epoch 119 - iter 1116/3720 - loss 0.58716601 throughput (samples/sec): 58.69 -2019-08-16 02:22:30,996 epoch 119 - iter 1488/3720 - loss 0.58861893 throughput (samples/sec): 58.47 -2019-08-16 02:26:05,289 epoch 119 - iter 1860/3720 - loss 0.58873770 throughput (samples/sec): 57.76 -2019-08-16 02:29:38,982 epoch 119 - iter 2232/3720 - loss 0.59137538 throughput (samples/sec): 57.35 -2019-08-16 02:33:11,629 epoch 119 - iter 2604/3720 - loss 0.59093972 throughput (samples/sec): 57.96 -2019-08-16 02:36:45,728 epoch 119 - iter 2976/3720 - loss 0.59341173 throughput (samples/sec): 57.68 -2019-08-16 02:40:14,516 epoch 119 - iter 3348/3720 - loss 0.59375588 throughput (samples/sec): 58.81 -2019-08-16 02:43:43,584 ---------------------------------------------------------------------------------------------------- -2019-08-16 02:43:43,584 EPOCH 119 done: loss 0.5949 - lr 0.0500 -2019-08-16 02:43:43,585 BAD EPOCHS (no improvement): 1 -2019-08-16 02:43:43,585 ---------------------------------------------------------------------------------------------------- -2019-08-16 02:43:45,389 epoch 120 - iter 0/3720 - loss 0.50542879 throughput (samples/sec): 21535.45 -2019-08-16 02:47:21,244 epoch 120 - iter 372/3720 - loss 0.58426903 throughput (samples/sec): 57.24 -2019-08-16 02:50:49,865 epoch 120 - iter 744/3720 - loss 0.58405442 throughput (samples/sec): 58.98 -2019-08-16 02:54:21,188 epoch 120 - iter 1116/3720 - loss 0.58656675 throughput (samples/sec): 57.95 -2019-08-16 02:57:49,729 epoch 120 - iter 1488/3720 - loss 0.58659455 throughput (samples/sec): 58.88 -2019-08-16 03:01:18,117 epoch 120 - iter 1860/3720 - loss 0.58977915 throughput (samples/sec): 58.96 -2019-08-16 03:04:52,004 epoch 120 - iter 2232/3720 - loss 0.59045954 throughput (samples/sec): 57.22 -2019-08-16 03:08:23,305 epoch 120 - iter 2604/3720 - loss 0.58900803 throughput (samples/sec): 58.63 -2019-08-16 03:11:55,243 epoch 120 - iter 2976/3720 - loss 0.58595974 throughput (samples/sec): 58.25 -2019-08-16 03:15:25,667 epoch 120 - iter 3348/3720 - loss 0.58457410 throughput (samples/sec): 58.21 -2019-08-16 03:18:58,063 ---------------------------------------------------------------------------------------------------- -2019-08-16 03:18:58,063 EPOCH 120 done: loss 0.5856 - lr 0.0500 -2019-08-16 03:18:58,063 BAD EPOCHS (no improvement): 0 -2019-08-16 03:18:58,063 ---------------------------------------------------------------------------------------------------- -2019-08-16 03:19:00,037 epoch 121 - iter 0/3720 - loss 0.13390207 throughput (samples/sec): 16961.58 -2019-08-16 03:22:34,864 epoch 121 - iter 372/3720 - loss 0.57221153 throughput (samples/sec): 57.45 -2019-08-16 03:26:04,432 epoch 121 - iter 744/3720 - loss 0.58111747 throughput (samples/sec): 58.60 -2019-08-16 03:29:44,485 epoch 121 - iter 1116/3720 - loss 0.58337305 throughput (samples/sec): 55.68 -2019-08-16 03:33:14,052 epoch 121 - iter 1488/3720 - loss 0.57987685 throughput (samples/sec): 58.68 -2019-08-16 03:36:45,640 epoch 121 - iter 1860/3720 - loss 0.58314417 throughput (samples/sec): 57.91 -2019-08-16 03:40:17,977 epoch 121 - iter 2232/3720 - loss 0.58210603 throughput (samples/sec): 57.79 -2019-08-16 03:43:26,982 epoch 121 - iter 2604/3720 - loss 0.58138577 throughput (samples/sec): 65.47 -2019-08-16 03:46:10,130 epoch 121 - iter 2976/3720 - loss 0.58256960 throughput (samples/sec): 75.97 -2019-08-16 03:48:52,647 epoch 121 - iter 3348/3720 - loss 0.58571553 throughput (samples/sec): 75.97 -2019-08-16 03:51:34,961 ---------------------------------------------------------------------------------------------------- -2019-08-16 03:51:34,961 EPOCH 121 done: loss 0.5832 - lr 0.0500 -2019-08-16 03:51:34,961 BAD EPOCHS (no improvement): 0 -2019-08-16 03:51:34,961 ---------------------------------------------------------------------------------------------------- -2019-08-16 03:51:36,772 epoch 122 - iter 0/3720 - loss 0.75961542 throughput (samples/sec): 20532.89 -2019-08-16 03:54:20,393 epoch 122 - iter 372/3720 - loss 0.58586702 throughput (samples/sec): 75.91 -2019-08-16 03:57:03,926 epoch 122 - iter 744/3720 - loss 0.58222005 throughput (samples/sec): 75.46 -2019-08-16 03:59:46,722 epoch 122 - iter 1116/3720 - loss 0.58087299 throughput (samples/sec): 75.34 -2019-08-16 04:02:33,860 epoch 122 - iter 1488/3720 - loss 0.58086785 throughput (samples/sec): 74.31 -2019-08-16 04:05:16,644 epoch 122 - iter 1860/3720 - loss 0.57818127 throughput (samples/sec): 75.39 -2019-08-16 04:07:57,401 epoch 122 - iter 2232/3720 - loss 0.57916577 throughput (samples/sec): 76.03 -2019-08-16 04:10:39,951 epoch 122 - iter 2604/3720 - loss 0.58198257 throughput (samples/sec): 76.04 -2019-08-16 04:13:20,981 epoch 122 - iter 2976/3720 - loss 0.58429760 throughput (samples/sec): 77.36 -2019-08-16 04:16:02,050 epoch 122 - iter 3348/3720 - loss 0.58462099 throughput (samples/sec): 77.55 -2019-08-16 04:18:43,227 ---------------------------------------------------------------------------------------------------- -2019-08-16 04:18:43,227 EPOCH 122 done: loss 0.5855 - lr 0.0500 -2019-08-16 04:18:43,228 BAD EPOCHS (no improvement): 1 -2019-08-16 04:18:43,228 ---------------------------------------------------------------------------------------------------- -2019-08-16 04:18:44,957 epoch 123 - iter 0/3720 - loss 0.30337286 throughput (samples/sec): 23593.15 -2019-08-16 04:21:28,005 epoch 123 - iter 372/3720 - loss 0.58944040 throughput (samples/sec): 76.62 -2019-08-16 04:24:10,249 epoch 123 - iter 744/3720 - loss 0.57746133 throughput (samples/sec): 76.16 -2019-08-16 04:26:52,186 epoch 123 - iter 1116/3720 - loss 0.57335254 throughput (samples/sec): 76.48 -2019-08-16 04:29:35,540 epoch 123 - iter 1488/3720 - loss 0.58093705 throughput (samples/sec): 76.29 -2019-08-16 04:32:16,581 epoch 123 - iter 1860/3720 - loss 0.58347603 throughput (samples/sec): 77.26 -2019-08-16 04:34:55,882 epoch 123 - iter 2232/3720 - loss 0.58295878 throughput (samples/sec): 77.86 -2019-08-16 04:37:39,455 epoch 123 - iter 2604/3720 - loss 0.58263375 throughput (samples/sec): 75.56 -2019-08-16 04:40:23,396 epoch 123 - iter 2976/3720 - loss 0.58608931 throughput (samples/sec): 75.05 -2019-08-16 04:43:06,630 epoch 123 - iter 3348/3720 - loss 0.58725362 throughput (samples/sec): 75.81 -2019-08-16 04:45:49,508 ---------------------------------------------------------------------------------------------------- -2019-08-16 04:45:49,508 EPOCH 123 done: loss 0.5886 - lr 0.0500 -2019-08-16 04:45:49,508 BAD EPOCHS (no improvement): 2 -2019-08-16 04:45:49,509 ---------------------------------------------------------------------------------------------------- -2019-08-16 04:45:51,355 epoch 124 - iter 0/3720 - loss 0.68787766 throughput (samples/sec): 19935.91 -2019-08-16 04:48:34,724 epoch 124 - iter 372/3720 - loss 0.58605632 throughput (samples/sec): 75.42 -2019-08-16 04:51:19,493 epoch 124 - iter 744/3720 - loss 0.58418747 throughput (samples/sec): 75.32 -2019-08-16 04:54:02,302 epoch 124 - iter 1116/3720 - loss 0.58104620 throughput (samples/sec): 75.52 -2019-08-16 04:56:46,326 epoch 124 - iter 1488/3720 - loss 0.58163422 throughput (samples/sec): 75.41 -2019-08-16 04:59:30,142 epoch 124 - iter 1860/3720 - loss 0.58348783 throughput (samples/sec): 75.75 -2019-08-16 05:02:13,401 epoch 124 - iter 2232/3720 - loss 0.58435950 throughput (samples/sec): 75.74 -2019-08-16 05:04:54,429 epoch 124 - iter 2604/3720 - loss 0.58493045 throughput (samples/sec): 76.93 -2019-08-16 05:07:38,608 epoch 124 - iter 2976/3720 - loss 0.58430113 throughput (samples/sec): 75.89 -2019-08-16 05:10:22,187 epoch 124 - iter 3348/3720 - loss 0.58321136 throughput (samples/sec): 75.88 -2019-08-16 05:13:01,734 ---------------------------------------------------------------------------------------------------- -2019-08-16 05:13:01,734 EPOCH 124 done: loss 0.5843 - lr 0.0500 -2019-08-16 05:13:01,735 BAD EPOCHS (no improvement): 3 -2019-08-16 05:13:01,735 ---------------------------------------------------------------------------------------------------- -2019-08-16 05:13:03,424 epoch 125 - iter 0/3720 - loss 0.36915255 throughput (samples/sec): 25531.17 -2019-08-16 05:15:48,645 epoch 125 - iter 372/3720 - loss 0.56903807 throughput (samples/sec): 75.22 -2019-08-16 05:18:29,369 epoch 125 - iter 744/3720 - loss 0.57226500 throughput (samples/sec): 77.13 -2019-08-16 05:21:14,492 epoch 125 - iter 1116/3720 - loss 0.57583376 throughput (samples/sec): 74.90 -2019-08-16 05:23:56,546 epoch 125 - iter 1488/3720 - loss 0.57914059 throughput (samples/sec): 76.38 -2019-08-16 05:26:38,249 epoch 125 - iter 1860/3720 - loss 0.58039977 throughput (samples/sec): 76.17 -2019-08-16 05:29:21,254 epoch 125 - iter 2232/3720 - loss 0.57547496 throughput (samples/sec): 75.53 -2019-08-16 05:32:04,380 epoch 125 - iter 2604/3720 - loss 0.58005408 throughput (samples/sec): 75.94 -2019-08-16 05:34:46,709 epoch 125 - iter 2976/3720 - loss 0.58248779 throughput (samples/sec): 76.25 -2019-08-16 05:37:30,260 epoch 125 - iter 3348/3720 - loss 0.58349379 throughput (samples/sec): 75.44 -2019-08-16 05:40:16,512 ---------------------------------------------------------------------------------------------------- -2019-08-16 05:40:16,513 EPOCH 125 done: loss 0.5835 - lr 0.0500 -2019-08-16 05:40:16,513 BAD EPOCHS (no improvement): 4 -2019-08-16 05:40:16,513 ---------------------------------------------------------------------------------------------------- -2019-08-16 05:40:18,328 epoch 126 - iter 0/3720 - loss 0.42108583 throughput (samples/sec): 20464.85 -2019-08-16 05:43:01,393 epoch 126 - iter 372/3720 - loss 0.57105613 throughput (samples/sec): 76.44 -2019-08-16 05:45:44,995 epoch 126 - iter 744/3720 - loss 0.56416189 throughput (samples/sec): 75.51 -2019-08-16 05:48:27,352 epoch 126 - iter 1116/3720 - loss 0.56836867 throughput (samples/sec): 75.64 -2019-08-16 05:51:08,225 epoch 126 - iter 1488/3720 - loss 0.56206829 throughput (samples/sec): 77.06 -2019-08-16 05:53:49,191 epoch 126 - iter 1860/3720 - loss 0.56722397 throughput (samples/sec): 77.35 -2019-08-16 05:56:32,965 epoch 126 - iter 2232/3720 - loss 0.56590246 throughput (samples/sec): 74.88 -2019-08-16 05:59:18,900 epoch 126 - iter 2604/3720 - loss 0.56381979 throughput (samples/sec): 74.59 -2019-08-16 06:02:03,753 epoch 126 - iter 2976/3720 - loss 0.56611600 throughput (samples/sec): 75.44 -2019-08-16 06:04:47,811 epoch 126 - iter 3348/3720 - loss 0.56663485 throughput (samples/sec): 75.50 -2019-08-16 06:07:30,302 ---------------------------------------------------------------------------------------------------- -2019-08-16 06:07:30,302 EPOCH 126 done: loss 0.5669 - lr 0.0250 -2019-08-16 06:07:30,302 BAD EPOCHS (no improvement): 0 -2019-08-16 06:07:30,302 ---------------------------------------------------------------------------------------------------- -2019-08-16 06:07:32,074 epoch 127 - iter 0/3720 - loss 0.52399063 throughput (samples/sec): 21575.18 -2019-08-16 06:10:17,197 epoch 127 - iter 372/3720 - loss 0.57202326 throughput (samples/sec): 75.65 -2019-08-16 06:13:02,624 epoch 127 - iter 744/3720 - loss 0.56554477 throughput (samples/sec): 75.27 -2019-08-16 06:15:47,395 epoch 127 - iter 1116/3720 - loss 0.56657639 throughput (samples/sec): 75.07 -2019-08-16 06:18:29,762 epoch 127 - iter 1488/3720 - loss 0.56380863 throughput (samples/sec): 76.30 -2019-08-16 06:21:14,277 epoch 127 - iter 1860/3720 - loss 0.55965602 throughput (samples/sec): 75.22 -2019-08-16 06:23:55,999 epoch 127 - iter 2232/3720 - loss 0.55868144 throughput (samples/sec): 76.59 -2019-08-16 06:26:38,262 epoch 127 - iter 2604/3720 - loss 0.55808247 throughput (samples/sec): 76.23 -2019-08-16 06:29:20,958 epoch 127 - iter 2976/3720 - loss 0.55830459 throughput (samples/sec): 75.87 -2019-08-16 06:32:05,300 epoch 127 - iter 3348/3720 - loss 0.56010445 throughput (samples/sec): 75.87 -2019-08-16 06:34:47,788 ---------------------------------------------------------------------------------------------------- -2019-08-16 06:34:47,789 EPOCH 127 done: loss 0.5618 - lr 0.0250 -2019-08-16 06:34:47,789 BAD EPOCHS (no improvement): 0 -2019-08-16 06:34:47,789 ---------------------------------------------------------------------------------------------------- -2019-08-16 06:34:49,636 epoch 128 - iter 0/3720 - loss 0.66985488 throughput (samples/sec): 19557.90 -2019-08-16 06:37:34,840 epoch 128 - iter 372/3720 - loss 0.53489549 throughput (samples/sec): 75.35 -2019-08-16 06:40:18,060 epoch 128 - iter 744/3720 - loss 0.54392897 throughput (samples/sec): 75.94 -2019-08-16 06:43:00,259 epoch 128 - iter 1116/3720 - loss 0.54967535 throughput (samples/sec): 76.35 -2019-08-16 06:45:42,281 epoch 128 - iter 1488/3720 - loss 0.55922097 throughput (samples/sec): 76.43 -2019-08-16 06:48:24,989 epoch 128 - iter 1860/3720 - loss 0.55831286 throughput (samples/sec): 76.16 -2019-08-16 06:51:08,786 epoch 128 - iter 2232/3720 - loss 0.55818285 throughput (samples/sec): 75.35 -2019-08-16 06:53:53,194 epoch 128 - iter 2604/3720 - loss 0.55777916 throughput (samples/sec): 75.14 -2019-08-16 06:56:33,593 epoch 128 - iter 2976/3720 - loss 0.55920524 throughput (samples/sec): 77.02 -2019-08-16 06:59:17,302 epoch 128 - iter 3348/3720 - loss 0.56134678 throughput (samples/sec): 76.25 -2019-08-16 07:02:01,983 ---------------------------------------------------------------------------------------------------- -2019-08-16 07:02:01,984 EPOCH 128 done: loss 0.5626 - lr 0.0250 -2019-08-16 07:02:01,984 BAD EPOCHS (no improvement): 1 -2019-08-16 07:02:01,984 ---------------------------------------------------------------------------------------------------- -2019-08-16 07:02:03,952 epoch 129 - iter 0/3720 - loss 0.84288216 throughput (samples/sec): 15899.20 -2019-08-16 07:04:50,425 epoch 129 - iter 372/3720 - loss 0.55538852 throughput (samples/sec): 74.67 -2019-08-16 07:07:33,614 epoch 129 - iter 744/3720 - loss 0.56036498 throughput (samples/sec): 75.90 -2019-08-16 07:10:15,400 epoch 129 - iter 1116/3720 - loss 0.55306377 throughput (samples/sec): 76.62 -2019-08-16 07:12:58,291 epoch 129 - iter 1488/3720 - loss 0.55388745 throughput (samples/sec): 76.23 -2019-08-16 07:15:40,602 epoch 129 - iter 1860/3720 - loss 0.55736411 throughput (samples/sec): 76.67 -2019-08-16 07:18:23,101 epoch 129 - iter 2232/3720 - loss 0.55531710 throughput (samples/sec): 76.29 -2019-08-16 07:21:05,987 epoch 129 - iter 2604/3720 - loss 0.55306163 throughput (samples/sec): 76.02 -2019-08-16 07:23:49,315 epoch 129 - iter 2976/3720 - loss 0.55303047 throughput (samples/sec): 76.18 -2019-08-16 07:26:32,927 epoch 129 - iter 3348/3720 - loss 0.55545679 throughput (samples/sec): 75.58 -2019-08-16 07:29:14,303 ---------------------------------------------------------------------------------------------------- -2019-08-16 07:29:14,303 EPOCH 129 done: loss 0.5548 - lr 0.0250 -2019-08-16 07:29:14,303 BAD EPOCHS (no improvement): 0 -2019-08-16 07:29:14,303 ---------------------------------------------------------------------------------------------------- -2019-08-16 07:29:18,148 epoch 130 - iter 0/3720 - loss 0.62877369 throughput (samples/sec): 25832.58 -2019-08-16 07:32:01,111 epoch 130 - iter 372/3720 - loss 0.55213001 throughput (samples/sec): 75.83 -2019-08-16 07:34:42,670 epoch 130 - iter 744/3720 - loss 0.55016722 throughput (samples/sec): 77.23 -2019-08-16 07:37:26,045 epoch 130 - iter 1116/3720 - loss 0.55273786 throughput (samples/sec): 76.56 -2019-08-16 07:40:08,858 epoch 130 - iter 1488/3720 - loss 0.55365378 throughput (samples/sec): 76.63 -2019-08-16 07:42:52,923 epoch 130 - iter 1860/3720 - loss 0.55554798 throughput (samples/sec): 76.09 -2019-08-16 07:45:37,155 epoch 130 - iter 2232/3720 - loss 0.55455339 throughput (samples/sec): 75.76 -2019-08-16 07:48:20,073 epoch 130 - iter 2604/3720 - loss 0.55706412 throughput (samples/sec): 76.66 -2019-08-16 07:51:01,352 epoch 130 - iter 2976/3720 - loss 0.55752861 throughput (samples/sec): 77.18 -2019-08-16 07:53:44,949 epoch 130 - iter 3348/3720 - loss 0.55711935 throughput (samples/sec): 76.12 -2019-08-16 07:56:28,676 ---------------------------------------------------------------------------------------------------- -2019-08-16 07:56:28,676 EPOCH 130 done: loss 0.5562 - lr 0.0250 -2019-08-16 07:56:28,676 BAD EPOCHS (no improvement): 1 -2019-08-16 07:56:28,677 ---------------------------------------------------------------------------------------------------- -2019-08-16 07:56:30,526 epoch 131 - iter 0/3720 - loss 0.46423936 throughput (samples/sec): 21791.00 -2019-08-16 07:59:14,813 epoch 131 - iter 372/3720 - loss 0.56109171 throughput (samples/sec): 75.42 -2019-08-16 08:01:57,518 epoch 131 - iter 744/3720 - loss 0.54992709 throughput (samples/sec): 76.32 -2019-08-16 08:04:41,656 epoch 131 - iter 1116/3720 - loss 0.54973317 throughput (samples/sec): 75.56 -2019-08-16 08:07:24,455 epoch 131 - iter 1488/3720 - loss 0.55605991 throughput (samples/sec): 76.64 -2019-08-16 08:10:07,767 epoch 131 - iter 1860/3720 - loss 0.55302558 throughput (samples/sec): 75.36 -2019-08-16 08:12:51,395 epoch 131 - iter 2232/3720 - loss 0.55486521 throughput (samples/sec): 75.69 -2019-08-16 08:15:37,480 epoch 131 - iter 2604/3720 - loss 0.55119462 throughput (samples/sec): 74.58 -2019-08-16 08:18:21,867 epoch 131 - iter 2976/3720 - loss 0.55009820 throughput (samples/sec): 74.61 -2019-08-16 08:21:06,318 epoch 131 - iter 3348/3720 - loss 0.55068762 throughput (samples/sec): 74.59 -2019-08-16 08:23:51,778 ---------------------------------------------------------------------------------------------------- -2019-08-16 08:23:51,778 EPOCH 131 done: loss 0.5522 - lr 0.0250 -2019-08-16 08:23:51,778 BAD EPOCHS (no improvement): 0 -2019-08-16 08:23:51,778 ---------------------------------------------------------------------------------------------------- -2019-08-16 08:23:53,541 epoch 132 - iter 0/3720 - loss 0.48475194 throughput (samples/sec): 22973.51 -2019-08-16 08:26:38,093 epoch 132 - iter 372/3720 - loss 0.55327997 throughput (samples/sec): 74.97 -2019-08-16 08:29:21,744 epoch 132 - iter 744/3720 - loss 0.55767676 throughput (samples/sec): 75.94 -2019-08-16 08:32:05,264 epoch 132 - iter 1116/3720 - loss 0.54915754 throughput (samples/sec): 75.86 -2019-08-16 08:34:49,244 epoch 132 - iter 1488/3720 - loss 0.55122313 throughput (samples/sec): 75.05 -2019-08-16 08:37:33,712 epoch 132 - iter 1860/3720 - loss 0.54976697 throughput (samples/sec): 75.84 -2019-08-16 08:40:17,126 epoch 132 - iter 2232/3720 - loss 0.54959625 throughput (samples/sec): 76.03 -2019-08-16 08:42:59,506 epoch 132 - iter 2604/3720 - loss 0.55028682 throughput (samples/sec): 76.81 -2019-08-16 08:45:44,865 epoch 132 - iter 2976/3720 - loss 0.54871720 throughput (samples/sec): 74.84 -2019-08-16 08:48:28,845 epoch 132 - iter 3348/3720 - loss 0.54877515 throughput (samples/sec): 76.02 -2019-08-16 08:51:11,373 ---------------------------------------------------------------------------------------------------- -2019-08-16 08:51:11,374 EPOCH 132 done: loss 0.5482 - lr 0.0250 -2019-08-16 08:51:11,374 BAD EPOCHS (no improvement): 0 -2019-08-16 08:51:11,374 ---------------------------------------------------------------------------------------------------- -2019-08-16 08:51:13,035 epoch 133 - iter 0/3720 - loss 0.23740196 throughput (samples/sec): 29620.59 -2019-08-16 08:53:59,113 epoch 133 - iter 372/3720 - loss 0.53323255 throughput (samples/sec): 74.73 -2019-08-16 08:56:42,078 epoch 133 - iter 744/3720 - loss 0.54171826 throughput (samples/sec): 76.37 -2019-08-16 08:59:25,126 epoch 133 - iter 1116/3720 - loss 0.54648724 throughput (samples/sec): 76.17 -2019-08-16 09:02:08,593 epoch 133 - iter 1488/3720 - loss 0.54504599 throughput (samples/sec): 76.14 -2019-08-16 09:04:50,981 epoch 133 - iter 1860/3720 - loss 0.54764297 throughput (samples/sec): 75.64 -2019-08-16 09:07:34,000 epoch 133 - iter 2232/3720 - loss 0.54668967 throughput (samples/sec): 76.15 -2019-08-16 09:10:18,884 epoch 133 - iter 2604/3720 - loss 0.54623024 throughput (samples/sec): 74.60 -2019-08-16 09:13:01,086 epoch 133 - iter 2976/3720 - loss 0.54674772 throughput (samples/sec): 76.86 -2019-08-16 09:15:42,088 epoch 133 - iter 3348/3720 - loss 0.54447125 throughput (samples/sec): 76.40 -2019-08-16 09:18:23,968 ---------------------------------------------------------------------------------------------------- -2019-08-16 09:18:23,968 EPOCH 133 done: loss 0.5459 - lr 0.0250 -2019-08-16 09:18:23,968 BAD EPOCHS (no improvement): 0 -2019-08-16 09:18:23,968 ---------------------------------------------------------------------------------------------------- -2019-08-16 09:18:25,645 epoch 134 - iter 0/3720 - loss 0.63596296 throughput (samples/sec): 25826.88 -2019-08-16 09:21:11,248 epoch 134 - iter 372/3720 - loss 0.53748547 throughput (samples/sec): 75.12 -2019-08-16 09:23:54,450 epoch 134 - iter 744/3720 - loss 0.53590332 throughput (samples/sec): 76.03 -2019-08-16 09:26:37,595 epoch 134 - iter 1116/3720 - loss 0.54485081 throughput (samples/sec): 75.44 -2019-08-16 09:29:22,714 epoch 134 - iter 1488/3720 - loss 0.53994281 throughput (samples/sec): 75.02 -2019-08-16 09:32:05,721 epoch 134 - iter 1860/3720 - loss 0.54562568 throughput (samples/sec): 76.05 -2019-08-16 09:34:49,480 epoch 134 - iter 2232/3720 - loss 0.54627445 throughput (samples/sec): 75.67 -2019-08-16 09:37:34,286 epoch 134 - iter 2604/3720 - loss 0.54387174 throughput (samples/sec): 75.93 -2019-08-16 09:40:19,476 epoch 134 - iter 2976/3720 - loss 0.54453711 throughput (samples/sec): 75.26 -2019-08-16 09:43:04,655 epoch 134 - iter 3348/3720 - loss 0.54422456 throughput (samples/sec): 74.73 -2019-08-16 09:45:48,314 ---------------------------------------------------------------------------------------------------- -2019-08-16 09:45:48,314 EPOCH 134 done: loss 0.5442 - lr 0.0250 -2019-08-16 09:45:48,315 BAD EPOCHS (no improvement): 0 -2019-08-16 09:45:48,315 ---------------------------------------------------------------------------------------------------- -2019-08-16 09:45:49,962 epoch 135 - iter 0/3720 - loss 0.36704493 throughput (samples/sec): 30036.54 -2019-08-16 09:48:32,016 epoch 135 - iter 372/3720 - loss 0.53183833 throughput (samples/sec): 76.48 -2019-08-16 09:51:15,915 epoch 135 - iter 744/3720 - loss 0.52481571 throughput (samples/sec): 75.79 -2019-08-16 09:54:01,571 epoch 135 - iter 1116/3720 - loss 0.53838552 throughput (samples/sec): 75.35 -2019-08-16 09:56:43,693 epoch 135 - iter 1488/3720 - loss 0.54381951 throughput (samples/sec): 76.19 -2019-08-16 09:59:24,990 epoch 135 - iter 1860/3720 - loss 0.54270952 throughput (samples/sec): 76.56 -2019-08-16 10:02:07,489 epoch 135 - iter 2232/3720 - loss 0.54350146 throughput (samples/sec): 76.40 -2019-08-16 10:04:51,469 epoch 135 - iter 2604/3720 - loss 0.54611310 throughput (samples/sec): 75.50 -2019-08-16 10:07:34,468 epoch 135 - iter 2976/3720 - loss 0.54834997 throughput (samples/sec): 75.81 -2019-08-16 10:10:17,125 epoch 135 - iter 3348/3720 - loss 0.54604333 throughput (samples/sec): 76.62 -2019-08-16 10:13:00,315 ---------------------------------------------------------------------------------------------------- -2019-08-16 10:13:00,316 EPOCH 135 done: loss 0.5474 - lr 0.0250 -2019-08-16 10:13:00,316 BAD EPOCHS (no improvement): 1 -2019-08-16 10:13:00,316 ---------------------------------------------------------------------------------------------------- -2019-08-16 10:13:02,184 epoch 136 - iter 0/3720 - loss 0.51568985 throughput (samples/sec): 18872.89 -2019-08-16 10:15:48,450 epoch 136 - iter 372/3720 - loss 0.55596786 throughput (samples/sec): 75.10 -2019-08-16 10:18:31,660 epoch 136 - iter 744/3720 - loss 0.54414564 throughput (samples/sec): 76.19 -2019-08-16 10:21:16,235 epoch 136 - iter 1116/3720 - loss 0.54312637 throughput (samples/sec): 75.34 -2019-08-16 10:23:59,885 epoch 136 - iter 1488/3720 - loss 0.54612150 throughput (samples/sec): 75.72 -2019-08-16 10:26:43,180 epoch 136 - iter 1860/3720 - loss 0.54737286 throughput (samples/sec): 75.81 -2019-08-16 10:29:26,807 epoch 136 - iter 2232/3720 - loss 0.54682478 throughput (samples/sec): 76.30 -2019-08-16 10:32:08,030 epoch 136 - iter 2604/3720 - loss 0.54949765 throughput (samples/sec): 76.64 -2019-08-16 10:34:49,575 epoch 136 - iter 2976/3720 - loss 0.54944511 throughput (samples/sec): 75.92 -2019-08-16 10:37:33,817 epoch 136 - iter 3348/3720 - loss 0.54638724 throughput (samples/sec): 75.13 -2019-08-16 10:40:15,243 ---------------------------------------------------------------------------------------------------- -2019-08-16 10:40:15,244 EPOCH 136 done: loss 0.5470 - lr 0.0250 -2019-08-16 10:40:15,244 BAD EPOCHS (no improvement): 2 -2019-08-16 10:40:15,244 ---------------------------------------------------------------------------------------------------- -2019-08-16 10:40:17,043 epoch 137 - iter 0/3720 - loss 0.45256090 throughput (samples/sec): 21805.42 -2019-08-16 10:42:59,284 epoch 137 - iter 372/3720 - loss 0.53340439 throughput (samples/sec): 77.38 -2019-08-16 10:45:40,443 epoch 137 - iter 744/3720 - loss 0.53153445 throughput (samples/sec): 77.79 -2019-08-16 10:48:26,395 epoch 137 - iter 1116/3720 - loss 0.53840103 throughput (samples/sec): 75.18 -2019-08-16 10:51:11,305 epoch 137 - iter 1488/3720 - loss 0.53530071 throughput (samples/sec): 75.17 -2019-08-16 10:53:57,638 epoch 137 - iter 1860/3720 - loss 0.53379940 throughput (samples/sec): 74.99 -2019-08-16 10:56:41,987 epoch 137 - iter 2232/3720 - loss 0.53386588 throughput (samples/sec): 75.89 -2019-08-16 10:59:26,214 epoch 137 - iter 2604/3720 - loss 0.53706865 throughput (samples/sec): 75.40 -2019-08-16 11:02:17,100 epoch 137 - iter 2976/3720 - loss 0.53791899 throughput (samples/sec): 72.28 -2019-08-16 11:06:12,526 epoch 137 - iter 3348/3720 - loss 0.54047461 throughput (samples/sec): 51.98 -2019-08-16 11:09:52,037 ---------------------------------------------------------------------------------------------------- -2019-08-16 11:09:52,037 EPOCH 137 done: loss 0.5415 - lr 0.0250 -2019-08-16 11:09:52,037 BAD EPOCHS (no improvement): 0 -2019-08-16 11:09:52,037 ---------------------------------------------------------------------------------------------------- -2019-08-16 11:09:54,083 epoch 138 - iter 0/3720 - loss 1.19701672 throughput (samples/sec): 17924.70 -2019-08-16 11:14:10,554 epoch 138 - iter 372/3720 - loss 0.53208181 throughput (samples/sec): 47.68 -2019-08-16 11:18:06,179 epoch 138 - iter 744/3720 - loss 0.52045314 throughput (samples/sec): 52.18 -2019-08-16 11:22:21,515 epoch 138 - iter 1116/3720 - loss 0.53039163 throughput (samples/sec): 48.34 -2019-08-16 11:26:03,357 epoch 138 - iter 1488/3720 - loss 0.52938187 throughput (samples/sec): 55.22 -2019-08-16 11:30:18,229 epoch 138 - iter 1860/3720 - loss 0.53684335 throughput (samples/sec): 47.99 -2019-08-16 11:34:07,057 epoch 138 - iter 2232/3720 - loss 0.53465117 throughput (samples/sec): 53.79 -2019-08-16 11:38:17,774 epoch 138 - iter 2604/3720 - loss 0.53499290 throughput (samples/sec): 49.13 -2019-08-16 11:42:00,098 epoch 138 - iter 2976/3720 - loss 0.53972484 throughput (samples/sec): 55.52 -2019-08-16 11:46:12,661 epoch 138 - iter 3348/3720 - loss 0.54070237 throughput (samples/sec): 48.84 -2019-08-16 11:49:55,267 ---------------------------------------------------------------------------------------------------- -2019-08-16 11:49:55,267 EPOCH 138 done: loss 0.5436 - lr 0.0250 -2019-08-16 11:49:55,267 BAD EPOCHS (no improvement): 1 -2019-08-16 11:49:55,267 ---------------------------------------------------------------------------------------------------- -2019-08-16 11:49:57,533 epoch 139 - iter 0/3720 - loss 0.59516120 throughput (samples/sec): 15771.08 -2019-08-16 11:54:08,575 epoch 139 - iter 372/3720 - loss 0.54471094 throughput (samples/sec): 49.22 -2019-08-16 11:57:47,379 epoch 139 - iter 744/3720 - loss 0.54999249 throughput (samples/sec): 56.09 -2019-08-16 12:01:56,698 epoch 139 - iter 1116/3720 - loss 0.55402246 throughput (samples/sec): 49.28 -2019-08-16 12:05:39,323 epoch 139 - iter 1488/3720 - loss 0.55168439 throughput (samples/sec): 55.50 -2019-08-16 12:09:53,005 epoch 139 - iter 1860/3720 - loss 0.54996040 throughput (samples/sec): 48.34 -2019-08-16 12:13:37,668 epoch 139 - iter 2232/3720 - loss 0.54782652 throughput (samples/sec): 54.74 -2019-08-16 12:17:48,439 epoch 139 - iter 2604/3720 - loss 0.54441214 throughput (samples/sec): 49.10 -2019-08-16 12:21:36,083 epoch 139 - iter 2976/3720 - loss 0.54511269 throughput (samples/sec): 54.14 -2019-08-16 12:25:51,236 epoch 139 - iter 3348/3720 - loss 0.54443419 throughput (samples/sec): 47.92 -2019-08-16 12:29:34,368 ---------------------------------------------------------------------------------------------------- -2019-08-16 12:29:34,368 EPOCH 139 done: loss 0.5451 - lr 0.0250 -2019-08-16 12:29:34,368 BAD EPOCHS (no improvement): 2 -2019-08-16 12:29:34,369 ---------------------------------------------------------------------------------------------------- -2019-08-16 12:29:36,641 epoch 140 - iter 0/3720 - loss 0.49179482 throughput (samples/sec): 13183.81 -2019-08-16 12:33:50,410 epoch 140 - iter 372/3720 - loss 0.53342361 throughput (samples/sec): 48.58 -2019-08-16 12:37:28,837 epoch 140 - iter 744/3720 - loss 0.53187150 throughput (samples/sec): 56.58 -2019-08-16 12:41:41,541 epoch 140 - iter 1116/3720 - loss 0.53726347 throughput (samples/sec): 48.71 -2019-08-16 12:45:23,787 epoch 140 - iter 1488/3720 - loss 0.53682820 throughput (samples/sec): 55.52 -2019-08-16 12:49:35,771 epoch 140 - iter 1860/3720 - loss 0.53587026 throughput (samples/sec): 48.86 -2019-08-16 12:53:15,712 epoch 140 - iter 2232/3720 - loss 0.53511571 throughput (samples/sec): 56.28 -2019-08-16 12:57:28,486 epoch 140 - iter 2604/3720 - loss 0.53257680 throughput (samples/sec): 48.62 -2019-08-16 13:01:09,750 epoch 140 - iter 2976/3720 - loss 0.53344971 throughput (samples/sec): 55.62 -2019-08-16 13:05:19,098 epoch 140 - iter 3348/3720 - loss 0.53619032 throughput (samples/sec): 49.54 -2019-08-16 13:08:59,355 ---------------------------------------------------------------------------------------------------- -2019-08-16 13:08:59,356 EPOCH 140 done: loss 0.5363 - lr 0.0250 -2019-08-16 13:08:59,356 BAD EPOCHS (no improvement): 0 -2019-08-16 13:08:59,356 ---------------------------------------------------------------------------------------------------- -2019-08-16 13:09:01,279 epoch 141 - iter 0/3720 - loss 0.33176517 throughput (samples/sec): 19594.84 -2019-08-16 13:13:10,773 epoch 141 - iter 372/3720 - loss 0.52940859 throughput (samples/sec): 49.16 -2019-08-16 13:16:55,642 epoch 141 - iter 744/3720 - loss 0.53665618 throughput (samples/sec): 54.47 -2019-08-16 13:21:09,703 epoch 141 - iter 1116/3720 - loss 0.54078623 throughput (samples/sec): 48.20 -2019-08-16 13:24:50,477 epoch 141 - iter 1488/3720 - loss 0.54051847 throughput (samples/sec): 55.81 -2019-08-16 13:29:04,832 epoch 141 - iter 1860/3720 - loss 0.53706665 throughput (samples/sec): 48.39 -2019-08-16 13:32:46,708 epoch 141 - iter 2232/3720 - loss 0.54000080 throughput (samples/sec): 55.52 -2019-08-16 13:36:57,265 epoch 141 - iter 2604/3720 - loss 0.53741352 throughput (samples/sec): 49.29 -2019-08-16 13:40:36,232 epoch 141 - iter 2976/3720 - loss 0.53683066 throughput (samples/sec): 56.08 -2019-08-16 13:44:49,026 epoch 141 - iter 3348/3720 - loss 0.53870674 throughput (samples/sec): 48.39 -2019-08-16 13:48:27,638 ---------------------------------------------------------------------------------------------------- -2019-08-16 13:48:27,638 EPOCH 141 done: loss 0.5380 - lr 0.0250 -2019-08-16 13:48:27,638 BAD EPOCHS (no improvement): 1 -2019-08-16 13:48:27,638 ---------------------------------------------------------------------------------------------------- -2019-08-16 13:48:29,624 epoch 142 - iter 0/3720 - loss 0.44517446 throughput (samples/sec): 20414.95 -2019-08-16 13:52:48,297 epoch 142 - iter 372/3720 - loss 0.51014734 throughput (samples/sec): 47.67 -2019-08-16 13:56:27,857 epoch 142 - iter 744/3720 - loss 0.51879235 throughput (samples/sec): 56.28 -2019-08-16 14:00:42,008 epoch 142 - iter 1116/3720 - loss 0.52066611 throughput (samples/sec): 48.61 -2019-08-16 14:04:18,964 epoch 142 - iter 1488/3720 - loss 0.52941071 throughput (samples/sec): 56.80 -2019-08-16 14:08:32,437 epoch 142 - iter 1860/3720 - loss 0.53364108 throughput (samples/sec): 48.13 -2019-08-16 14:12:27,452 epoch 142 - iter 2232/3720 - loss 0.53802941 throughput (samples/sec): 52.54 -2019-08-16 14:16:36,689 epoch 142 - iter 2604/3720 - loss 0.53767510 throughput (samples/sec): 49.45 -2019-08-16 14:20:21,883 epoch 142 - iter 2976/3720 - loss 0.53739336 throughput (samples/sec): 54.81 -2019-08-16 14:24:33,209 epoch 142 - iter 3348/3720 - loss 0.53892493 throughput (samples/sec): 48.68 -2019-08-16 14:28:18,592 ---------------------------------------------------------------------------------------------------- -2019-08-16 14:28:18,593 EPOCH 142 done: loss 0.5381 - lr 0.0250 -2019-08-16 14:28:18,593 BAD EPOCHS (no improvement): 2 -2019-08-16 14:28:18,593 ---------------------------------------------------------------------------------------------------- -2019-08-16 14:28:20,758 epoch 143 - iter 0/3720 - loss 0.59441328 throughput (samples/sec): 15227.40 -2019-08-16 14:32:32,347 epoch 143 - iter 372/3720 - loss 0.54353970 throughput (samples/sec): 48.71 -2019-08-16 14:36:15,999 epoch 143 - iter 744/3720 - loss 0.53506296 throughput (samples/sec): 54.76 -2019-08-16 14:40:33,955 epoch 143 - iter 1116/3720 - loss 0.53436093 throughput (samples/sec): 47.65 -2019-08-16 14:44:09,109 epoch 143 - iter 1488/3720 - loss 0.54070474 throughput (samples/sec): 56.92 -2019-08-16 14:48:22,268 epoch 143 - iter 1860/3720 - loss 0.53960513 throughput (samples/sec): 48.69 -2019-08-16 14:52:06,421 epoch 143 - iter 2232/3720 - loss 0.53906203 throughput (samples/sec): 54.90 -2019-08-16 14:56:24,692 epoch 143 - iter 2604/3720 - loss 0.53996997 throughput (samples/sec): 47.79 -2019-08-16 15:00:06,492 epoch 143 - iter 2976/3720 - loss 0.53947131 throughput (samples/sec): 55.30 -2019-08-16 15:04:15,003 epoch 143 - iter 3348/3720 - loss 0.53918497 throughput (samples/sec): 49.83 -2019-08-16 15:07:56,787 ---------------------------------------------------------------------------------------------------- -2019-08-16 15:07:56,787 EPOCH 143 done: loss 0.5401 - lr 0.0250 -2019-08-16 15:07:56,787 BAD EPOCHS (no improvement): 3 -2019-08-16 15:07:56,788 ---------------------------------------------------------------------------------------------------- -2019-08-16 15:07:58,807 epoch 144 - iter 0/3720 - loss 0.65523267 throughput (samples/sec): 18691.42 -2019-08-16 15:12:12,991 epoch 144 - iter 372/3720 - loss 0.51497374 throughput (samples/sec): 48.28 -2019-08-16 15:15:55,774 epoch 144 - iter 744/3720 - loss 0.51904920 throughput (samples/sec): 55.25 -2019-08-16 15:20:10,156 epoch 144 - iter 1116/3720 - loss 0.52119448 throughput (samples/sec): 48.31 -2019-08-16 15:23:49,915 epoch 144 - iter 1488/3720 - loss 0.52178085 throughput (samples/sec): 55.70 -2019-08-16 15:28:02,741 epoch 144 - iter 1860/3720 - loss 0.52237854 throughput (samples/sec): 48.73 -2019-08-16 15:31:45,497 epoch 144 - iter 2232/3720 - loss 0.52511827 throughput (samples/sec): 55.60 -2019-08-16 15:35:58,064 epoch 144 - iter 2604/3720 - loss 0.52610562 throughput (samples/sec): 48.76 -2019-08-16 15:39:52,052 epoch 144 - iter 2976/3720 - loss 0.52720372 throughput (samples/sec): 52.49 -2019-08-16 15:44:04,484 epoch 144 - iter 3348/3720 - loss 0.52786657 throughput (samples/sec): 48.31 -2019-08-16 15:47:42,509 ---------------------------------------------------------------------------------------------------- -2019-08-16 15:47:42,509 EPOCH 144 done: loss 0.5301 - lr 0.0250 -2019-08-16 15:47:42,510 BAD EPOCHS (no improvement): 0 -2019-08-16 15:47:42,510 ---------------------------------------------------------------------------------------------------- -2019-08-16 15:47:44,471 epoch 145 - iter 0/3720 - loss 0.53303099 throughput (samples/sec): 18852.89 -2019-08-16 15:51:51,269 epoch 145 - iter 372/3720 - loss 0.54319095 throughput (samples/sec): 49.69 -2019-08-16 15:55:34,722 epoch 145 - iter 744/3720 - loss 0.55111078 throughput (samples/sec): 55.59 -2019-08-16 15:59:49,959 epoch 145 - iter 1116/3720 - loss 0.54632581 throughput (samples/sec): 48.18 -2019-08-16 16:03:52,687 epoch 145 - iter 1488/3720 - loss 0.54145772 throughput (samples/sec): 50.37 -2019-08-16 16:08:03,469 epoch 145 - iter 1860/3720 - loss 0.53752856 throughput (samples/sec): 48.91 -2019-08-16 16:11:45,993 epoch 145 - iter 2232/3720 - loss 0.53435324 throughput (samples/sec): 55.29 -2019-08-16 16:16:02,601 epoch 145 - iter 2604/3720 - loss 0.53203734 throughput (samples/sec): 47.68 -2019-08-16 16:19:47,558 epoch 145 - iter 2976/3720 - loss 0.53264483 throughput (samples/sec): 54.46 -2019-08-16 16:23:59,191 epoch 145 - iter 3348/3720 - loss 0.53460981 throughput (samples/sec): 48.87 -2019-08-16 16:27:39,672 ---------------------------------------------------------------------------------------------------- -2019-08-16 16:27:39,673 EPOCH 145 done: loss 0.5355 - lr 0.0250 -2019-08-16 16:27:39,673 BAD EPOCHS (no improvement): 1 -2019-08-16 16:27:39,673 ---------------------------------------------------------------------------------------------------- -2019-08-16 16:27:42,087 epoch 146 - iter 0/3720 - loss 0.36445189 throughput (samples/sec): 12935.79 -2019-08-16 16:31:58,404 epoch 146 - iter 372/3720 - loss 0.53069903 throughput (samples/sec): 47.86 -2019-08-16 16:35:37,960 epoch 146 - iter 744/3720 - loss 0.51701124 throughput (samples/sec): 56.51 -2019-08-16 16:39:48,375 epoch 146 - iter 1116/3720 - loss 0.52519196 throughput (samples/sec): 49.06 -2019-08-16 16:43:26,135 epoch 146 - iter 1488/3720 - loss 0.52646476 throughput (samples/sec): 56.58 -2019-08-16 16:47:40,289 epoch 146 - iter 1860/3720 - loss 0.53076636 throughput (samples/sec): 48.03 -2019-08-16 16:51:24,317 epoch 146 - iter 2232/3720 - loss 0.53141286 throughput (samples/sec): 55.09 -2019-08-16 16:55:37,270 epoch 146 - iter 2604/3720 - loss 0.52936052 throughput (samples/sec): 48.82 -2019-08-16 16:59:16,975 epoch 146 - iter 2976/3720 - loss 0.53222744 throughput (samples/sec): 56.38 -2019-08-16 17:03:26,144 epoch 146 - iter 3348/3720 - loss 0.53195692 throughput (samples/sec): 49.52 -2019-08-16 17:07:09,555 ---------------------------------------------------------------------------------------------------- -2019-08-16 17:07:09,555 EPOCH 146 done: loss 0.5329 - lr 0.0250 -2019-08-16 17:07:09,555 BAD EPOCHS (no improvement): 2 -2019-08-16 17:07:09,555 ---------------------------------------------------------------------------------------------------- -2019-08-16 17:07:11,491 epoch 147 - iter 0/3720 - loss 0.25649238 throughput (samples/sec): 19860.51 -2019-08-16 17:11:17,211 epoch 147 - iter 372/3720 - loss 0.53676751 throughput (samples/sec): 50.16 -2019-08-16 17:14:53,418 epoch 147 - iter 744/3720 - loss 0.54119203 throughput (samples/sec): 56.97 -2019-08-16 17:19:08,997 epoch 147 - iter 1116/3720 - loss 0.53600298 throughput (samples/sec): 48.34 -2019-08-16 17:22:49,309 epoch 147 - iter 1488/3720 - loss 0.53590698 throughput (samples/sec): 55.98 -2019-08-16 17:27:00,721 epoch 147 - iter 1860/3720 - loss 0.53652006 throughput (samples/sec): 48.66 -2019-08-16 17:30:39,801 epoch 147 - iter 2232/3720 - loss 0.53558644 throughput (samples/sec): 56.38 -2019-08-16 17:34:47,187 epoch 147 - iter 2604/3720 - loss 0.53431905 throughput (samples/sec): 49.93 -2019-08-16 17:38:26,823 epoch 147 - iter 2976/3720 - loss 0.53287713 throughput (samples/sec): 55.85 -2019-08-16 17:42:40,751 epoch 147 - iter 3348/3720 - loss 0.53244594 throughput (samples/sec): 48.53 -2019-08-16 17:46:21,389 ---------------------------------------------------------------------------------------------------- -2019-08-16 17:46:21,390 EPOCH 147 done: loss 0.5340 - lr 0.0250 -2019-08-16 17:46:21,390 BAD EPOCHS (no improvement): 3 -2019-08-16 17:46:21,390 ---------------------------------------------------------------------------------------------------- -2019-08-16 17:46:23,379 epoch 148 - iter 0/3720 - loss 0.51061249 throughput (samples/sec): 21030.85 -2019-08-16 17:50:38,308 epoch 148 - iter 372/3720 - loss 0.52756494 throughput (samples/sec): 47.88 -2019-08-16 17:54:19,136 epoch 148 - iter 744/3720 - loss 0.53368149 throughput (samples/sec): 55.50 -2019-08-16 17:58:31,805 epoch 148 - iter 1116/3720 - loss 0.53820451 throughput (samples/sec): 48.93 -2019-08-16 18:02:18,126 epoch 148 - iter 1488/3720 - loss 0.53257269 throughput (samples/sec): 54.20 -2019-08-16 18:06:32,858 epoch 148 - iter 1860/3720 - loss 0.53269776 throughput (samples/sec): 48.26 -2019-08-16 18:10:12,492 epoch 148 - iter 2232/3720 - loss 0.53014567 throughput (samples/sec): 56.02 -2019-08-16 18:14:21,052 epoch 148 - iter 2604/3720 - loss 0.52749310 throughput (samples/sec): 49.24 -2019-08-16 18:18:03,078 epoch 148 - iter 2976/3720 - loss 0.52590351 throughput (samples/sec): 55.46 -2019-08-16 18:22:17,481 epoch 148 - iter 3348/3720 - loss 0.52801033 throughput (samples/sec): 48.56 -2019-08-16 18:25:58,561 ---------------------------------------------------------------------------------------------------- -2019-08-16 18:25:58,562 EPOCH 148 done: loss 0.5280 - lr 0.0250 -2019-08-16 18:25:58,562 BAD EPOCHS (no improvement): 0 -2019-08-16 18:25:58,562 ---------------------------------------------------------------------------------------------------- -2019-08-16 18:26:00,669 epoch 149 - iter 0/3720 - loss 0.42755437 throughput (samples/sec): 18865.28 -2019-08-16 18:30:11,691 epoch 149 - iter 372/3720 - loss 0.53250036 throughput (samples/sec): 48.90 -2019-08-16 18:33:54,833 epoch 149 - iter 744/3720 - loss 0.53193735 throughput (samples/sec): 54.84 -2019-08-16 18:38:04,698 epoch 149 - iter 1116/3720 - loss 0.53354692 throughput (samples/sec): 48.95 -2019-08-16 18:41:46,458 epoch 149 - iter 1488/3720 - loss 0.53388988 throughput (samples/sec): 55.71 -2019-08-16 18:46:01,918 epoch 149 - iter 1860/3720 - loss 0.53713460 throughput (samples/sec): 48.27 -2019-08-16 18:49:41,623 epoch 149 - iter 2232/3720 - loss 0.53652019 throughput (samples/sec): 55.94 -2019-08-16 18:53:57,822 epoch 149 - iter 2604/3720 - loss 0.53371822 throughput (samples/sec): 47.70 -2019-08-16 18:57:36,436 epoch 149 - iter 2976/3720 - loss 0.53389733 throughput (samples/sec): 56.69 -2019-08-16 19:01:48,227 epoch 149 - iter 3348/3720 - loss 0.53356533 throughput (samples/sec): 48.88 -2019-08-16 19:05:27,867 ---------------------------------------------------------------------------------------------------- -2019-08-16 19:05:27,868 EPOCH 149 done: loss 0.5337 - lr 0.0250 -2019-08-16 19:05:27,868 BAD EPOCHS (no improvement): 1 -2019-08-16 19:05:27,868 ---------------------------------------------------------------------------------------------------- -2019-08-16 19:05:30,235 epoch 150 - iter 0/3720 - loss 0.61263156 throughput (samples/sec): 14056.88 -2019-08-16 19:09:39,869 epoch 150 - iter 372/3720 - loss 0.52670288 throughput (samples/sec): 49.13 -2019-08-16 19:13:18,213 epoch 150 - iter 744/3720 - loss 0.52680524 throughput (samples/sec): 56.57 -2019-08-16 19:17:30,823 epoch 150 - iter 1116/3720 - loss 0.52350596 throughput (samples/sec): 48.75 -2019-08-16 19:21:15,536 epoch 150 - iter 1488/3720 - loss 0.52232205 throughput (samples/sec): 54.94 -2019-08-16 19:25:27,106 epoch 150 - iter 1860/3720 - loss 0.52478020 throughput (samples/sec): 48.67 -2019-08-16 19:29:13,694 epoch 150 - iter 2232/3720 - loss 0.52661463 throughput (samples/sec): 54.39 -2019-08-16 19:33:22,534 epoch 150 - iter 2604/3720 - loss 0.52534755 throughput (samples/sec): 49.66 -2019-08-16 19:37:02,712 epoch 150 - iter 2976/3720 - loss 0.52854977 throughput (samples/sec): 56.14 -2019-08-16 19:41:19,684 epoch 150 - iter 3348/3720 - loss 0.52934089 throughput (samples/sec): 47.70 -2019-08-16 19:44:58,859 ---------------------------------------------------------------------------------------------------- -2019-08-16 19:44:58,860 EPOCH 150 done: loss 0.5292 - lr 0.0250 -2019-08-16 19:44:58,860 BAD EPOCHS (no improvement): 2 -2019-08-16 19:45:10,759 ---------------------------------------------------------------------------------------------------- -2019-08-16 19:45:10,759 Testing using best model ... -2019-08-16 19:52:54,354 0.9064 0.9058 0.9061 -2019-08-16 19:52:54,354 -MICRO_AVG: acc 0.8283 - f1-score 0.9061 -MACRO_AVG: acc 0.8118 - f1-score 0.89455 -LOC tp: 10354 - fp: 1214 - fn: 1119 - tn: 10354 - precision: 0.8951 - recall: 0.9025 - accuracy: 0.8161 - f1-score: 0.8988 -MISC tp: 3355 - fp: 575 - fn: 662 - tn: 3355 - precision: 0.8537 - recall: 0.8352 - accuracy: 0.7306 - f1-score: 0.8443 -ORG tp: 2115 - fp: 263 - fn: 335 - tn: 2115 - precision: 0.8894 - recall: 0.8633 - accuracy: 0.7796 - f1-score: 0.8762 -PER tp: 7299 - fp: 337 - fn: 288 - tn: 7299 - precision: 0.9559 - recall: 0.9620 - accuracy: 0.9211 - f1-score: 0.9589 -2019-08-16 19:52:54,354 ---------------------------------------------------------------------------------------------------- +2023-04-05 22:27:04,698 ---------------------------------------------------------------------------------------------------- +2023-04-05 22:27:04,698 Corpus: "MultiCorpus: 107128 train + 11903 dev + 13226 test sentences + - ColumnCorpus Corpus: 107128 train + 11903 dev + 13226 test sentences - /vol/home-vol2/ml/akbikala/.flair/datasets/ner_multi_wikiner/fr" +2023-04-05 22:27:04,698 ---------------------------------------------------------------------------------------------------- +2023-04-05 22:27:04,698 Parameters: +2023-04-05 22:27:04,698 - learning_rate: "0.100000" +2023-04-05 22:27:04,698 - mini_batch_size: "32" +2023-04-05 22:27:04,698 - patience: "3" +2023-04-05 22:27:04,698 - anneal_factor: "0.5" +2023-04-05 22:27:04,699 - max_epochs: "150" +2023-04-05 22:27:04,699 - shuffle: "True" +2023-04-05 22:27:04,699 - train_with_dev: "True" +2023-04-05 22:27:04,699 - batch_growth_annealing: "False" +2023-04-05 22:27:04,699 ---------------------------------------------------------------------------------------------------- +2023-04-05 22:27:04,699 Model training base path: "resources/taggers/release-fr-ner-0" +2023-04-05 22:27:04,699 ---------------------------------------------------------------------------------------------------- +2023-04-05 22:27:04,699 Device: cuda:1 +2023-04-05 22:27:04,699 ---------------------------------------------------------------------------------------------------- +2023-04-05 22:27:04,699 Embeddings storage mode: cpu +2023-04-05 22:27:04,699 ---------------------------------------------------------------------------------------------------- +2023-04-05 22:28:33,936 epoch 1 - iter 372/3720 - loss 0.26668558 - time (sec): 89.24 - samples/sec: 3617.17 - lr: 0.100000 +2023-04-05 22:30:02,154 epoch 1 - iter 744/3720 - loss 0.18821172 - time (sec): 177.45 - samples/sec: 3623.68 - lr: 0.100000 +2023-04-05 22:31:33,098 epoch 1 - iter 1116/3720 - loss 0.15484475 - time (sec): 268.40 - samples/sec: 3598.78 - lr: 0.100000 +2023-04-05 22:32:59,874 epoch 1 - iter 1488/3720 - loss 0.13700614 - time (sec): 355.18 - samples/sec: 3593.73 - lr: 0.100000 +2023-04-05 22:34:26,533 epoch 1 - iter 1860/3720 - loss 0.12470905 - time (sec): 441.83 - samples/sec: 3593.17 - lr: 0.100000 +2023-04-05 22:35:52,865 epoch 1 - iter 2232/3720 - loss 0.11525106 - time (sec): 528.17 - samples/sec: 3587.74 - lr: 0.100000 +2023-04-05 22:37:20,753 epoch 1 - iter 2604/3720 - loss 0.10793162 - time (sec): 616.05 - samples/sec: 3579.76 - lr: 0.100000 +2023-04-05 22:38:49,774 epoch 1 - iter 2976/3720 - loss 0.10238419 - time (sec): 705.08 - samples/sec: 3570.50 - lr: 0.100000 +2023-04-05 22:39:54,061 epoch 1 - iter 3348/3720 - loss 0.09811850 - time (sec): 769.36 - samples/sec: 3686.03 - lr: 0.100000 +2023-04-05 22:40:56,945 epoch 1 - iter 3720/3720 - loss 0.09450245 - time (sec): 832.25 - samples/sec: 3787.00 - lr: 0.100000 +2023-04-05 22:40:56,945 ---------------------------------------------------------------------------------------------------- +2023-04-05 22:40:56,945 EPOCH 1 done: loss 0.0945 - lr 0.100000 +2023-04-05 22:40:56,945 BAD EPOCHS (no improvement): 0 +2023-04-05 22:40:56,948 ---------------------------------------------------------------------------------------------------- +2023-04-05 22:42:00,729 epoch 2 - iter 372/3720 - loss 0.06065240 - time (sec): 63.78 - samples/sec: 4924.62 - lr: 0.100000 +2023-04-05 22:43:05,463 epoch 2 - iter 744/3720 - loss 0.05924859 - time (sec): 128.52 - samples/sec: 4904.42 - lr: 0.100000 +2023-04-05 22:44:09,545 epoch 2 - iter 1116/3720 - loss 0.05885594 - time (sec): 192.60 - samples/sec: 4908.57 - lr: 0.100000 +2023-04-05 22:45:13,493 epoch 2 - iter 1488/3720 - loss 0.05818312 - time (sec): 256.55 - samples/sec: 4910.54 - lr: 0.100000 +2023-04-05 22:46:18,228 epoch 2 - iter 1860/3720 - loss 0.05786242 - time (sec): 321.28 - samples/sec: 4903.04 - lr: 0.100000 +2023-04-05 22:47:22,311 epoch 2 - iter 2232/3720 - loss 0.05702811 - time (sec): 385.36 - samples/sec: 4911.93 - lr: 0.100000 +2023-04-05 22:48:27,905 epoch 2 - iter 2604/3720 - loss 0.05644926 - time (sec): 450.96 - samples/sec: 4896.02 - lr: 0.100000 +2023-04-05 22:49:32,658 epoch 2 - iter 2976/3720 - loss 0.05594932 - time (sec): 515.71 - samples/sec: 4890.45 - lr: 0.100000 +2023-04-05 22:50:37,124 epoch 2 - iter 3348/3720 - loss 0.05562567 - time (sec): 580.18 - samples/sec: 4891.12 - lr: 0.100000 +2023-04-05 22:51:41,572 epoch 2 - iter 3720/3720 - loss 0.05521556 - time (sec): 644.62 - samples/sec: 4889.22 - lr: 0.100000 +2023-04-05 22:51:41,572 ---------------------------------------------------------------------------------------------------- +2023-04-05 22:51:41,572 EPOCH 2 done: loss 0.0552 - lr 0.100000 +2023-04-05 22:51:41,572 BAD EPOCHS (no improvement): 0 +2023-04-05 22:51:41,575 ---------------------------------------------------------------------------------------------------- +2023-04-05 22:52:45,931 epoch 3 - iter 372/3720 - loss 0.05046567 - time (sec): 64.36 - samples/sec: 4895.71 - lr: 0.100000 +2023-04-05 22:53:49,969 epoch 3 - iter 744/3720 - loss 0.05024878 - time (sec): 128.39 - samples/sec: 4895.63 - lr: 0.100000 +2023-04-05 22:54:55,129 epoch 3 - iter 1116/3720 - loss 0.05024194 - time (sec): 193.55 - samples/sec: 4876.90 - lr: 0.100000 +2023-04-05 22:55:59,149 epoch 3 - iter 1488/3720 - loss 0.05028535 - time (sec): 257.57 - samples/sec: 4890.33 - lr: 0.100000 +2023-04-05 22:57:04,010 epoch 3 - iter 1860/3720 - loss 0.05030635 - time (sec): 322.43 - samples/sec: 4888.14 - lr: 0.100000 +2023-04-05 22:58:07,595 epoch 3 - iter 2232/3720 - loss 0.05013778 - time (sec): 386.02 - samples/sec: 4902.42 - lr: 0.100000 +2023-04-05 22:59:11,614 epoch 3 - iter 2604/3720 - loss 0.05015459 - time (sec): 450.04 - samples/sec: 4901.46 - lr: 0.100000 +2023-04-05 23:00:15,174 epoch 3 - iter 2976/3720 - loss 0.04980648 - time (sec): 513.60 - samples/sec: 4911.18 - lr: 0.100000 +2023-04-05 23:01:19,651 epoch 3 - iter 3348/3720 - loss 0.04956168 - time (sec): 578.08 - samples/sec: 4910.97 - lr: 0.100000 +2023-04-05 23:02:23,440 epoch 3 - iter 3720/3720 - loss 0.04952181 - time (sec): 641.86 - samples/sec: 4910.24 - lr: 0.100000 +2023-04-05 23:02:23,440 ---------------------------------------------------------------------------------------------------- +2023-04-05 23:02:23,440 EPOCH 3 done: loss 0.0495 - lr 0.100000 +2023-04-05 23:02:23,441 BAD EPOCHS (no improvement): 0 +2023-04-05 23:02:23,444 ---------------------------------------------------------------------------------------------------- +2023-04-05 23:03:28,321 epoch 4 - iter 372/3720 - loss 0.04613959 - time (sec): 64.88 - samples/sec: 4888.98 - lr: 0.100000 +2023-04-05 23:04:32,814 epoch 4 - iter 744/3720 - loss 0.04723903 - time (sec): 129.37 - samples/sec: 4875.64 - lr: 0.100000 +2023-04-05 23:05:37,556 epoch 4 - iter 1116/3720 - loss 0.04692235 - time (sec): 194.11 - samples/sec: 4880.06 - lr: 0.100000 +2023-04-05 23:06:40,836 epoch 4 - iter 1488/3720 - loss 0.04683749 - time (sec): 257.39 - samples/sec: 4905.46 - lr: 0.100000 +2023-04-05 23:07:45,092 epoch 4 - iter 1860/3720 - loss 0.04668699 - time (sec): 321.65 - samples/sec: 4915.44 - lr: 0.100000 +2023-04-05 23:08:49,644 epoch 4 - iter 2232/3720 - loss 0.04665987 - time (sec): 386.20 - samples/sec: 4907.91 - lr: 0.100000 +2023-04-05 23:09:52,884 epoch 4 - iter 2604/3720 - loss 0.04664835 - time (sec): 449.44 - samples/sec: 4911.95 - lr: 0.100000 +2023-04-05 23:10:57,031 epoch 4 - iter 2976/3720 - loss 0.04652260 - time (sec): 513.59 - samples/sec: 4912.37 - lr: 0.100000 +2023-04-05 23:12:00,247 epoch 4 - iter 3348/3720 - loss 0.04657826 - time (sec): 576.80 - samples/sec: 4918.85 - lr: 0.100000 +2023-04-05 23:13:03,773 epoch 4 - iter 3720/3720 - loss 0.04654629 - time (sec): 640.33 - samples/sec: 4922.02 - lr: 0.100000 +2023-04-05 23:13:03,773 ---------------------------------------------------------------------------------------------------- +2023-04-05 23:13:03,773 EPOCH 4 done: loss 0.0465 - lr 0.100000 +2023-04-05 23:13:03,774 BAD EPOCHS (no improvement): 0 +2023-04-05 23:13:03,776 ---------------------------------------------------------------------------------------------------- +2023-04-05 23:14:07,173 epoch 5 - iter 372/3720 - loss 0.04491548 - time (sec): 63.40 - samples/sec: 4971.42 - lr: 0.100000 +2023-04-05 23:15:09,761 epoch 5 - iter 744/3720 - loss 0.04494219 - time (sec): 125.98 - samples/sec: 4985.63 - lr: 0.100000 +2023-04-05 23:16:15,361 epoch 5 - iter 1116/3720 - loss 0.04485739 - time (sec): 191.58 - samples/sec: 4925.37 - lr: 0.100000 +2023-04-05 23:17:20,769 epoch 5 - iter 1488/3720 - loss 0.04486438 - time (sec): 256.99 - samples/sec: 4901.50 - lr: 0.100000 +2023-04-05 23:18:25,883 epoch 5 - iter 1860/3720 - loss 0.04477035 - time (sec): 322.11 - samples/sec: 4894.20 - lr: 0.100000 +2023-04-05 23:19:29,636 epoch 5 - iter 2232/3720 - loss 0.04462821 - time (sec): 385.86 - samples/sec: 4893.28 - lr: 0.100000 +2023-04-05 23:20:34,474 epoch 5 - iter 2604/3720 - loss 0.04470493 - time (sec): 450.70 - samples/sec: 4884.85 - lr: 0.100000 +2023-04-05 23:21:39,925 epoch 5 - iter 2976/3720 - loss 0.04477533 - time (sec): 516.15 - samples/sec: 4879.53 - lr: 0.100000 +2023-04-05 23:22:44,993 epoch 5 - iter 3348/3720 - loss 0.04475228 - time (sec): 581.22 - samples/sec: 4877.68 - lr: 0.100000 +2023-04-05 23:23:50,164 epoch 5 - iter 3720/3720 - loss 0.04467442 - time (sec): 646.39 - samples/sec: 4875.88 - lr: 0.100000 +2023-04-05 23:23:50,165 ---------------------------------------------------------------------------------------------------- +2023-04-05 23:23:50,165 EPOCH 5 done: loss 0.0447 - lr 0.100000 +2023-04-05 23:23:50,165 BAD EPOCHS (no improvement): 0 +2023-04-05 23:23:50,168 ---------------------------------------------------------------------------------------------------- +2023-04-05 23:24:56,275 epoch 6 - iter 372/3720 - loss 0.04236946 - time (sec): 66.11 - samples/sec: 4800.02 - lr: 0.100000 +2023-04-05 23:26:00,676 epoch 6 - iter 744/3720 - loss 0.04346961 - time (sec): 130.51 - samples/sec: 4833.73 - lr: 0.100000 +2023-04-05 23:27:05,725 epoch 6 - iter 1116/3720 - loss 0.04341193 - time (sec): 195.56 - samples/sec: 4834.31 - lr: 0.100000 +2023-04-05 23:28:10,557 epoch 6 - iter 1488/3720 - loss 0.04353977 - time (sec): 260.39 - samples/sec: 4843.95 - lr: 0.100000 +2023-04-05 23:29:14,854 epoch 6 - iter 1860/3720 - loss 0.04356128 - time (sec): 324.69 - samples/sec: 4852.90 - lr: 0.100000 +2023-04-05 23:30:19,014 epoch 6 - iter 2232/3720 - loss 0.04363767 - time (sec): 388.85 - samples/sec: 4858.71 - lr: 0.100000 +2023-04-05 23:31:23,740 epoch 6 - iter 2604/3720 - loss 0.04364881 - time (sec): 453.57 - samples/sec: 4852.89 - lr: 0.100000 +2023-04-05 23:32:28,669 epoch 6 - iter 2976/3720 - loss 0.04361488 - time (sec): 518.50 - samples/sec: 4851.02 - lr: 0.100000 +2023-04-05 23:33:35,290 epoch 6 - iter 3348/3720 - loss 0.04342392 - time (sec): 585.12 - samples/sec: 4844.92 - lr: 0.100000 +2023-04-05 23:34:40,827 epoch 6 - iter 3720/3720 - loss 0.04337900 - time (sec): 650.66 - samples/sec: 4843.88 - lr: 0.100000 +2023-04-05 23:34:40,827 ---------------------------------------------------------------------------------------------------- +2023-04-05 23:34:40,827 EPOCH 6 done: loss 0.0434 - lr 0.100000 +2023-04-05 23:34:40,827 BAD EPOCHS (no improvement): 0 +2023-04-05 23:34:40,830 ---------------------------------------------------------------------------------------------------- +2023-04-05 23:35:46,776 epoch 7 - iter 372/3720 - loss 0.04216405 - time (sec): 65.95 - samples/sec: 4799.64 - lr: 0.100000 +2023-04-05 23:36:51,460 epoch 7 - iter 744/3720 - loss 0.04195712 - time (sec): 130.63 - samples/sec: 4816.10 - lr: 0.100000 +2023-04-05 23:37:55,121 epoch 7 - iter 1116/3720 - loss 0.04172125 - time (sec): 194.29 - samples/sec: 4864.28 - lr: 0.100000 +2023-04-05 23:39:00,044 epoch 7 - iter 1488/3720 - loss 0.04181797 - time (sec): 259.21 - samples/sec: 4867.10 - lr: 0.100000 +2023-04-05 23:40:05,144 epoch 7 - iter 1860/3720 - loss 0.04193096 - time (sec): 324.31 - samples/sec: 4859.06 - lr: 0.100000 +2023-04-05 23:41:10,633 epoch 7 - iter 2232/3720 - loss 0.04198594 - time (sec): 389.80 - samples/sec: 4849.47 - lr: 0.100000 +2023-04-05 23:42:14,072 epoch 7 - iter 2604/3720 - loss 0.04209685 - time (sec): 453.24 - samples/sec: 4862.50 - lr: 0.100000 +2023-04-05 23:43:18,823 epoch 7 - iter 2976/3720 - loss 0.04213716 - time (sec): 517.99 - samples/sec: 4863.88 - lr: 0.100000 +2023-04-05 23:44:23,416 epoch 7 - iter 3348/3720 - loss 0.04224028 - time (sec): 582.59 - samples/sec: 4868.17 - lr: 0.100000 +2023-04-05 23:45:29,396 epoch 7 - iter 3720/3720 - loss 0.04226558 - time (sec): 648.57 - samples/sec: 4859.51 - lr: 0.100000 +2023-04-05 23:45:29,396 ---------------------------------------------------------------------------------------------------- +2023-04-05 23:45:29,396 EPOCH 7 done: loss 0.0423 - lr 0.100000 +2023-04-05 23:45:29,396 BAD EPOCHS (no improvement): 0 +2023-04-05 23:45:29,399 ---------------------------------------------------------------------------------------------------- +2023-04-05 23:46:33,584 epoch 8 - iter 372/3720 - loss 0.04172150 - time (sec): 64.18 - samples/sec: 4911.49 - lr: 0.100000 +2023-04-05 23:47:37,938 epoch 8 - iter 744/3720 - loss 0.04180014 - time (sec): 128.54 - samples/sec: 4896.63 - lr: 0.100000 +2023-04-05 23:48:42,007 epoch 8 - iter 1116/3720 - loss 0.04179824 - time (sec): 192.61 - samples/sec: 4911.23 - lr: 0.100000 +2023-04-05 23:49:45,242 epoch 8 - iter 1488/3720 - loss 0.04151445 - time (sec): 255.84 - samples/sec: 4931.13 - lr: 0.100000 +2023-04-05 23:50:49,675 epoch 8 - iter 1860/3720 - loss 0.04166393 - time (sec): 320.28 - samples/sec: 4923.25 - lr: 0.100000 +2023-04-05 23:51:55,508 epoch 8 - iter 2232/3720 - loss 0.04150733 - time (sec): 386.11 - samples/sec: 4903.37 - lr: 0.100000 +2023-04-05 23:53:01,769 epoch 8 - iter 2604/3720 - loss 0.04146176 - time (sec): 452.37 - samples/sec: 4876.82 - lr: 0.100000 +2023-04-05 23:54:06,502 epoch 8 - iter 2976/3720 - loss 0.04150560 - time (sec): 517.10 - samples/sec: 4872.69 - lr: 0.100000 +2023-04-05 23:55:12,693 epoch 8 - iter 3348/3720 - loss 0.04151976 - time (sec): 583.29 - samples/sec: 4864.86 - lr: 0.100000 +2023-04-05 23:56:17,542 epoch 8 - iter 3720/3720 - loss 0.04164803 - time (sec): 648.14 - samples/sec: 4862.68 - lr: 0.100000 +2023-04-05 23:56:17,543 ---------------------------------------------------------------------------------------------------- +2023-04-05 23:56:17,543 EPOCH 8 done: loss 0.0416 - lr 0.100000 +2023-04-05 23:56:17,543 BAD EPOCHS (no improvement): 0 +2023-04-05 23:56:17,545 ---------------------------------------------------------------------------------------------------- +2023-04-05 23:57:22,891 epoch 9 - iter 372/3720 - loss 0.04059165 - time (sec): 65.35 - samples/sec: 4821.72 - lr: 0.100000 +2023-04-05 23:58:28,040 epoch 9 - iter 744/3720 - loss 0.04076265 - time (sec): 130.49 - samples/sec: 4826.48 - lr: 0.100000 +2023-04-05 23:59:32,267 epoch 9 - iter 1116/3720 - loss 0.04079673 - time (sec): 194.72 - samples/sec: 4845.58 - lr: 0.100000 +2023-04-06 00:00:37,866 epoch 9 - iter 1488/3720 - loss 0.04100264 - time (sec): 260.32 - samples/sec: 4838.91 - lr: 0.100000 +2023-04-06 00:01:42,188 epoch 9 - iter 1860/3720 - loss 0.04102605 - time (sec): 324.64 - samples/sec: 4848.46 - lr: 0.100000 +2023-04-06 00:02:46,538 epoch 9 - iter 2232/3720 - loss 0.04095108 - time (sec): 388.99 - samples/sec: 4859.31 - lr: 0.100000 +2023-04-06 00:03:51,285 epoch 9 - iter 2604/3720 - loss 0.04087753 - time (sec): 453.74 - samples/sec: 4866.60 - lr: 0.100000 +2023-04-06 00:04:55,279 epoch 9 - iter 2976/3720 - loss 0.04081089 - time (sec): 517.73 - samples/sec: 4872.21 - lr: 0.100000 +2023-04-06 00:06:01,561 epoch 9 - iter 3348/3720 - loss 0.04085946 - time (sec): 584.02 - samples/sec: 4859.40 - lr: 0.100000 +2023-04-06 00:07:06,309 epoch 9 - iter 3720/3720 - loss 0.04084458 - time (sec): 648.76 - samples/sec: 4858.03 - lr: 0.100000 +2023-04-06 00:07:06,309 ---------------------------------------------------------------------------------------------------- +2023-04-06 00:07:06,309 EPOCH 9 done: loss 0.0408 - lr 0.100000 +2023-04-06 00:07:06,309 BAD EPOCHS (no improvement): 0 +2023-04-06 00:07:06,312 ---------------------------------------------------------------------------------------------------- +2023-04-06 00:08:11,202 epoch 10 - iter 372/3720 - loss 0.03977085 - time (sec): 64.89 - samples/sec: 4857.10 - lr: 0.100000 +2023-04-06 00:09:16,581 epoch 10 - iter 744/3720 - loss 0.04042448 - time (sec): 130.27 - samples/sec: 4828.72 - lr: 0.100000 +2023-04-06 00:10:22,000 epoch 10 - iter 1116/3720 - loss 0.04021729 - time (sec): 195.69 - samples/sec: 4825.54 - lr: 0.100000 +2023-04-06 00:11:27,331 epoch 10 - iter 1488/3720 - loss 0.04006120 - time (sec): 261.02 - samples/sec: 4826.13 - lr: 0.100000 +2023-04-06 00:12:30,914 epoch 10 - iter 1860/3720 - loss 0.04018432 - time (sec): 324.60 - samples/sec: 4849.77 - lr: 0.100000 +2023-04-06 00:13:34,453 epoch 10 - iter 2232/3720 - loss 0.04038774 - time (sec): 388.14 - samples/sec: 4866.26 - lr: 0.100000 +2023-04-06 00:14:39,329 epoch 10 - iter 2604/3720 - loss 0.04035558 - time (sec): 453.02 - samples/sec: 4865.27 - lr: 0.100000 +2023-04-06 00:15:44,245 epoch 10 - iter 2976/3720 - loss 0.04031628 - time (sec): 517.93 - samples/sec: 4859.06 - lr: 0.100000 +2023-04-06 00:16:50,500 epoch 10 - iter 3348/3720 - loss 0.04030915 - time (sec): 584.19 - samples/sec: 4851.80 - lr: 0.100000 +2023-04-06 00:17:56,482 epoch 10 - iter 3720/3720 - loss 0.04028057 - time (sec): 650.17 - samples/sec: 4847.52 - lr: 0.100000 +2023-04-06 00:17:56,482 ---------------------------------------------------------------------------------------------------- +2023-04-06 00:17:56,482 EPOCH 10 done: loss 0.0403 - lr 0.100000 +2023-04-06 00:17:56,482 BAD EPOCHS (no improvement): 0 +2023-04-06 00:17:56,485 ---------------------------------------------------------------------------------------------------- +2023-04-06 00:19:02,260 epoch 11 - iter 372/3720 - loss 0.03881162 - time (sec): 65.78 - samples/sec: 4790.89 - lr: 0.100000 +2023-04-06 00:20:07,864 epoch 11 - iter 744/3720 - loss 0.03934850 - time (sec): 131.38 - samples/sec: 4801.79 - lr: 0.100000 +2023-04-06 00:21:12,756 epoch 11 - iter 1116/3720 - loss 0.03941690 - time (sec): 196.27 - samples/sec: 4817.33 - lr: 0.100000 +2023-04-06 00:22:17,917 epoch 11 - iter 1488/3720 - loss 0.03964001 - time (sec): 261.43 - samples/sec: 4819.91 - lr: 0.100000 +2023-04-06 00:23:23,428 epoch 11 - iter 1860/3720 - loss 0.03969471 - time (sec): 326.94 - samples/sec: 4821.40 - lr: 0.100000 +2023-04-06 00:24:28,856 epoch 11 - iter 2232/3720 - loss 0.03980826 - time (sec): 392.37 - samples/sec: 4822.24 - lr: 0.100000 +2023-04-06 00:25:34,439 epoch 11 - iter 2604/3720 - loss 0.03980274 - time (sec): 457.95 - samples/sec: 4817.42 - lr: 0.100000 +2023-04-06 00:26:40,245 epoch 11 - iter 2976/3720 - loss 0.03986743 - time (sec): 523.76 - samples/sec: 4815.16 - lr: 0.100000 +2023-04-06 00:27:44,010 epoch 11 - iter 3348/3720 - loss 0.03985353 - time (sec): 587.53 - samples/sec: 4829.76 - lr: 0.100000 +2023-04-06 00:28:49,148 epoch 11 - iter 3720/3720 - loss 0.03979586 - time (sec): 652.66 - samples/sec: 4829.00 - lr: 0.100000 +2023-04-06 00:28:49,148 ---------------------------------------------------------------------------------------------------- +2023-04-06 00:28:49,148 EPOCH 11 done: loss 0.0398 - lr 0.100000 +2023-04-06 00:28:49,148 BAD EPOCHS (no improvement): 0 +2023-04-06 00:28:49,152 ---------------------------------------------------------------------------------------------------- +2023-04-06 00:29:55,927 epoch 12 - iter 372/3720 - loss 0.03948977 - time (sec): 66.78 - samples/sec: 4753.05 - lr: 0.100000 +2023-04-06 00:31:00,559 epoch 12 - iter 744/3720 - loss 0.03857903 - time (sec): 131.41 - samples/sec: 4815.13 - lr: 0.100000 +2023-04-06 00:32:06,155 epoch 12 - iter 1116/3720 - loss 0.03863680 - time (sec): 197.00 - samples/sec: 4817.46 - lr: 0.100000 +2023-04-06 00:33:10,411 epoch 12 - iter 1488/3720 - loss 0.03888190 - time (sec): 261.26 - samples/sec: 4835.92 - lr: 0.100000 +2023-04-06 00:34:14,880 epoch 12 - iter 1860/3720 - loss 0.03894279 - time (sec): 325.73 - samples/sec: 4840.66 - lr: 0.100000 +2023-04-06 00:35:19,705 epoch 12 - iter 2232/3720 - loss 0.03904878 - time (sec): 390.55 - samples/sec: 4846.41 - lr: 0.100000 +2023-04-06 00:36:23,790 epoch 12 - iter 2604/3720 - loss 0.03926250 - time (sec): 454.64 - samples/sec: 4852.32 - lr: 0.100000 +2023-04-06 00:37:29,351 epoch 12 - iter 2976/3720 - loss 0.03935777 - time (sec): 520.20 - samples/sec: 4849.10 - lr: 0.100000 +2023-04-06 00:38:34,450 epoch 12 - iter 3348/3720 - loss 0.03927677 - time (sec): 585.30 - samples/sec: 4849.29 - lr: 0.100000 +2023-04-06 00:39:37,391 epoch 12 - iter 3720/3720 - loss 0.03929491 - time (sec): 648.24 - samples/sec: 4861.96 - lr: 0.100000 +2023-04-06 00:39:37,391 ---------------------------------------------------------------------------------------------------- +2023-04-06 00:39:37,391 EPOCH 12 done: loss 0.0393 - lr 0.100000 +2023-04-06 00:39:37,391 BAD EPOCHS (no improvement): 0 +2023-04-06 00:39:37,395 ---------------------------------------------------------------------------------------------------- +2023-04-06 00:40:42,023 epoch 13 - iter 372/3720 - loss 0.03793697 - time (sec): 64.63 - samples/sec: 4907.18 - lr: 0.100000 +2023-04-06 00:41:47,485 epoch 13 - iter 744/3720 - loss 0.03851898 - time (sec): 130.09 - samples/sec: 4872.84 - lr: 0.100000 +2023-04-06 00:42:53,288 epoch 13 - iter 1116/3720 - loss 0.03867673 - time (sec): 195.89 - samples/sec: 4836.38 - lr: 0.100000 +2023-04-06 00:43:58,372 epoch 13 - iter 1488/3720 - loss 0.03867665 - time (sec): 260.98 - samples/sec: 4841.98 - lr: 0.100000 +2023-04-06 00:45:04,638 epoch 13 - iter 1860/3720 - loss 0.03897579 - time (sec): 327.24 - samples/sec: 4830.30 - lr: 0.100000 +2023-04-06 00:46:09,680 epoch 13 - iter 2232/3720 - loss 0.03911655 - time (sec): 392.29 - samples/sec: 4833.13 - lr: 0.100000 +2023-04-06 00:47:14,113 epoch 13 - iter 2604/3720 - loss 0.03913999 - time (sec): 456.72 - samples/sec: 4839.97 - lr: 0.100000 +2023-04-06 00:48:19,561 epoch 13 - iter 2976/3720 - loss 0.03915125 - time (sec): 522.17 - samples/sec: 4833.02 - lr: 0.100000 +2023-04-06 00:49:25,258 epoch 13 - iter 3348/3720 - loss 0.03928003 - time (sec): 587.86 - samples/sec: 4827.79 - lr: 0.100000 +2023-04-06 00:50:30,379 epoch 13 - iter 3720/3720 - loss 0.03920813 - time (sec): 652.98 - samples/sec: 4826.63 - lr: 0.100000 +2023-04-06 00:50:30,379 ---------------------------------------------------------------------------------------------------- +2023-04-06 00:50:30,379 EPOCH 13 done: loss 0.0392 - lr 0.100000 +2023-04-06 00:50:30,379 BAD EPOCHS (no improvement): 0 +2023-04-06 00:50:30,383 ---------------------------------------------------------------------------------------------------- +2023-04-06 00:51:35,122 epoch 14 - iter 372/3720 - loss 0.03718396 - time (sec): 64.74 - samples/sec: 4874.25 - lr: 0.100000 +2023-04-06 00:52:39,958 epoch 14 - iter 744/3720 - loss 0.03795859 - time (sec): 129.58 - samples/sec: 4864.62 - lr: 0.100000 +2023-04-06 00:53:44,221 epoch 14 - iter 1116/3720 - loss 0.03814956 - time (sec): 193.84 - samples/sec: 4879.49 - lr: 0.100000 +2023-04-06 00:54:48,326 epoch 14 - iter 1488/3720 - loss 0.03824906 - time (sec): 257.94 - samples/sec: 4887.69 - lr: 0.100000 +2023-04-06 00:55:53,342 epoch 14 - iter 1860/3720 - loss 0.03841750 - time (sec): 322.96 - samples/sec: 4886.92 - lr: 0.100000 +2023-04-06 00:56:56,998 epoch 14 - iter 2232/3720 - loss 0.03869255 - time (sec): 386.62 - samples/sec: 4893.93 - lr: 0.100000 +2023-04-06 00:58:01,416 epoch 14 - iter 2604/3720 - loss 0.03867406 - time (sec): 451.03 - samples/sec: 4891.72 - lr: 0.100000 +2023-04-06 00:59:06,253 epoch 14 - iter 2976/3720 - loss 0.03879602 - time (sec): 515.87 - samples/sec: 4886.24 - lr: 0.100000 +2023-04-06 01:00:11,096 epoch 14 - iter 3348/3720 - loss 0.03868007 - time (sec): 580.71 - samples/sec: 4884.80 - lr: 0.100000 +2023-04-06 01:01:16,460 epoch 14 - iter 3720/3720 - loss 0.03875447 - time (sec): 646.08 - samples/sec: 4878.23 - lr: 0.100000 +2023-04-06 01:01:16,460 ---------------------------------------------------------------------------------------------------- +2023-04-06 01:01:16,460 EPOCH 14 done: loss 0.0388 - lr 0.100000 +2023-04-06 01:01:16,460 BAD EPOCHS (no improvement): 0 +2023-04-06 01:01:16,464 ---------------------------------------------------------------------------------------------------- +2023-04-06 01:02:21,589 epoch 15 - iter 372/3720 - loss 0.03884488 - time (sec): 65.12 - samples/sec: 4859.08 - lr: 0.100000 +2023-04-06 01:03:26,238 epoch 15 - iter 744/3720 - loss 0.03831782 - time (sec): 129.77 - samples/sec: 4871.54 - lr: 0.100000 +2023-04-06 01:04:29,717 epoch 15 - iter 1116/3720 - loss 0.03824842 - time (sec): 193.25 - samples/sec: 4896.28 - lr: 0.100000 +2023-04-06 01:05:33,584 epoch 15 - iter 1488/3720 - loss 0.03824843 - time (sec): 257.12 - samples/sec: 4903.13 - lr: 0.100000 +2023-04-06 01:06:38,784 epoch 15 - iter 1860/3720 - loss 0.03847771 - time (sec): 322.32 - samples/sec: 4896.35 - lr: 0.100000 +2023-04-06 01:07:43,045 epoch 15 - iter 2232/3720 - loss 0.03837810 - time (sec): 386.58 - samples/sec: 4895.60 - lr: 0.100000 +2023-04-06 01:08:47,591 epoch 15 - iter 2604/3720 - loss 0.03846540 - time (sec): 451.13 - samples/sec: 4887.26 - lr: 0.100000 +2023-04-06 01:09:52,730 epoch 15 - iter 2976/3720 - loss 0.03853469 - time (sec): 516.27 - samples/sec: 4884.77 - lr: 0.100000 +2023-04-06 01:10:58,427 epoch 15 - iter 3348/3720 - loss 0.03841999 - time (sec): 581.96 - samples/sec: 4877.72 - lr: 0.100000 +2023-04-06 01:12:02,191 epoch 15 - iter 3720/3720 - loss 0.03840150 - time (sec): 645.73 - samples/sec: 4880.88 - lr: 0.100000 +2023-04-06 01:12:02,191 ---------------------------------------------------------------------------------------------------- +2023-04-06 01:12:02,191 EPOCH 15 done: loss 0.0384 - lr 0.100000 +2023-04-06 01:12:02,191 BAD EPOCHS (no improvement): 0 +2023-04-06 01:12:02,194 ---------------------------------------------------------------------------------------------------- +2023-04-06 01:13:07,605 epoch 16 - iter 372/3720 - loss 0.03656534 - time (sec): 65.41 - samples/sec: 4811.92 - lr: 0.100000 +2023-04-06 01:14:13,165 epoch 16 - iter 744/3720 - loss 0.03768461 - time (sec): 130.97 - samples/sec: 4816.79 - lr: 0.100000 +2023-04-06 01:15:18,025 epoch 16 - iter 1116/3720 - loss 0.03769401 - time (sec): 195.83 - samples/sec: 4827.59 - lr: 0.100000 +2023-04-06 01:16:22,286 epoch 16 - iter 1488/3720 - loss 0.03801334 - time (sec): 260.09 - samples/sec: 4847.08 - lr: 0.100000 +2023-04-06 01:17:27,638 epoch 16 - iter 1860/3720 - loss 0.03814107 - time (sec): 325.44 - samples/sec: 4842.98 - lr: 0.100000 +2023-04-06 01:18:32,828 epoch 16 - iter 2232/3720 - loss 0.03806304 - time (sec): 390.63 - samples/sec: 4848.90 - lr: 0.100000 +2023-04-06 01:19:36,777 epoch 16 - iter 2604/3720 - loss 0.03810921 - time (sec): 454.58 - samples/sec: 4856.32 - lr: 0.100000 +2023-04-06 01:20:39,643 epoch 16 - iter 2976/3720 - loss 0.03800707 - time (sec): 517.45 - samples/sec: 4872.65 - lr: 0.100000 +2023-04-06 01:21:43,342 epoch 16 - iter 3348/3720 - loss 0.03808011 - time (sec): 581.15 - samples/sec: 4881.02 - lr: 0.100000 +2023-04-06 01:22:47,752 epoch 16 - iter 3720/3720 - loss 0.03817140 - time (sec): 645.56 - samples/sec: 4882.15 - lr: 0.100000 +2023-04-06 01:22:47,753 ---------------------------------------------------------------------------------------------------- +2023-04-06 01:22:47,753 EPOCH 16 done: loss 0.0382 - lr 0.100000 +2023-04-06 01:22:47,753 BAD EPOCHS (no improvement): 0 +2023-04-06 01:22:47,756 ---------------------------------------------------------------------------------------------------- +2023-04-06 01:23:52,545 epoch 17 - iter 372/3720 - loss 0.03777496 - time (sec): 64.79 - samples/sec: 4873.10 - lr: 0.100000 +2023-04-06 01:24:57,014 epoch 17 - iter 744/3720 - loss 0.03762120 - time (sec): 129.26 - samples/sec: 4875.10 - lr: 0.100000 +2023-04-06 01:26:02,115 epoch 17 - iter 1116/3720 - loss 0.03794625 - time (sec): 194.36 - samples/sec: 4871.71 - lr: 0.100000 +2023-04-06 01:27:07,547 epoch 17 - iter 1488/3720 - loss 0.03782393 - time (sec): 259.79 - samples/sec: 4864.06 - lr: 0.100000 +2023-04-06 01:28:11,650 epoch 17 - iter 1860/3720 - loss 0.03782723 - time (sec): 323.89 - samples/sec: 4874.57 - lr: 0.100000 +2023-04-06 01:29:15,043 epoch 17 - iter 2232/3720 - loss 0.03774844 - time (sec): 387.29 - samples/sec: 4893.80 - lr: 0.100000 +2023-04-06 01:30:19,164 epoch 17 - iter 2604/3720 - loss 0.03766911 - time (sec): 451.41 - samples/sec: 4902.54 - lr: 0.100000 +2023-04-06 01:31:22,179 epoch 17 - iter 2976/3720 - loss 0.03783737 - time (sec): 514.42 - samples/sec: 4911.87 - lr: 0.100000 +2023-04-06 01:32:24,708 epoch 17 - iter 3348/3720 - loss 0.03791902 - time (sec): 576.95 - samples/sec: 4920.71 - lr: 0.100000 +2023-04-06 01:33:29,291 epoch 17 - iter 3720/3720 - loss 0.03798204 - time (sec): 641.53 - samples/sec: 4912.77 - lr: 0.100000 +2023-04-06 01:33:29,291 ---------------------------------------------------------------------------------------------------- +2023-04-06 01:33:29,291 EPOCH 17 done: loss 0.0380 - lr 0.100000 +2023-04-06 01:33:29,291 BAD EPOCHS (no improvement): 0 +2023-04-06 01:33:29,295 ---------------------------------------------------------------------------------------------------- +2023-04-06 01:34:33,127 epoch 18 - iter 372/3720 - loss 0.03717692 - time (sec): 63.83 - samples/sec: 4943.40 - lr: 0.100000 +2023-04-06 01:35:36,821 epoch 18 - iter 744/3720 - loss 0.03806882 - time (sec): 127.53 - samples/sec: 4946.33 - lr: 0.100000 +2023-04-06 01:36:40,369 epoch 18 - iter 1116/3720 - loss 0.03788397 - time (sec): 191.07 - samples/sec: 4950.24 - lr: 0.100000 +2023-04-06 01:37:45,086 epoch 18 - iter 1488/3720 - loss 0.03811433 - time (sec): 255.79 - samples/sec: 4941.13 - lr: 0.100000 +2023-04-06 01:38:50,149 epoch 18 - iter 1860/3720 - loss 0.03789941 - time (sec): 320.85 - samples/sec: 4923.11 - lr: 0.100000 +2023-04-06 01:39:53,735 epoch 18 - iter 2232/3720 - loss 0.03799931 - time (sec): 384.44 - samples/sec: 4923.81 - lr: 0.100000 +2023-04-06 01:40:57,148 epoch 18 - iter 2604/3720 - loss 0.03787706 - time (sec): 447.85 - samples/sec: 4928.18 - lr: 0.100000 +2023-04-06 01:42:01,906 epoch 18 - iter 2976/3720 - loss 0.03800637 - time (sec): 512.61 - samples/sec: 4925.40 - lr: 0.100000 +2023-04-06 01:43:05,441 epoch 18 - iter 3348/3720 - loss 0.03806865 - time (sec): 576.15 - samples/sec: 4928.27 - lr: 0.100000 +2023-04-06 01:44:09,375 epoch 18 - iter 3720/3720 - loss 0.03801343 - time (sec): 640.08 - samples/sec: 4923.93 - lr: 0.100000 +2023-04-06 01:44:09,376 ---------------------------------------------------------------------------------------------------- +2023-04-06 01:44:09,376 EPOCH 18 done: loss 0.0380 - lr 0.100000 +2023-04-06 01:44:09,376 BAD EPOCHS (no improvement): 1 +2023-04-06 01:44:09,379 ---------------------------------------------------------------------------------------------------- +2023-04-06 01:45:13,657 epoch 19 - iter 372/3720 - loss 0.03779553 - time (sec): 64.28 - samples/sec: 4898.67 - lr: 0.100000 +2023-04-06 01:46:16,968 epoch 19 - iter 744/3720 - loss 0.03734848 - time (sec): 127.59 - samples/sec: 4932.26 - lr: 0.100000 +2023-04-06 01:47:20,913 epoch 19 - iter 1116/3720 - loss 0.03732153 - time (sec): 191.53 - samples/sec: 4933.50 - lr: 0.100000 +2023-04-06 01:48:24,318 epoch 19 - iter 1488/3720 - loss 0.03741383 - time (sec): 254.94 - samples/sec: 4928.21 - lr: 0.100000 +2023-04-06 01:49:28,405 epoch 19 - iter 1860/3720 - loss 0.03746305 - time (sec): 319.03 - samples/sec: 4928.28 - lr: 0.100000 +2023-04-06 01:50:33,078 epoch 19 - iter 2232/3720 - loss 0.03737705 - time (sec): 383.70 - samples/sec: 4924.75 - lr: 0.100000 +2023-04-06 01:51:36,689 epoch 19 - iter 2604/3720 - loss 0.03751033 - time (sec): 447.31 - samples/sec: 4933.01 - lr: 0.100000 +2023-04-06 01:52:39,422 epoch 19 - iter 2976/3720 - loss 0.03767277 - time (sec): 510.04 - samples/sec: 4945.22 - lr: 0.100000 +2023-04-06 01:53:41,842 epoch 19 - iter 3348/3720 - loss 0.03771265 - time (sec): 572.46 - samples/sec: 4956.63 - lr: 0.100000 +2023-04-06 01:54:44,403 epoch 19 - iter 3720/3720 - loss 0.03780869 - time (sec): 635.02 - samples/sec: 4963.14 - lr: 0.100000 +2023-04-06 01:54:44,404 ---------------------------------------------------------------------------------------------------- +2023-04-06 01:54:44,404 EPOCH 19 done: loss 0.0378 - lr 0.100000 +2023-04-06 01:54:44,404 BAD EPOCHS (no improvement): 0 +2023-04-06 01:54:44,406 ---------------------------------------------------------------------------------------------------- +2023-04-06 01:55:47,875 epoch 20 - iter 372/3720 - loss 0.03785798 - time (sec): 63.47 - samples/sec: 4947.77 - lr: 0.100000 +2023-04-06 01:56:51,003 epoch 20 - iter 744/3720 - loss 0.03783281 - time (sec): 126.60 - samples/sec: 4952.04 - lr: 0.100000 +2023-04-06 01:57:53,716 epoch 20 - iter 1116/3720 - loss 0.03755687 - time (sec): 189.31 - samples/sec: 4981.33 - lr: 0.100000 +2023-04-06 01:58:56,752 epoch 20 - iter 1488/3720 - loss 0.03759708 - time (sec): 252.35 - samples/sec: 4986.73 - lr: 0.100000 +2023-04-06 02:00:01,439 epoch 20 - iter 1860/3720 - loss 0.03753506 - time (sec): 317.03 - samples/sec: 4970.13 - lr: 0.100000 +2023-04-06 02:01:05,828 epoch 20 - iter 2232/3720 - loss 0.03742842 - time (sec): 381.42 - samples/sec: 4959.00 - lr: 0.100000 +2023-04-06 02:02:08,245 epoch 20 - iter 2604/3720 - loss 0.03733267 - time (sec): 443.84 - samples/sec: 4973.81 - lr: 0.100000 +2023-04-06 02:03:11,107 epoch 20 - iter 2976/3720 - loss 0.03736629 - time (sec): 506.70 - samples/sec: 4976.22 - lr: 0.100000 +2023-04-06 02:04:13,467 epoch 20 - iter 3348/3720 - loss 0.03749929 - time (sec): 569.06 - samples/sec: 4982.46 - lr: 0.100000 +2023-04-06 02:05:16,497 epoch 20 - iter 3720/3720 - loss 0.03755917 - time (sec): 632.09 - samples/sec: 4986.17 - lr: 0.100000 +2023-04-06 02:05:16,498 ---------------------------------------------------------------------------------------------------- +2023-04-06 02:05:16,498 EPOCH 20 done: loss 0.0376 - lr 0.100000 +2023-04-06 02:05:16,498 BAD EPOCHS (no improvement): 0 +2023-04-06 02:05:16,501 ---------------------------------------------------------------------------------------------------- +2023-04-06 02:06:19,401 epoch 21 - iter 372/3720 - loss 0.03719930 - time (sec): 62.90 - samples/sec: 5020.08 - lr: 0.100000 +2023-04-06 02:07:21,749 epoch 21 - iter 744/3720 - loss 0.03706269 - time (sec): 125.25 - samples/sec: 5043.64 - lr: 0.100000 +2023-04-06 02:08:23,831 epoch 21 - iter 1116/3720 - loss 0.03711430 - time (sec): 187.33 - samples/sec: 5051.85 - lr: 0.100000 +2023-04-06 02:09:26,831 epoch 21 - iter 1488/3720 - loss 0.03725920 - time (sec): 250.33 - samples/sec: 5039.63 - lr: 0.100000 +2023-04-06 02:10:29,874 epoch 21 - iter 1860/3720 - loss 0.03730278 - time (sec): 313.37 - samples/sec: 5027.99 - lr: 0.100000 +2023-04-06 02:11:32,149 epoch 21 - iter 2232/3720 - loss 0.03721740 - time (sec): 375.65 - samples/sec: 5032.88 - lr: 0.100000 +2023-04-06 02:12:34,707 epoch 21 - iter 2604/3720 - loss 0.03732940 - time (sec): 438.21 - samples/sec: 5035.33 - lr: 0.100000 +2023-04-06 02:13:37,977 epoch 21 - iter 2976/3720 - loss 0.03738477 - time (sec): 501.48 - samples/sec: 5033.70 - lr: 0.100000 +2023-04-06 02:14:41,524 epoch 21 - iter 3348/3720 - loss 0.03738079 - time (sec): 565.02 - samples/sec: 5023.15 - lr: 0.100000 +2023-04-06 02:15:44,618 epoch 21 - iter 3720/3720 - loss 0.03743202 - time (sec): 628.12 - samples/sec: 5017.71 - lr: 0.100000 +2023-04-06 02:15:44,618 ---------------------------------------------------------------------------------------------------- +2023-04-06 02:15:44,618 EPOCH 21 done: loss 0.0374 - lr 0.100000 +2023-04-06 02:15:44,618 BAD EPOCHS (no improvement): 0 +2023-04-06 02:15:44,621 ---------------------------------------------------------------------------------------------------- +2023-04-06 02:16:47,511 epoch 22 - iter 372/3720 - loss 0.03606527 - time (sec): 62.89 - samples/sec: 4997.69 - lr: 0.100000 +2023-04-06 02:17:49,824 epoch 22 - iter 744/3720 - loss 0.03654979 - time (sec): 125.20 - samples/sec: 5013.71 - lr: 0.100000 +2023-04-06 02:18:53,656 epoch 22 - iter 1116/3720 - loss 0.03663016 - time (sec): 189.03 - samples/sec: 4987.13 - lr: 0.100000 +2023-04-06 02:19:57,426 epoch 22 - iter 1488/3720 - loss 0.03682940 - time (sec): 252.80 - samples/sec: 4978.60 - lr: 0.100000 +2023-04-06 02:21:00,182 epoch 22 - iter 1860/3720 - loss 0.03683460 - time (sec): 315.56 - samples/sec: 4992.24 - lr: 0.100000 +2023-04-06 02:22:04,607 epoch 22 - iter 2232/3720 - loss 0.03700043 - time (sec): 379.99 - samples/sec: 4981.35 - lr: 0.100000 +2023-04-06 02:23:08,231 epoch 22 - iter 2604/3720 - loss 0.03707551 - time (sec): 443.61 - samples/sec: 4973.72 - lr: 0.100000 +2023-04-06 02:24:11,920 epoch 22 - iter 2976/3720 - loss 0.03710649 - time (sec): 507.30 - samples/sec: 4968.95 - lr: 0.100000 +2023-04-06 02:25:15,697 epoch 22 - iter 3348/3720 - loss 0.03725444 - time (sec): 571.07 - samples/sec: 4965.36 - lr: 0.100000 +2023-04-06 02:26:19,110 epoch 22 - iter 3720/3720 - loss 0.03728125 - time (sec): 634.49 - samples/sec: 4967.33 - lr: 0.100000 +2023-04-06 02:26:19,110 ---------------------------------------------------------------------------------------------------- +2023-04-06 02:26:19,110 EPOCH 22 done: loss 0.0373 - lr 0.100000 +2023-04-06 02:26:19,110 BAD EPOCHS (no improvement): 0 +2023-04-06 02:26:19,113 ---------------------------------------------------------------------------------------------------- +2023-04-06 02:27:22,264 epoch 23 - iter 372/3720 - loss 0.03708948 - time (sec): 63.15 - samples/sec: 4991.98 - lr: 0.100000 +2023-04-06 02:28:24,744 epoch 23 - iter 744/3720 - loss 0.03701560 - time (sec): 125.63 - samples/sec: 5019.13 - lr: 0.100000 +2023-04-06 02:29:27,416 epoch 23 - iter 1116/3720 - loss 0.03711337 - time (sec): 188.30 - samples/sec: 5006.78 - lr: 0.100000 +2023-04-06 02:30:30,607 epoch 23 - iter 1488/3720 - loss 0.03713993 - time (sec): 251.49 - samples/sec: 4995.53 - lr: 0.100000 +2023-04-06 02:31:31,911 epoch 23 - iter 1860/3720 - loss 0.03718061 - time (sec): 312.80 - samples/sec: 5019.09 - lr: 0.100000 +2023-04-06 02:32:36,140 epoch 23 - iter 2232/3720 - loss 0.03707327 - time (sec): 377.03 - samples/sec: 5010.33 - lr: 0.100000 +2023-04-06 02:33:39,471 epoch 23 - iter 2604/3720 - loss 0.03709395 - time (sec): 440.36 - samples/sec: 5009.17 - lr: 0.100000 +2023-04-06 02:34:43,117 epoch 23 - iter 2976/3720 - loss 0.03709204 - time (sec): 504.00 - samples/sec: 5002.85 - lr: 0.100000 +2023-04-06 02:35:45,820 epoch 23 - iter 3348/3720 - loss 0.03713828 - time (sec): 566.71 - samples/sec: 5004.31 - lr: 0.100000 +2023-04-06 02:36:48,575 epoch 23 - iter 3720/3720 - loss 0.03713727 - time (sec): 629.46 - samples/sec: 5006.99 - lr: 0.100000 +2023-04-06 02:36:48,576 ---------------------------------------------------------------------------------------------------- +2023-04-06 02:36:48,576 EPOCH 23 done: loss 0.0371 - lr 0.100000 +2023-04-06 02:36:48,576 BAD EPOCHS (no improvement): 0 +2023-04-06 02:36:48,579 ---------------------------------------------------------------------------------------------------- +2023-04-06 02:37:51,265 epoch 24 - iter 372/3720 - loss 0.03669695 - time (sec): 62.69 - samples/sec: 5040.67 - lr: 0.100000 +2023-04-06 02:38:53,921 epoch 24 - iter 744/3720 - loss 0.03662117 - time (sec): 125.34 - samples/sec: 5035.38 - lr: 0.100000 +2023-04-06 02:39:57,107 epoch 24 - iter 1116/3720 - loss 0.03658693 - time (sec): 188.53 - samples/sec: 5012.98 - lr: 0.100000 +2023-04-06 02:40:59,524 epoch 24 - iter 1488/3720 - loss 0.03647600 - time (sec): 250.94 - samples/sec: 5008.04 - lr: 0.100000 +2023-04-06 02:42:02,608 epoch 24 - iter 1860/3720 - loss 0.03640431 - time (sec): 314.03 - samples/sec: 5009.09 - lr: 0.100000 +2023-04-06 02:43:05,716 epoch 24 - iter 2232/3720 - loss 0.03666376 - time (sec): 377.14 - samples/sec: 5004.81 - lr: 0.100000 +2023-04-06 02:44:09,570 epoch 24 - iter 2604/3720 - loss 0.03676543 - time (sec): 440.99 - samples/sec: 5000.25 - lr: 0.100000 +2023-04-06 02:45:13,636 epoch 24 - iter 2976/3720 - loss 0.03679277 - time (sec): 505.06 - samples/sec: 4994.02 - lr: 0.100000 +2023-04-06 02:46:16,146 epoch 24 - iter 3348/3720 - loss 0.03692790 - time (sec): 567.57 - samples/sec: 5000.04 - lr: 0.100000 +2023-04-06 02:47:18,346 epoch 24 - iter 3720/3720 - loss 0.03693011 - time (sec): 629.77 - samples/sec: 5004.57 - lr: 0.100000 +2023-04-06 02:47:18,346 ---------------------------------------------------------------------------------------------------- +2023-04-06 02:47:18,346 EPOCH 24 done: loss 0.0369 - lr 0.100000 +2023-04-06 02:47:18,346 BAD EPOCHS (no improvement): 0 +2023-04-06 02:47:18,350 ---------------------------------------------------------------------------------------------------- +2023-04-06 02:48:22,056 epoch 25 - iter 372/3720 - loss 0.03576623 - time (sec): 63.71 - samples/sec: 4970.15 - lr: 0.100000 +2023-04-06 02:49:26,057 epoch 25 - iter 744/3720 - loss 0.03617317 - time (sec): 127.71 - samples/sec: 4948.50 - lr: 0.100000 +2023-04-06 02:50:28,898 epoch 25 - iter 1116/3720 - loss 0.03635723 - time (sec): 190.55 - samples/sec: 4975.37 - lr: 0.100000 +2023-04-06 02:51:32,665 epoch 25 - iter 1488/3720 - loss 0.03677751 - time (sec): 254.32 - samples/sec: 4972.70 - lr: 0.100000 +2023-04-06 02:52:35,999 epoch 25 - iter 1860/3720 - loss 0.03665019 - time (sec): 317.65 - samples/sec: 4971.71 - lr: 0.100000 +2023-04-06 02:53:38,392 epoch 25 - iter 2232/3720 - loss 0.03671172 - time (sec): 380.04 - samples/sec: 4980.30 - lr: 0.100000 +2023-04-06 02:54:41,734 epoch 25 - iter 2604/3720 - loss 0.03675279 - time (sec): 443.38 - samples/sec: 4982.06 - lr: 0.100000 +2023-04-06 02:55:45,716 epoch 25 - iter 2976/3720 - loss 0.03678682 - time (sec): 507.37 - samples/sec: 4976.74 - lr: 0.100000 +2023-04-06 02:56:48,279 epoch 25 - iter 3348/3720 - loss 0.03686545 - time (sec): 569.93 - samples/sec: 4980.01 - lr: 0.100000 +2023-04-06 02:57:50,665 epoch 25 - iter 3720/3720 - loss 0.03688441 - time (sec): 632.31 - samples/sec: 4984.40 - lr: 0.100000 +2023-04-06 02:57:50,665 ---------------------------------------------------------------------------------------------------- +2023-04-06 02:57:50,666 EPOCH 25 done: loss 0.0369 - lr 0.100000 +2023-04-06 02:57:50,666 BAD EPOCHS (no improvement): 0 +2023-04-06 02:57:50,669 ---------------------------------------------------------------------------------------------------- +2023-04-06 02:58:52,529 epoch 26 - iter 372/3720 - loss 0.03575018 - time (sec): 61.86 - samples/sec: 5080.71 - lr: 0.100000 +2023-04-06 02:59:54,967 epoch 26 - iter 744/3720 - loss 0.03589772 - time (sec): 124.30 - samples/sec: 5054.73 - lr: 0.100000 +2023-04-06 03:00:57,363 epoch 26 - iter 1116/3720 - loss 0.03617339 - time (sec): 186.69 - samples/sec: 5062.93 - lr: 0.100000 +2023-04-06 03:02:00,007 epoch 26 - iter 1488/3720 - loss 0.03617761 - time (sec): 249.34 - samples/sec: 5061.16 - lr: 0.100000 +2023-04-06 03:03:03,023 epoch 26 - iter 1860/3720 - loss 0.03626125 - time (sec): 312.35 - samples/sec: 5041.33 - lr: 0.100000 +2023-04-06 03:04:06,741 epoch 26 - iter 2232/3720 - loss 0.03657375 - time (sec): 376.07 - samples/sec: 5021.13 - lr: 0.100000 +2023-04-06 03:05:09,733 epoch 26 - iter 2604/3720 - loss 0.03664309 - time (sec): 439.06 - samples/sec: 5016.93 - lr: 0.100000 +2023-04-06 03:06:12,591 epoch 26 - iter 2976/3720 - loss 0.03668327 - time (sec): 501.92 - samples/sec: 5022.02 - lr: 0.100000 +2023-04-06 03:07:14,762 epoch 26 - iter 3348/3720 - loss 0.03666879 - time (sec): 564.09 - samples/sec: 5025.53 - lr: 0.100000 +2023-04-06 03:08:19,046 epoch 26 - iter 3720/3720 - loss 0.03682200 - time (sec): 628.38 - samples/sec: 5015.64 - lr: 0.100000 +2023-04-06 03:08:19,046 ---------------------------------------------------------------------------------------------------- +2023-04-06 03:08:19,046 EPOCH 26 done: loss 0.0368 - lr 0.100000 +2023-04-06 03:08:19,046 BAD EPOCHS (no improvement): 0 +2023-04-06 03:08:19,049 ---------------------------------------------------------------------------------------------------- +2023-04-06 03:09:22,636 epoch 27 - iter 372/3720 - loss 0.03591577 - time (sec): 63.59 - samples/sec: 4994.14 - lr: 0.100000 +2023-04-06 03:10:25,528 epoch 27 - iter 744/3720 - loss 0.03638401 - time (sec): 126.48 - samples/sec: 5006.03 - lr: 0.100000 +2023-04-06 03:11:27,613 epoch 27 - iter 1116/3720 - loss 0.03619447 - time (sec): 188.56 - samples/sec: 5019.48 - lr: 0.100000 +2023-04-06 03:12:30,143 epoch 27 - iter 1488/3720 - loss 0.03647944 - time (sec): 251.09 - samples/sec: 5027.02 - lr: 0.100000 +2023-04-06 03:13:32,505 epoch 27 - iter 1860/3720 - loss 0.03656158 - time (sec): 313.46 - samples/sec: 5030.90 - lr: 0.100000 +2023-04-06 03:14:36,285 epoch 27 - iter 2232/3720 - loss 0.03654736 - time (sec): 377.24 - samples/sec: 5014.81 - lr: 0.100000 +2023-04-06 03:15:39,734 epoch 27 - iter 2604/3720 - loss 0.03661380 - time (sec): 440.68 - samples/sec: 5008.20 - lr: 0.100000 +2023-04-06 03:16:44,611 epoch 27 - iter 2976/3720 - loss 0.03667561 - time (sec): 505.56 - samples/sec: 4991.99 - lr: 0.100000 +2023-04-06 03:17:47,683 epoch 27 - iter 3348/3720 - loss 0.03672948 - time (sec): 568.63 - samples/sec: 4992.51 - lr: 0.100000 +2023-04-06 03:18:49,995 epoch 27 - iter 3720/3720 - loss 0.03675441 - time (sec): 630.95 - samples/sec: 4995.22 - lr: 0.100000 +2023-04-06 03:18:49,995 ---------------------------------------------------------------------------------------------------- +2023-04-06 03:18:49,995 EPOCH 27 done: loss 0.0368 - lr 0.100000 +2023-04-06 03:18:49,995 BAD EPOCHS (no improvement): 0 +2023-04-06 03:18:49,998 ---------------------------------------------------------------------------------------------------- +2023-04-06 03:19:53,813 epoch 28 - iter 372/3720 - loss 0.03629755 - time (sec): 63.82 - samples/sec: 4956.29 - lr: 0.100000 +2023-04-06 03:20:56,823 epoch 28 - iter 744/3720 - loss 0.03569959 - time (sec): 126.82 - samples/sec: 4979.95 - lr: 0.100000 +2023-04-06 03:21:59,289 epoch 28 - iter 1116/3720 - loss 0.03576099 - time (sec): 189.29 - samples/sec: 4991.02 - lr: 0.100000 +2023-04-06 03:23:02,352 epoch 28 - iter 1488/3720 - loss 0.03573978 - time (sec): 252.35 - samples/sec: 4987.32 - lr: 0.100000 +2023-04-06 03:24:06,746 epoch 28 - iter 1860/3720 - loss 0.03585206 - time (sec): 316.75 - samples/sec: 4969.49 - lr: 0.100000 +2023-04-06 03:25:09,793 epoch 28 - iter 2232/3720 - loss 0.03610828 - time (sec): 379.79 - samples/sec: 4975.70 - lr: 0.100000 +2023-04-06 03:26:12,683 epoch 28 - iter 2604/3720 - loss 0.03606630 - time (sec): 442.69 - samples/sec: 4979.70 - lr: 0.100000 +2023-04-06 03:27:15,150 epoch 28 - iter 2976/3720 - loss 0.03629244 - time (sec): 505.15 - samples/sec: 4987.77 - lr: 0.100000 +2023-04-06 03:28:17,959 epoch 28 - iter 3348/3720 - loss 0.03635761 - time (sec): 567.96 - samples/sec: 4990.24 - lr: 0.100000 +2023-04-06 03:29:22,429 epoch 28 - iter 3720/3720 - loss 0.03647368 - time (sec): 632.43 - samples/sec: 4983.49 - lr: 0.100000 +2023-04-06 03:29:22,429 ---------------------------------------------------------------------------------------------------- +2023-04-06 03:29:22,429 EPOCH 28 done: loss 0.0365 - lr 0.100000 +2023-04-06 03:29:22,429 BAD EPOCHS (no improvement): 0 +2023-04-06 03:29:22,432 ---------------------------------------------------------------------------------------------------- +2023-04-06 03:30:26,512 epoch 29 - iter 372/3720 - loss 0.03580840 - time (sec): 64.08 - samples/sec: 4913.90 - lr: 0.100000 +2023-04-06 03:31:29,880 epoch 29 - iter 744/3720 - loss 0.03558584 - time (sec): 127.45 - samples/sec: 4946.21 - lr: 0.100000 +2023-04-06 03:32:33,002 epoch 29 - iter 1116/3720 - loss 0.03595706 - time (sec): 190.57 - samples/sec: 4968.49 - lr: 0.100000 +2023-04-06 03:33:35,317 epoch 29 - iter 1488/3720 - loss 0.03607640 - time (sec): 252.89 - samples/sec: 4996.88 - lr: 0.100000 +2023-04-06 03:34:37,513 epoch 29 - iter 1860/3720 - loss 0.03631701 - time (sec): 315.08 - samples/sec: 5010.68 - lr: 0.100000 +2023-04-06 03:35:40,490 epoch 29 - iter 2232/3720 - loss 0.03634836 - time (sec): 378.06 - samples/sec: 5019.47 - lr: 0.100000 +2023-04-06 03:36:42,442 epoch 29 - iter 2604/3720 - loss 0.03643398 - time (sec): 440.01 - samples/sec: 5023.07 - lr: 0.100000 +2023-04-06 03:37:44,939 epoch 29 - iter 2976/3720 - loss 0.03647132 - time (sec): 502.51 - samples/sec: 5025.27 - lr: 0.100000 +2023-04-06 03:38:48,775 epoch 29 - iter 3348/3720 - loss 0.03648527 - time (sec): 566.34 - samples/sec: 5013.01 - lr: 0.100000 +2023-04-06 03:39:51,756 epoch 29 - iter 3720/3720 - loss 0.03656561 - time (sec): 629.32 - samples/sec: 5008.09 - lr: 0.100000 +2023-04-06 03:39:51,757 ---------------------------------------------------------------------------------------------------- +2023-04-06 03:39:51,757 EPOCH 29 done: loss 0.0366 - lr 0.100000 +2023-04-06 03:39:51,757 BAD EPOCHS (no improvement): 1 +2023-04-06 03:39:51,759 ---------------------------------------------------------------------------------------------------- +2023-04-06 03:40:54,782 epoch 30 - iter 372/3720 - loss 0.03622456 - time (sec): 63.02 - samples/sec: 5011.96 - lr: 0.100000 +2023-04-06 03:41:58,477 epoch 30 - iter 744/3720 - loss 0.03596512 - time (sec): 126.72 - samples/sec: 4993.34 - lr: 0.100000 +2023-04-06 03:43:00,990 epoch 30 - iter 1116/3720 - loss 0.03581400 - time (sec): 189.23 - samples/sec: 4991.87 - lr: 0.100000 +2023-04-06 03:44:03,955 epoch 30 - iter 1488/3720 - loss 0.03595400 - time (sec): 252.20 - samples/sec: 4997.03 - lr: 0.100000 +2023-04-06 03:45:05,948 epoch 30 - iter 1860/3720 - loss 0.03586498 - time (sec): 314.19 - samples/sec: 5012.81 - lr: 0.100000 +2023-04-06 03:46:08,866 epoch 30 - iter 2232/3720 - loss 0.03587263 - time (sec): 377.11 - samples/sec: 5013.25 - lr: 0.100000 +2023-04-06 03:47:12,458 epoch 30 - iter 2604/3720 - loss 0.03601574 - time (sec): 440.70 - samples/sec: 5004.52 - lr: 0.100000 +2023-04-06 03:48:15,915 epoch 30 - iter 2976/3720 - loss 0.03621407 - time (sec): 504.16 - samples/sec: 5002.41 - lr: 0.100000 +2023-04-06 03:49:19,611 epoch 30 - iter 3348/3720 - loss 0.03629892 - time (sec): 567.85 - samples/sec: 4995.75 - lr: 0.100000 +2023-04-06 03:50:23,857 epoch 30 - iter 3720/3720 - loss 0.03638563 - time (sec): 632.10 - samples/sec: 4986.12 - lr: 0.100000 +2023-04-06 03:50:23,857 ---------------------------------------------------------------------------------------------------- +2023-04-06 03:50:23,857 EPOCH 30 done: loss 0.0364 - lr 0.100000 +2023-04-06 03:50:23,857 BAD EPOCHS (no improvement): 0 +2023-04-06 03:50:23,861 ---------------------------------------------------------------------------------------------------- +2023-04-06 03:51:27,597 epoch 31 - iter 372/3720 - loss 0.03589866 - time (sec): 63.74 - samples/sec: 4935.55 - lr: 0.100000 +2023-04-06 03:52:30,594 epoch 31 - iter 744/3720 - loss 0.03591985 - time (sec): 126.73 - samples/sec: 4980.31 - lr: 0.100000 +2023-04-06 03:53:34,478 epoch 31 - iter 1116/3720 - loss 0.03608791 - time (sec): 190.62 - samples/sec: 4969.68 - lr: 0.100000 +2023-04-06 03:54:37,550 epoch 31 - iter 1488/3720 - loss 0.03605652 - time (sec): 253.69 - samples/sec: 4976.81 - lr: 0.100000 +2023-04-06 03:55:40,506 epoch 31 - iter 1860/3720 - loss 0.03627127 - time (sec): 316.65 - samples/sec: 4975.40 - lr: 0.100000 +2023-04-06 03:56:45,133 epoch 31 - iter 2232/3720 - loss 0.03623942 - time (sec): 381.27 - samples/sec: 4961.76 - lr: 0.100000 +2023-04-06 03:57:48,120 epoch 31 - iter 2604/3720 - loss 0.03643650 - time (sec): 444.26 - samples/sec: 4962.42 - lr: 0.100000 +2023-04-06 03:58:51,606 epoch 31 - iter 2976/3720 - loss 0.03644714 - time (sec): 507.74 - samples/sec: 4962.08 - lr: 0.100000 +2023-04-06 03:59:55,671 epoch 31 - iter 3348/3720 - loss 0.03651080 - time (sec): 571.81 - samples/sec: 4959.66 - lr: 0.100000 +2023-04-06 04:00:59,712 epoch 31 - iter 3720/3720 - loss 0.03653519 - time (sec): 635.85 - samples/sec: 4956.68 - lr: 0.100000 +2023-04-06 04:00:59,713 ---------------------------------------------------------------------------------------------------- +2023-04-06 04:00:59,713 EPOCH 31 done: loss 0.0365 - lr 0.100000 +2023-04-06 04:00:59,713 BAD EPOCHS (no improvement): 1 +2023-04-06 04:00:59,716 ---------------------------------------------------------------------------------------------------- +2023-04-06 04:02:03,637 epoch 32 - iter 372/3720 - loss 0.03422510 - time (sec): 63.92 - samples/sec: 4951.84 - lr: 0.100000 +2023-04-06 04:03:05,658 epoch 32 - iter 744/3720 - loss 0.03547466 - time (sec): 125.94 - samples/sec: 5019.51 - lr: 0.100000 +2023-04-06 04:04:08,997 epoch 32 - iter 1116/3720 - loss 0.03580223 - time (sec): 189.28 - samples/sec: 4997.24 - lr: 0.100000 +2023-04-06 04:05:13,508 epoch 32 - iter 1488/3720 - loss 0.03599954 - time (sec): 253.79 - samples/sec: 4977.40 - lr: 0.100000 +2023-04-06 04:06:16,227 epoch 32 - iter 1860/3720 - loss 0.03621192 - time (sec): 316.51 - samples/sec: 4983.23 - lr: 0.100000 +2023-04-06 04:07:18,991 epoch 32 - iter 2232/3720 - loss 0.03622746 - time (sec): 379.28 - samples/sec: 4987.48 - lr: 0.100000 +2023-04-06 04:08:22,113 epoch 32 - iter 2604/3720 - loss 0.03620039 - time (sec): 442.40 - samples/sec: 4988.51 - lr: 0.100000 +2023-04-06 04:09:25,150 epoch 32 - iter 2976/3720 - loss 0.03629937 - time (sec): 505.43 - samples/sec: 4990.05 - lr: 0.100000 +2023-04-06 04:10:28,052 epoch 32 - iter 3348/3720 - loss 0.03632866 - time (sec): 568.34 - samples/sec: 4988.58 - lr: 0.100000 +2023-04-06 04:11:32,068 epoch 32 - iter 3720/3720 - loss 0.03640496 - time (sec): 632.35 - samples/sec: 4984.11 - lr: 0.100000 +2023-04-06 04:11:32,068 ---------------------------------------------------------------------------------------------------- +2023-04-06 04:11:32,069 EPOCH 32 done: loss 0.0364 - lr 0.100000 +2023-04-06 04:11:32,069 BAD EPOCHS (no improvement): 2 +2023-04-06 04:11:32,072 ---------------------------------------------------------------------------------------------------- +2023-04-06 04:12:34,566 epoch 33 - iter 372/3720 - loss 0.03615619 - time (sec): 62.49 - samples/sec: 5045.81 - lr: 0.100000 +2023-04-06 04:13:39,034 epoch 33 - iter 744/3720 - loss 0.03617709 - time (sec): 126.96 - samples/sec: 4972.09 - lr: 0.100000 +2023-04-06 04:14:42,381 epoch 33 - iter 1116/3720 - loss 0.03629354 - time (sec): 190.31 - samples/sec: 4975.96 - lr: 0.100000 +2023-04-06 04:15:45,322 epoch 33 - iter 1488/3720 - loss 0.03613818 - time (sec): 253.25 - samples/sec: 4977.67 - lr: 0.100000 +2023-04-06 04:16:47,594 epoch 33 - iter 1860/3720 - loss 0.03617935 - time (sec): 315.52 - samples/sec: 4996.51 - lr: 0.100000 +2023-04-06 04:17:51,516 epoch 33 - iter 2232/3720 - loss 0.03633921 - time (sec): 379.44 - samples/sec: 4979.41 - lr: 0.100000 +2023-04-06 04:18:55,881 epoch 33 - iter 2604/3720 - loss 0.03629361 - time (sec): 443.81 - samples/sec: 4968.91 - lr: 0.100000 +2023-04-06 04:19:59,049 epoch 33 - iter 2976/3720 - loss 0.03635164 - time (sec): 506.98 - samples/sec: 4971.74 - lr: 0.100000 +2023-04-06 04:21:03,289 epoch 33 - iter 3348/3720 - loss 0.03624671 - time (sec): 571.22 - samples/sec: 4965.33 - lr: 0.100000 +2023-04-06 04:22:06,801 epoch 33 - iter 3720/3720 - loss 0.03622238 - time (sec): 634.73 - samples/sec: 4965.45 - lr: 0.100000 +2023-04-06 04:22:06,801 ---------------------------------------------------------------------------------------------------- +2023-04-06 04:22:06,802 EPOCH 33 done: loss 0.0362 - lr 0.100000 +2023-04-06 04:22:06,802 BAD EPOCHS (no improvement): 0 +2023-04-06 04:22:06,805 ---------------------------------------------------------------------------------------------------- +2023-04-06 04:23:10,915 epoch 34 - iter 372/3720 - loss 0.03661503 - time (sec): 64.11 - samples/sec: 4942.61 - lr: 0.100000 +2023-04-06 04:24:13,440 epoch 34 - iter 744/3720 - loss 0.03657963 - time (sec): 126.64 - samples/sec: 4990.14 - lr: 0.100000 +2023-04-06 04:25:16,466 epoch 34 - iter 1116/3720 - loss 0.03647274 - time (sec): 189.66 - samples/sec: 4981.26 - lr: 0.100000 +2023-04-06 04:26:17,810 epoch 34 - iter 1488/3720 - loss 0.03660441 - time (sec): 251.01 - samples/sec: 5009.35 - lr: 0.100000 +2023-04-06 04:27:21,461 epoch 34 - iter 1860/3720 - loss 0.03655032 - time (sec): 314.66 - samples/sec: 5000.17 - lr: 0.100000 +2023-04-06 04:28:25,783 epoch 34 - iter 2232/3720 - loss 0.03654797 - time (sec): 378.98 - samples/sec: 4988.08 - lr: 0.100000 +2023-04-06 04:29:30,360 epoch 34 - iter 2604/3720 - loss 0.03664691 - time (sec): 443.55 - samples/sec: 4975.96 - lr: 0.100000 +2023-04-06 04:30:33,471 epoch 34 - iter 2976/3720 - loss 0.03655137 - time (sec): 506.67 - samples/sec: 4977.32 - lr: 0.100000 +2023-04-06 04:31:35,798 epoch 34 - iter 3348/3720 - loss 0.03650225 - time (sec): 568.99 - samples/sec: 4981.06 - lr: 0.100000 +2023-04-06 04:32:38,474 epoch 34 - iter 3720/3720 - loss 0.03654818 - time (sec): 631.67 - samples/sec: 4989.50 - lr: 0.100000 +2023-04-06 04:32:38,474 ---------------------------------------------------------------------------------------------------- +2023-04-06 04:32:38,474 EPOCH 34 done: loss 0.0365 - lr 0.100000 +2023-04-06 04:32:38,474 BAD EPOCHS (no improvement): 1 +2023-04-06 04:32:38,477 ---------------------------------------------------------------------------------------------------- +2023-04-06 04:33:40,730 epoch 35 - iter 372/3720 - loss 0.03554340 - time (sec): 62.25 - samples/sec: 5068.43 - lr: 0.100000 +2023-04-06 04:34:44,385 epoch 35 - iter 744/3720 - loss 0.03577875 - time (sec): 125.91 - samples/sec: 5018.61 - lr: 0.100000 +2023-04-06 04:35:47,589 epoch 35 - iter 1116/3720 - loss 0.03598251 - time (sec): 189.11 - samples/sec: 5003.48 - lr: 0.100000 +2023-04-06 04:36:51,082 epoch 35 - iter 1488/3720 - loss 0.03586585 - time (sec): 252.60 - samples/sec: 4989.90 - lr: 0.100000 +2023-04-06 04:37:53,233 epoch 35 - iter 1860/3720 - loss 0.03602181 - time (sec): 314.76 - samples/sec: 5006.38 - lr: 0.100000 +2023-04-06 04:38:56,781 epoch 35 - iter 2232/3720 - loss 0.03594249 - time (sec): 378.30 - samples/sec: 4997.93 - lr: 0.100000 +2023-04-06 04:40:01,588 epoch 35 - iter 2604/3720 - loss 0.03596076 - time (sec): 443.11 - samples/sec: 4982.08 - lr: 0.100000 +2023-04-06 04:41:05,095 epoch 35 - iter 2976/3720 - loss 0.03609682 - time (sec): 506.62 - samples/sec: 4975.33 - lr: 0.100000 +2023-04-06 04:42:08,145 epoch 35 - iter 3348/3720 - loss 0.03609989 - time (sec): 569.67 - samples/sec: 4978.05 - lr: 0.100000 +2023-04-06 04:43:10,774 epoch 35 - iter 3720/3720 - loss 0.03625924 - time (sec): 632.30 - samples/sec: 4984.55 - lr: 0.100000 +2023-04-06 04:43:10,775 ---------------------------------------------------------------------------------------------------- +2023-04-06 04:43:10,775 EPOCH 35 done: loss 0.0363 - lr 0.100000 +2023-04-06 04:43:10,775 BAD EPOCHS (no improvement): 2 +2023-04-06 04:43:10,777 ---------------------------------------------------------------------------------------------------- +2023-04-06 04:44:13,548 epoch 36 - iter 372/3720 - loss 0.03547997 - time (sec): 62.77 - samples/sec: 5023.36 - lr: 0.100000 +2023-04-06 04:45:17,165 epoch 36 - iter 744/3720 - loss 0.03556230 - time (sec): 126.39 - samples/sec: 4987.40 - lr: 0.100000 +2023-04-06 04:46:19,825 epoch 36 - iter 1116/3720 - loss 0.03557631 - time (sec): 189.05 - samples/sec: 5008.21 - lr: 0.100000 +2023-04-06 04:47:21,810 epoch 36 - iter 1488/3720 - loss 0.03593285 - time (sec): 251.03 - samples/sec: 5024.33 - lr: 0.100000 +2023-04-06 04:48:24,759 epoch 36 - iter 1860/3720 - loss 0.03604706 - time (sec): 313.98 - samples/sec: 5021.56 - lr: 0.100000 +2023-04-06 04:49:28,723 epoch 36 - iter 2232/3720 - loss 0.03585887 - time (sec): 377.95 - samples/sec: 5012.08 - lr: 0.100000 +2023-04-06 04:50:31,251 epoch 36 - iter 2604/3720 - loss 0.03595801 - time (sec): 440.47 - samples/sec: 5015.64 - lr: 0.100000 +2023-04-06 04:51:33,011 epoch 36 - iter 2976/3720 - loss 0.03602714 - time (sec): 502.23 - samples/sec: 5023.84 - lr: 0.100000 +2023-04-06 04:52:36,148 epoch 36 - iter 3348/3720 - loss 0.03612962 - time (sec): 565.37 - samples/sec: 5022.99 - lr: 0.100000 +2023-04-06 04:53:39,499 epoch 36 - iter 3720/3720 - loss 0.03613866 - time (sec): 628.72 - samples/sec: 5012.89 - lr: 0.100000 +2023-04-06 04:53:39,499 ---------------------------------------------------------------------------------------------------- +2023-04-06 04:53:39,499 EPOCH 36 done: loss 0.0361 - lr 0.100000 +2023-04-06 04:53:39,499 BAD EPOCHS (no improvement): 0 +2023-04-06 04:53:39,506 ---------------------------------------------------------------------------------------------------- +2023-04-06 04:54:43,630 epoch 37 - iter 372/3720 - loss 0.03588182 - time (sec): 64.12 - samples/sec: 4935.21 - lr: 0.100000 +2023-04-06 04:55:46,708 epoch 37 - iter 744/3720 - loss 0.03648884 - time (sec): 127.20 - samples/sec: 4972.26 - lr: 0.100000 +2023-04-06 04:56:49,734 epoch 37 - iter 1116/3720 - loss 0.03638007 - time (sec): 190.23 - samples/sec: 4976.04 - lr: 0.100000 +2023-04-06 04:57:53,201 epoch 37 - iter 1488/3720 - loss 0.03629532 - time (sec): 253.69 - samples/sec: 4976.37 - lr: 0.100000 +2023-04-06 04:58:56,851 epoch 37 - iter 1860/3720 - loss 0.03628672 - time (sec): 317.34 - samples/sec: 4974.04 - lr: 0.100000 +2023-04-06 05:00:00,942 epoch 37 - iter 2232/3720 - loss 0.03624483 - time (sec): 381.44 - samples/sec: 4967.68 - lr: 0.100000 +2023-04-06 05:01:02,835 epoch 37 - iter 2604/3720 - loss 0.03630287 - time (sec): 443.33 - samples/sec: 4979.32 - lr: 0.100000 +2023-04-06 05:02:05,858 epoch 37 - iter 2976/3720 - loss 0.03618145 - time (sec): 506.35 - samples/sec: 4982.41 - lr: 0.100000 +2023-04-06 05:03:08,739 epoch 37 - iter 3348/3720 - loss 0.03627277 - time (sec): 569.23 - samples/sec: 4983.45 - lr: 0.100000 +2023-04-06 05:04:12,014 epoch 37 - iter 3720/3720 - loss 0.03621617 - time (sec): 632.51 - samples/sec: 4982.88 - lr: 0.100000 +2023-04-06 05:04:12,015 ---------------------------------------------------------------------------------------------------- +2023-04-06 05:04:12,015 EPOCH 37 done: loss 0.0362 - lr 0.100000 +2023-04-06 05:04:12,015 BAD EPOCHS (no improvement): 1 +2023-04-06 05:04:12,022 ---------------------------------------------------------------------------------------------------- +2023-04-06 05:05:15,649 epoch 38 - iter 372/3720 - loss 0.03581758 - time (sec): 63.63 - samples/sec: 4951.67 - lr: 0.100000 +2023-04-06 05:06:18,889 epoch 38 - iter 744/3720 - loss 0.03530465 - time (sec): 126.87 - samples/sec: 4966.09 - lr: 0.100000 +2023-04-06 05:07:22,777 epoch 38 - iter 1116/3720 - loss 0.03588757 - time (sec): 190.75 - samples/sec: 4956.01 - lr: 0.100000 +2023-04-06 05:08:25,250 epoch 38 - iter 1488/3720 - loss 0.03595468 - time (sec): 253.23 - samples/sec: 4976.78 - lr: 0.100000 +2023-04-06 05:09:30,429 epoch 38 - iter 1860/3720 - loss 0.03604632 - time (sec): 318.41 - samples/sec: 4957.88 - lr: 0.100000 +2023-04-06 05:10:33,993 epoch 38 - iter 2232/3720 - loss 0.03612242 - time (sec): 381.97 - samples/sec: 4957.49 - lr: 0.100000 +2023-04-06 05:11:36,193 epoch 38 - iter 2604/3720 - loss 0.03620231 - time (sec): 444.17 - samples/sec: 4971.41 - lr: 0.100000 +2023-04-06 05:12:38,101 epoch 38 - iter 2976/3720 - loss 0.03629202 - time (sec): 506.08 - samples/sec: 4986.44 - lr: 0.100000 +2023-04-06 05:13:40,885 epoch 38 - iter 3348/3720 - loss 0.03627942 - time (sec): 568.86 - samples/sec: 4990.85 - lr: 0.100000 +2023-04-06 05:14:42,225 epoch 38 - iter 3720/3720 - loss 0.03628093 - time (sec): 630.20 - samples/sec: 5001.11 - lr: 0.100000 +2023-04-06 05:14:42,225 ---------------------------------------------------------------------------------------------------- +2023-04-06 05:14:42,225 EPOCH 38 done: loss 0.0363 - lr 0.100000 +2023-04-06 05:14:42,225 BAD EPOCHS (no improvement): 2 +2023-04-06 05:14:42,232 ---------------------------------------------------------------------------------------------------- +2023-04-06 05:15:45,821 epoch 39 - iter 372/3720 - loss 0.03618891 - time (sec): 63.59 - samples/sec: 4972.35 - lr: 0.100000 +2023-04-06 05:16:48,199 epoch 39 - iter 744/3720 - loss 0.03589596 - time (sec): 125.97 - samples/sec: 5003.42 - lr: 0.100000 +2023-04-06 05:17:52,287 epoch 39 - iter 1116/3720 - loss 0.03577781 - time (sec): 190.06 - samples/sec: 4987.77 - lr: 0.100000 +2023-04-06 05:18:56,385 epoch 39 - iter 1488/3720 - loss 0.03605000 - time (sec): 254.15 - samples/sec: 4963.34 - lr: 0.100000 +2023-04-06 05:19:59,898 epoch 39 - iter 1860/3720 - loss 0.03619938 - time (sec): 317.67 - samples/sec: 4963.72 - lr: 0.100000 +2023-04-06 05:21:02,956 epoch 39 - iter 2232/3720 - loss 0.03616054 - time (sec): 380.72 - samples/sec: 4972.71 - lr: 0.100000 +2023-04-06 05:22:05,380 epoch 39 - iter 2604/3720 - loss 0.03631325 - time (sec): 443.15 - samples/sec: 4981.75 - lr: 0.100000 +2023-04-06 05:23:09,479 epoch 39 - iter 2976/3720 - loss 0.03629390 - time (sec): 507.25 - samples/sec: 4974.63 - lr: 0.100000 +2023-04-06 05:24:13,514 epoch 39 - iter 3348/3720 - loss 0.03627535 - time (sec): 571.28 - samples/sec: 4971.41 - lr: 0.100000 +2023-04-06 05:25:15,345 epoch 39 - iter 3720/3720 - loss 0.03633764 - time (sec): 633.11 - samples/sec: 4978.12 - lr: 0.100000 +2023-04-06 05:25:15,345 ---------------------------------------------------------------------------------------------------- +2023-04-06 05:25:15,345 EPOCH 39 done: loss 0.0363 - lr 0.100000 +2023-04-06 05:25:15,345 BAD EPOCHS (no improvement): 3 +2023-04-06 05:25:15,352 ---------------------------------------------------------------------------------------------------- +2023-04-06 05:26:18,619 epoch 40 - iter 372/3720 - loss 0.03507705 - time (sec): 63.27 - samples/sec: 4954.03 - lr: 0.100000 +2023-04-06 05:27:22,411 epoch 40 - iter 744/3720 - loss 0.03569404 - time (sec): 127.06 - samples/sec: 4954.66 - lr: 0.100000 +2023-04-06 05:28:25,575 epoch 40 - iter 1116/3720 - loss 0.03568844 - time (sec): 190.22 - samples/sec: 4965.57 - lr: 0.100000 +2023-04-06 05:29:28,086 epoch 40 - iter 1488/3720 - loss 0.03588809 - time (sec): 252.73 - samples/sec: 4973.71 - lr: 0.100000 +2023-04-06 05:30:31,282 epoch 40 - iter 1860/3720 - loss 0.03564235 - time (sec): 315.93 - samples/sec: 4980.29 - lr: 0.100000 +2023-04-06 05:31:33,392 epoch 40 - iter 2232/3720 - loss 0.03576474 - time (sec): 378.04 - samples/sec: 4997.67 - lr: 0.100000 +2023-04-06 05:32:35,991 epoch 40 - iter 2604/3720 - loss 0.03580354 - time (sec): 440.64 - samples/sec: 5006.35 - lr: 0.100000 +2023-04-06 05:33:37,763 epoch 40 - iter 2976/3720 - loss 0.03594209 - time (sec): 502.41 - samples/sec: 5014.35 - lr: 0.100000 +2023-04-06 05:34:40,953 epoch 40 - iter 3348/3720 - loss 0.03600140 - time (sec): 565.60 - samples/sec: 5014.46 - lr: 0.100000 +2023-04-06 05:35:45,443 epoch 40 - iter 3720/3720 - loss 0.03603039 - time (sec): 630.09 - samples/sec: 5002.00 - lr: 0.100000 +2023-04-06 05:35:45,443 ---------------------------------------------------------------------------------------------------- +2023-04-06 05:35:45,443 EPOCH 40 done: loss 0.0360 - lr 0.100000 +2023-04-06 05:35:45,443 BAD EPOCHS (no improvement): 0 +2023-04-06 05:35:45,450 ---------------------------------------------------------------------------------------------------- +2023-04-06 05:36:47,700 epoch 41 - iter 372/3720 - loss 0.03518475 - time (sec): 62.25 - samples/sec: 5053.76 - lr: 0.100000 +2023-04-06 05:37:51,556 epoch 41 - iter 744/3720 - loss 0.03588227 - time (sec): 126.11 - samples/sec: 4992.75 - lr: 0.100000 +2023-04-06 05:38:55,132 epoch 41 - iter 1116/3720 - loss 0.03591225 - time (sec): 189.68 - samples/sec: 4978.53 - lr: 0.100000 +2023-04-06 05:39:57,749 epoch 41 - iter 1488/3720 - loss 0.03580877 - time (sec): 252.30 - samples/sec: 4992.88 - lr: 0.100000 +2023-04-06 05:41:01,212 epoch 41 - iter 1860/3720 - loss 0.03578007 - time (sec): 315.76 - samples/sec: 4998.42 - lr: 0.100000 +2023-04-06 05:42:03,400 epoch 41 - iter 2232/3720 - loss 0.03604466 - time (sec): 377.95 - samples/sec: 5002.20 - lr: 0.100000 +2023-04-06 05:43:07,825 epoch 41 - iter 2604/3720 - loss 0.03592712 - time (sec): 442.38 - samples/sec: 4987.97 - lr: 0.100000 +2023-04-06 05:44:10,741 epoch 41 - iter 2976/3720 - loss 0.03602655 - time (sec): 505.29 - samples/sec: 4987.93 - lr: 0.100000 +2023-04-06 05:45:14,930 epoch 41 - iter 3348/3720 - loss 0.03605697 - time (sec): 569.48 - samples/sec: 4982.72 - lr: 0.100000 +2023-04-06 05:46:18,175 epoch 41 - iter 3720/3720 - loss 0.03612727 - time (sec): 632.73 - samples/sec: 4981.17 - lr: 0.100000 +2023-04-06 05:46:18,175 ---------------------------------------------------------------------------------------------------- +2023-04-06 05:46:18,176 EPOCH 41 done: loss 0.0361 - lr 0.100000 +2023-04-06 05:46:18,176 BAD EPOCHS (no improvement): 1 +2023-04-06 05:46:18,179 ---------------------------------------------------------------------------------------------------- +2023-04-06 05:47:21,888 epoch 42 - iter 372/3720 - loss 0.03501414 - time (sec): 63.71 - samples/sec: 4942.95 - lr: 0.100000 +2023-04-06 05:48:25,521 epoch 42 - iter 744/3720 - loss 0.03538114 - time (sec): 127.34 - samples/sec: 4951.75 - lr: 0.100000 +2023-04-06 05:49:28,818 epoch 42 - iter 1116/3720 - loss 0.03564249 - time (sec): 190.64 - samples/sec: 4964.53 - lr: 0.100000 +2023-04-06 05:50:31,722 epoch 42 - iter 1488/3720 - loss 0.03576905 - time (sec): 253.54 - samples/sec: 4973.25 - lr: 0.100000 +2023-04-06 05:51:35,060 epoch 42 - iter 1860/3720 - loss 0.03575105 - time (sec): 316.88 - samples/sec: 4973.78 - lr: 0.100000 +2023-04-06 05:52:37,857 epoch 42 - iter 2232/3720 - loss 0.03583953 - time (sec): 379.68 - samples/sec: 4976.50 - lr: 0.100000 +2023-04-06 05:53:41,974 epoch 42 - iter 2604/3720 - loss 0.03599862 - time (sec): 443.80 - samples/sec: 4967.95 - lr: 0.100000 +2023-04-06 05:54:44,560 epoch 42 - iter 2976/3720 - loss 0.03603327 - time (sec): 506.38 - samples/sec: 4976.54 - lr: 0.100000 +2023-04-06 05:55:48,409 epoch 42 - iter 3348/3720 - loss 0.03596564 - time (sec): 570.23 - samples/sec: 4975.43 - lr: 0.100000 +2023-04-06 05:56:52,312 epoch 42 - iter 3720/3720 - loss 0.03602839 - time (sec): 634.13 - samples/sec: 4970.11 - lr: 0.100000 +2023-04-06 05:56:52,313 ---------------------------------------------------------------------------------------------------- +2023-04-06 05:56:52,313 EPOCH 42 done: loss 0.0360 - lr 0.100000 +2023-04-06 05:56:52,313 BAD EPOCHS (no improvement): 0 +2023-04-06 05:56:52,316 ---------------------------------------------------------------------------------------------------- +2023-04-06 05:57:55,724 epoch 43 - iter 372/3720 - loss 0.03555848 - time (sec): 63.41 - samples/sec: 5039.09 - lr: 0.100000 +2023-04-06 05:58:58,889 epoch 43 - iter 744/3720 - loss 0.03560942 - time (sec): 126.57 - samples/sec: 5011.99 - lr: 0.100000 +2023-04-06 06:00:02,000 epoch 43 - iter 1116/3720 - loss 0.03581274 - time (sec): 189.68 - samples/sec: 5002.83 - lr: 0.100000 +2023-04-06 06:01:04,999 epoch 43 - iter 1488/3720 - loss 0.03581777 - time (sec): 252.68 - samples/sec: 4999.78 - lr: 0.100000 +2023-04-06 06:02:09,423 epoch 43 - iter 1860/3720 - loss 0.03587032 - time (sec): 317.11 - samples/sec: 4983.13 - lr: 0.100000 +2023-04-06 06:03:13,413 epoch 43 - iter 2232/3720 - loss 0.03602507 - time (sec): 381.10 - samples/sec: 4968.34 - lr: 0.100000 +2023-04-06 06:04:16,662 epoch 43 - iter 2604/3720 - loss 0.03608633 - time (sec): 444.35 - samples/sec: 4969.57 - lr: 0.100000 +2023-04-06 06:05:20,951 epoch 43 - iter 2976/3720 - loss 0.03607723 - time (sec): 508.63 - samples/sec: 4960.06 - lr: 0.100000 +2023-04-06 06:06:24,950 epoch 43 - iter 3348/3720 - loss 0.03619460 - time (sec): 572.63 - samples/sec: 4954.04 - lr: 0.100000 +2023-04-06 06:07:28,532 epoch 43 - iter 3720/3720 - loss 0.03611081 - time (sec): 636.22 - samples/sec: 4953.84 - lr: 0.100000 +2023-04-06 06:07:28,533 ---------------------------------------------------------------------------------------------------- +2023-04-06 06:07:28,533 EPOCH 43 done: loss 0.0361 - lr 0.100000 +2023-04-06 06:07:28,533 BAD EPOCHS (no improvement): 1 +2023-04-06 06:07:28,539 ---------------------------------------------------------------------------------------------------- +2023-04-06 06:08:31,206 epoch 44 - iter 372/3720 - loss 0.03589108 - time (sec): 62.67 - samples/sec: 5020.94 - lr: 0.100000 +2023-04-06 06:09:34,097 epoch 44 - iter 744/3720 - loss 0.03586768 - time (sec): 125.56 - samples/sec: 5028.57 - lr: 0.100000 +2023-04-06 06:10:37,457 epoch 44 - iter 1116/3720 - loss 0.03612357 - time (sec): 188.92 - samples/sec: 5009.90 - lr: 0.100000 +2023-04-06 06:11:40,707 epoch 44 - iter 1488/3720 - loss 0.03610499 - time (sec): 252.17 - samples/sec: 5001.98 - lr: 0.100000 +2023-04-06 06:12:43,165 epoch 44 - iter 1860/3720 - loss 0.03594915 - time (sec): 314.63 - samples/sec: 5011.35 - lr: 0.100000 +2023-04-06 06:13:45,140 epoch 44 - iter 2232/3720 - loss 0.03609889 - time (sec): 376.60 - samples/sec: 5020.84 - lr: 0.100000 +2023-04-06 06:14:48,197 epoch 44 - iter 2604/3720 - loss 0.03615081 - time (sec): 439.66 - samples/sec: 5015.06 - lr: 0.100000 +2023-04-06 06:15:51,641 epoch 44 - iter 2976/3720 - loss 0.03602430 - time (sec): 503.10 - samples/sec: 5007.21 - lr: 0.100000 +2023-04-06 06:16:56,633 epoch 44 - iter 3348/3720 - loss 0.03602352 - time (sec): 568.09 - samples/sec: 4990.70 - lr: 0.100000 +2023-04-06 06:18:01,163 epoch 44 - iter 3720/3720 - loss 0.03604926 - time (sec): 632.62 - samples/sec: 4981.97 - lr: 0.100000 +2023-04-06 06:18:01,164 ---------------------------------------------------------------------------------------------------- +2023-04-06 06:18:01,164 EPOCH 44 done: loss 0.0360 - lr 0.100000 +2023-04-06 06:18:01,164 BAD EPOCHS (no improvement): 2 +2023-04-06 06:18:01,170 ---------------------------------------------------------------------------------------------------- +2023-04-06 06:19:05,090 epoch 45 - iter 372/3720 - loss 0.03615835 - time (sec): 63.92 - samples/sec: 4940.37 - lr: 0.100000 +2023-04-06 06:20:08,176 epoch 45 - iter 744/3720 - loss 0.03552771 - time (sec): 127.01 - samples/sec: 4975.27 - lr: 0.100000 +2023-04-06 06:21:12,225 epoch 45 - iter 1116/3720 - loss 0.03555194 - time (sec): 191.06 - samples/sec: 4949.78 - lr: 0.100000 +2023-04-06 06:22:13,586 epoch 45 - iter 1488/3720 - loss 0.03556429 - time (sec): 252.42 - samples/sec: 4983.47 - lr: 0.100000 +2023-04-06 06:23:16,041 epoch 45 - iter 1860/3720 - loss 0.03557876 - time (sec): 314.87 - samples/sec: 4997.62 - lr: 0.100000 +2023-04-06 06:24:18,043 epoch 45 - iter 2232/3720 - loss 0.03578220 - time (sec): 376.87 - samples/sec: 5008.33 - lr: 0.100000 +2023-04-06 06:25:21,526 epoch 45 - iter 2604/3720 - loss 0.03584423 - time (sec): 440.36 - samples/sec: 5003.44 - lr: 0.100000 +2023-04-06 06:26:25,628 epoch 45 - iter 2976/3720 - loss 0.03575174 - time (sec): 504.46 - samples/sec: 4997.42 - lr: 0.100000 +2023-04-06 06:27:29,722 epoch 45 - iter 3348/3720 - loss 0.03583934 - time (sec): 568.55 - samples/sec: 4990.60 - lr: 0.100000 +2023-04-06 06:28:33,643 epoch 45 - iter 3720/3720 - loss 0.03588281 - time (sec): 632.47 - samples/sec: 4983.16 - lr: 0.100000 +2023-04-06 06:28:33,643 ---------------------------------------------------------------------------------------------------- +2023-04-06 06:28:33,643 EPOCH 45 done: loss 0.0359 - lr 0.100000 +2023-04-06 06:28:33,643 BAD EPOCHS (no improvement): 0 +2023-04-06 06:28:33,648 ---------------------------------------------------------------------------------------------------- +2023-04-06 06:29:36,550 epoch 46 - iter 372/3720 - loss 0.03630327 - time (sec): 62.90 - samples/sec: 4974.87 - lr: 0.100000 +2023-04-06 06:30:40,187 epoch 46 - iter 744/3720 - loss 0.03559881 - time (sec): 126.54 - samples/sec: 4984.12 - lr: 0.100000 +2023-04-06 06:31:44,689 epoch 46 - iter 1116/3720 - loss 0.03595745 - time (sec): 191.04 - samples/sec: 4963.69 - lr: 0.100000 +2023-04-06 06:32:48,098 epoch 46 - iter 1488/3720 - loss 0.03574153 - time (sec): 254.45 - samples/sec: 4961.50 - lr: 0.100000 +2023-04-06 06:33:51,369 epoch 46 - iter 1860/3720 - loss 0.03583519 - time (sec): 317.72 - samples/sec: 4969.38 - lr: 0.100000 +2023-04-06 06:34:53,314 epoch 46 - iter 2232/3720 - loss 0.03585869 - time (sec): 379.67 - samples/sec: 4982.85 - lr: 0.100000 +2023-04-06 06:35:55,870 epoch 46 - iter 2604/3720 - loss 0.03613151 - time (sec): 442.22 - samples/sec: 4991.54 - lr: 0.100000 +2023-04-06 06:36:57,688 epoch 46 - iter 2976/3720 - loss 0.03613827 - time (sec): 504.04 - samples/sec: 5000.94 - lr: 0.100000 +2023-04-06 06:38:01,506 epoch 46 - iter 3348/3720 - loss 0.03615893 - time (sec): 567.86 - samples/sec: 4994.24 - lr: 0.100000 +2023-04-06 06:39:06,195 epoch 46 - iter 3720/3720 - loss 0.03607414 - time (sec): 632.55 - samples/sec: 4982.58 - lr: 0.100000 +2023-04-06 06:39:06,195 ---------------------------------------------------------------------------------------------------- +2023-04-06 06:39:06,195 EPOCH 46 done: loss 0.0361 - lr 0.100000 +2023-04-06 06:39:06,196 BAD EPOCHS (no improvement): 1 +2023-04-06 06:39:06,199 ---------------------------------------------------------------------------------------------------- +2023-04-06 06:40:10,485 epoch 47 - iter 372/3720 - loss 0.03617819 - time (sec): 64.29 - samples/sec: 4897.36 - lr: 0.100000 +2023-04-06 06:41:12,875 epoch 47 - iter 744/3720 - loss 0.03616579 - time (sec): 126.68 - samples/sec: 4974.47 - lr: 0.100000 +2023-04-06 06:42:15,327 epoch 47 - iter 1116/3720 - loss 0.03586013 - time (sec): 189.13 - samples/sec: 4991.27 - lr: 0.100000 +2023-04-06 06:43:19,618 epoch 47 - iter 1488/3720 - loss 0.03567191 - time (sec): 253.42 - samples/sec: 4975.30 - lr: 0.100000 +2023-04-06 06:44:22,746 epoch 47 - iter 1860/3720 - loss 0.03560712 - time (sec): 316.55 - samples/sec: 4979.93 - lr: 0.100000 +2023-04-06 06:45:24,829 epoch 47 - iter 2232/3720 - loss 0.03572832 - time (sec): 378.63 - samples/sec: 4993.69 - lr: 0.100000 +2023-04-06 06:46:28,144 epoch 47 - iter 2604/3720 - loss 0.03585095 - time (sec): 441.95 - samples/sec: 4988.66 - lr: 0.100000 +2023-04-06 06:47:32,397 epoch 47 - iter 2976/3720 - loss 0.03587577 - time (sec): 506.20 - samples/sec: 4978.63 - lr: 0.100000 +2023-04-06 06:48:37,163 epoch 47 - iter 3348/3720 - loss 0.03588128 - time (sec): 570.96 - samples/sec: 4968.15 - lr: 0.100000 +2023-04-06 06:49:40,834 epoch 47 - iter 3720/3720 - loss 0.03594796 - time (sec): 634.64 - samples/sec: 4966.18 - lr: 0.100000 +2023-04-06 06:49:40,834 ---------------------------------------------------------------------------------------------------- +2023-04-06 06:49:40,834 EPOCH 47 done: loss 0.0359 - lr 0.100000 +2023-04-06 06:49:40,834 BAD EPOCHS (no improvement): 2 +2023-04-06 06:49:40,841 ---------------------------------------------------------------------------------------------------- +2023-04-06 06:50:44,233 epoch 48 - iter 372/3720 - loss 0.03554580 - time (sec): 63.39 - samples/sec: 4933.11 - lr: 0.100000 +2023-04-06 06:51:47,269 epoch 48 - iter 744/3720 - loss 0.03555960 - time (sec): 126.43 - samples/sec: 4996.62 - lr: 0.100000 +2023-04-06 06:52:49,964 epoch 48 - iter 1116/3720 - loss 0.03584024 - time (sec): 189.12 - samples/sec: 4999.42 - lr: 0.100000 +2023-04-06 06:53:53,479 epoch 48 - iter 1488/3720 - loss 0.03588851 - time (sec): 252.64 - samples/sec: 4988.01 - lr: 0.100000 +2023-04-06 06:54:56,070 epoch 48 - iter 1860/3720 - loss 0.03575096 - time (sec): 315.23 - samples/sec: 4997.40 - lr: 0.100000 +2023-04-06 06:55:58,504 epoch 48 - iter 2232/3720 - loss 0.03572593 - time (sec): 377.66 - samples/sec: 5006.22 - lr: 0.100000 +2023-04-06 06:57:01,545 epoch 48 - iter 2604/3720 - loss 0.03571595 - time (sec): 440.70 - samples/sec: 5007.16 - lr: 0.100000 +2023-04-06 06:58:05,462 epoch 48 - iter 2976/3720 - loss 0.03582259 - time (sec): 504.62 - samples/sec: 4997.59 - lr: 0.100000 +2023-04-06 06:59:10,299 epoch 48 - iter 3348/3720 - loss 0.03577259 - time (sec): 569.46 - samples/sec: 4985.30 - lr: 0.100000 +2023-04-06 07:00:13,789 epoch 48 - iter 3720/3720 - loss 0.03577572 - time (sec): 632.95 - samples/sec: 4979.42 - lr: 0.100000 +2023-04-06 07:00:13,789 ---------------------------------------------------------------------------------------------------- +2023-04-06 07:00:13,789 EPOCH 48 done: loss 0.0358 - lr 0.100000 +2023-04-06 07:00:13,789 BAD EPOCHS (no improvement): 0 +2023-04-06 07:00:13,796 ---------------------------------------------------------------------------------------------------- +2023-04-06 07:01:17,203 epoch 49 - iter 372/3720 - loss 0.03554267 - time (sec): 63.41 - samples/sec: 4962.01 - lr: 0.100000 +2023-04-06 07:02:21,293 epoch 49 - iter 744/3720 - loss 0.03562803 - time (sec): 127.50 - samples/sec: 4939.84 - lr: 0.100000 +2023-04-06 07:03:25,257 epoch 49 - iter 1116/3720 - loss 0.03544781 - time (sec): 191.46 - samples/sec: 4933.92 - lr: 0.100000 +2023-04-06 07:04:30,417 epoch 49 - iter 1488/3720 - loss 0.03547625 - time (sec): 256.62 - samples/sec: 4925.15 - lr: 0.100000 +2023-04-06 07:05:33,971 epoch 49 - iter 1860/3720 - loss 0.03561882 - time (sec): 320.17 - samples/sec: 4931.75 - lr: 0.100000 +2023-04-06 07:06:38,334 epoch 49 - iter 2232/3720 - loss 0.03562794 - time (sec): 384.54 - samples/sec: 4924.24 - lr: 0.100000 +2023-04-06 07:07:41,637 epoch 49 - iter 2604/3720 - loss 0.03558202 - time (sec): 447.84 - samples/sec: 4925.04 - lr: 0.100000 +2023-04-06 07:08:46,559 epoch 49 - iter 2976/3720 - loss 0.03573090 - time (sec): 512.76 - samples/sec: 4922.24 - lr: 0.100000 +2023-04-06 07:09:49,950 epoch 49 - iter 3348/3720 - loss 0.03567211 - time (sec): 576.15 - samples/sec: 4926.28 - lr: 0.100000 +2023-04-06 07:10:53,102 epoch 49 - iter 3720/3720 - loss 0.03593851 - time (sec): 639.31 - samples/sec: 4929.90 - lr: 0.100000 +2023-04-06 07:10:53,102 ---------------------------------------------------------------------------------------------------- +2023-04-06 07:10:53,103 EPOCH 49 done: loss 0.0359 - lr 0.100000 +2023-04-06 07:10:53,103 BAD EPOCHS (no improvement): 1 +2023-04-06 07:10:53,106 ---------------------------------------------------------------------------------------------------- +2023-04-06 07:11:57,194 epoch 50 - iter 372/3720 - loss 0.03592104 - time (sec): 64.09 - samples/sec: 4918.69 - lr: 0.100000 +2023-04-06 07:13:01,310 epoch 50 - iter 744/3720 - loss 0.03541568 - time (sec): 128.20 - samples/sec: 4905.25 - lr: 0.100000 +2023-04-06 07:14:05,523 epoch 50 - iter 1116/3720 - loss 0.03570905 - time (sec): 192.42 - samples/sec: 4907.23 - lr: 0.100000 +2023-04-06 07:15:09,667 epoch 50 - iter 1488/3720 - loss 0.03571792 - time (sec): 256.56 - samples/sec: 4905.33 - lr: 0.100000 +2023-04-06 07:16:13,919 epoch 50 - iter 1860/3720 - loss 0.03584356 - time (sec): 320.81 - samples/sec: 4905.96 - lr: 0.100000 +2023-04-06 07:17:17,370 epoch 50 - iter 2232/3720 - loss 0.03600621 - time (sec): 384.26 - samples/sec: 4919.86 - lr: 0.100000 +2023-04-06 07:18:21,980 epoch 50 - iter 2604/3720 - loss 0.03591886 - time (sec): 448.87 - samples/sec: 4915.19 - lr: 0.100000 +2023-04-06 07:19:24,867 epoch 50 - iter 2976/3720 - loss 0.03588801 - time (sec): 511.76 - samples/sec: 4924.26 - lr: 0.100000 +2023-04-06 07:20:27,929 epoch 50 - iter 3348/3720 - loss 0.03591384 - time (sec): 574.82 - samples/sec: 4931.97 - lr: 0.100000 +2023-04-06 07:21:31,603 epoch 50 - iter 3720/3720 - loss 0.03593144 - time (sec): 638.50 - samples/sec: 4936.14 - lr: 0.100000 +2023-04-06 07:21:31,604 ---------------------------------------------------------------------------------------------------- +2023-04-06 07:21:31,604 EPOCH 50 done: loss 0.0359 - lr 0.100000 +2023-04-06 07:21:31,604 BAD EPOCHS (no improvement): 2 +2023-04-06 07:21:31,607 ---------------------------------------------------------------------------------------------------- +2023-04-06 07:22:35,309 epoch 51 - iter 372/3720 - loss 0.03611297 - time (sec): 63.70 - samples/sec: 4940.79 - lr: 0.100000 +2023-04-06 07:23:39,113 epoch 51 - iter 744/3720 - loss 0.03558047 - time (sec): 127.51 - samples/sec: 4945.55 - lr: 0.100000 +2023-04-06 07:24:42,508 epoch 51 - iter 1116/3720 - loss 0.03554481 - time (sec): 190.90 - samples/sec: 4959.02 - lr: 0.100000 +2023-04-06 07:25:45,777 epoch 51 - iter 1488/3720 - loss 0.03589186 - time (sec): 254.17 - samples/sec: 4954.67 - lr: 0.100000 +2023-04-06 07:26:48,204 epoch 51 - iter 1860/3720 - loss 0.03598627 - time (sec): 316.60 - samples/sec: 4969.12 - lr: 0.100000 +2023-04-06 07:27:52,011 epoch 51 - iter 2232/3720 - loss 0.03592064 - time (sec): 380.40 - samples/sec: 4964.39 - lr: 0.100000 +2023-04-06 07:28:56,520 epoch 51 - iter 2604/3720 - loss 0.03586564 - time (sec): 444.91 - samples/sec: 4955.78 - lr: 0.100000 +2023-04-06 07:30:01,001 epoch 51 - iter 2976/3720 - loss 0.03586686 - time (sec): 509.39 - samples/sec: 4945.34 - lr: 0.100000 +2023-04-06 07:31:05,031 epoch 51 - iter 3348/3720 - loss 0.03590195 - time (sec): 573.42 - samples/sec: 4948.82 - lr: 0.100000 +2023-04-06 07:32:08,022 epoch 51 - iter 3720/3720 - loss 0.03604278 - time (sec): 636.42 - samples/sec: 4952.29 - lr: 0.100000 +2023-04-06 07:32:08,023 ---------------------------------------------------------------------------------------------------- +2023-04-06 07:32:08,023 EPOCH 51 done: loss 0.0360 - lr 0.100000 +2023-04-06 07:32:08,023 BAD EPOCHS (no improvement): 3 +2023-04-06 07:32:08,026 ---------------------------------------------------------------------------------------------------- +2023-04-06 07:33:12,509 epoch 52 - iter 372/3720 - loss 0.03469880 - time (sec): 64.48 - samples/sec: 4932.91 - lr: 0.100000 +2023-04-06 07:34:16,091 epoch 52 - iter 744/3720 - loss 0.03495443 - time (sec): 128.06 - samples/sec: 4943.58 - lr: 0.100000 +2023-04-06 07:35:19,627 epoch 52 - iter 1116/3720 - loss 0.03503903 - time (sec): 191.60 - samples/sec: 4943.40 - lr: 0.100000 +2023-04-06 07:36:22,813 epoch 52 - iter 1488/3720 - loss 0.03533135 - time (sec): 254.79 - samples/sec: 4952.14 - lr: 0.100000 +2023-04-06 07:37:26,237 epoch 52 - iter 1860/3720 - loss 0.03548857 - time (sec): 318.21 - samples/sec: 4955.48 - lr: 0.100000 +2023-04-06 07:38:29,896 epoch 52 - iter 2232/3720 - loss 0.03561160 - time (sec): 381.87 - samples/sec: 4953.14 - lr: 0.100000 +2023-04-06 07:39:34,068 epoch 52 - iter 2604/3720 - loss 0.03563686 - time (sec): 446.04 - samples/sec: 4945.79 - lr: 0.100000 +2023-04-06 07:40:36,586 epoch 52 - iter 2976/3720 - loss 0.03573569 - time (sec): 508.56 - samples/sec: 4960.11 - lr: 0.100000 +2023-04-06 07:41:39,467 epoch 52 - iter 3348/3720 - loss 0.03569256 - time (sec): 571.44 - samples/sec: 4966.97 - lr: 0.100000 +2023-04-06 07:42:41,221 epoch 52 - iter 3720/3720 - loss 0.03576243 - time (sec): 633.20 - samples/sec: 4977.47 - lr: 0.100000 +2023-04-06 07:42:41,222 ---------------------------------------------------------------------------------------------------- +2023-04-06 07:42:41,222 EPOCH 52 done: loss 0.0358 - lr 0.100000 +2023-04-06 07:42:41,222 BAD EPOCHS (no improvement): 0 +2023-04-06 07:42:41,225 ---------------------------------------------------------------------------------------------------- +2023-04-06 07:43:44,567 epoch 53 - iter 372/3720 - loss 0.03521698 - time (sec): 63.34 - samples/sec: 5001.75 - lr: 0.100000 +2023-04-06 07:44:47,871 epoch 53 - iter 744/3720 - loss 0.03535323 - time (sec): 126.65 - samples/sec: 4997.61 - lr: 0.100000 +2023-04-06 07:45:50,809 epoch 53 - iter 1116/3720 - loss 0.03581383 - time (sec): 189.58 - samples/sec: 4994.56 - lr: 0.100000 +2023-04-06 07:46:54,008 epoch 53 - iter 1488/3720 - loss 0.03585699 - time (sec): 252.78 - samples/sec: 4993.35 - lr: 0.100000 +2023-04-06 07:47:57,315 epoch 53 - iter 1860/3720 - loss 0.03546709 - time (sec): 316.09 - samples/sec: 4991.47 - lr: 0.100000 +2023-04-06 07:48:59,339 epoch 53 - iter 2232/3720 - loss 0.03559660 - time (sec): 378.11 - samples/sec: 5004.44 - lr: 0.100000 +2023-04-06 07:50:03,686 epoch 53 - iter 2604/3720 - loss 0.03560430 - time (sec): 442.46 - samples/sec: 4989.10 - lr: 0.100000 +2023-04-06 07:51:06,555 epoch 53 - iter 2976/3720 - loss 0.03555950 - time (sec): 505.33 - samples/sec: 4991.29 - lr: 0.100000 +2023-04-06 07:52:09,988 epoch 53 - iter 3348/3720 - loss 0.03568930 - time (sec): 568.76 - samples/sec: 4988.07 - lr: 0.100000 +2023-04-06 07:53:13,140 epoch 53 - iter 3720/3720 - loss 0.03572553 - time (sec): 631.92 - samples/sec: 4987.55 - lr: 0.100000 +2023-04-06 07:53:13,140 ---------------------------------------------------------------------------------------------------- +2023-04-06 07:53:13,140 EPOCH 53 done: loss 0.0357 - lr 0.100000 +2023-04-06 07:53:13,140 BAD EPOCHS (no improvement): 0 +2023-04-06 07:53:13,143 ---------------------------------------------------------------------------------------------------- +2023-04-06 07:54:17,019 epoch 54 - iter 372/3720 - loss 0.03507077 - time (sec): 63.88 - samples/sec: 4987.30 - lr: 0.100000 +2023-04-06 07:55:20,628 epoch 54 - iter 744/3720 - loss 0.03503947 - time (sec): 127.48 - samples/sec: 4965.15 - lr: 0.100000 +2023-04-06 07:56:23,731 epoch 54 - iter 1116/3720 - loss 0.03511696 - time (sec): 190.59 - samples/sec: 4967.04 - lr: 0.100000 +2023-04-06 07:57:27,250 epoch 54 - iter 1488/3720 - loss 0.03537984 - time (sec): 254.11 - samples/sec: 4964.39 - lr: 0.100000 +2023-04-06 07:58:30,162 epoch 54 - iter 1860/3720 - loss 0.03556180 - time (sec): 317.02 - samples/sec: 4972.03 - lr: 0.100000 +2023-04-06 07:59:33,372 epoch 54 - iter 2232/3720 - loss 0.03557394 - time (sec): 380.23 - samples/sec: 4973.89 - lr: 0.100000 +2023-04-06 08:00:36,612 epoch 54 - iter 2604/3720 - loss 0.03562157 - time (sec): 443.47 - samples/sec: 4973.17 - lr: 0.100000 +2023-04-06 08:01:39,834 epoch 54 - iter 2976/3720 - loss 0.03558331 - time (sec): 506.69 - samples/sec: 4975.68 - lr: 0.100000 +2023-04-06 08:02:43,251 epoch 54 - iter 3348/3720 - loss 0.03570854 - time (sec): 570.11 - samples/sec: 4975.42 - lr: 0.100000 +2023-04-06 08:03:47,595 epoch 54 - iter 3720/3720 - loss 0.03576077 - time (sec): 634.45 - samples/sec: 4967.62 - lr: 0.100000 +2023-04-06 08:03:47,595 ---------------------------------------------------------------------------------------------------- +2023-04-06 08:03:47,595 EPOCH 54 done: loss 0.0358 - lr 0.100000 +2023-04-06 08:03:47,595 BAD EPOCHS (no improvement): 1 +2023-04-06 08:03:47,599 ---------------------------------------------------------------------------------------------------- +2023-04-06 08:04:50,499 epoch 55 - iter 372/3720 - loss 0.03556611 - time (sec): 62.90 - samples/sec: 4994.47 - lr: 0.100000 +2023-04-06 08:05:55,305 epoch 55 - iter 744/3720 - loss 0.03582456 - time (sec): 127.71 - samples/sec: 4965.91 - lr: 0.100000 +2023-04-06 08:06:59,007 epoch 55 - iter 1116/3720 - loss 0.03548060 - time (sec): 191.41 - samples/sec: 4957.25 - lr: 0.100000 +2023-04-06 08:08:01,743 epoch 55 - iter 1488/3720 - loss 0.03558508 - time (sec): 254.14 - samples/sec: 4963.79 - lr: 0.100000 +2023-04-06 08:09:05,576 epoch 55 - iter 1860/3720 - loss 0.03554312 - time (sec): 317.98 - samples/sec: 4962.03 - lr: 0.100000 +2023-04-06 08:10:08,908 epoch 55 - iter 2232/3720 - loss 0.03566213 - time (sec): 381.31 - samples/sec: 4960.97 - lr: 0.100000 +2023-04-06 08:11:12,955 epoch 55 - iter 2604/3720 - loss 0.03578027 - time (sec): 445.36 - samples/sec: 4957.57 - lr: 0.100000 +2023-04-06 08:12:16,798 epoch 55 - iter 2976/3720 - loss 0.03576108 - time (sec): 509.20 - samples/sec: 4956.91 - lr: 0.100000 +2023-04-06 08:13:19,582 epoch 55 - iter 3348/3720 - loss 0.03580154 - time (sec): 571.98 - samples/sec: 4963.63 - lr: 0.100000 +2023-04-06 08:14:22,205 epoch 55 - iter 3720/3720 - loss 0.03582617 - time (sec): 634.61 - samples/sec: 4966.41 - lr: 0.100000 +2023-04-06 08:14:22,205 ---------------------------------------------------------------------------------------------------- +2023-04-06 08:14:22,205 EPOCH 55 done: loss 0.0358 - lr 0.100000 +2023-04-06 08:14:22,205 BAD EPOCHS (no improvement): 2 +2023-04-06 08:14:22,208 ---------------------------------------------------------------------------------------------------- +2023-04-06 08:15:24,411 epoch 56 - iter 372/3720 - loss 0.03443706 - time (sec): 62.20 - samples/sec: 5036.04 - lr: 0.100000 +2023-04-06 08:16:26,636 epoch 56 - iter 744/3720 - loss 0.03516020 - time (sec): 124.43 - samples/sec: 5058.82 - lr: 0.100000 +2023-04-06 08:17:30,105 epoch 56 - iter 1116/3720 - loss 0.03535747 - time (sec): 187.90 - samples/sec: 5032.65 - lr: 0.100000 +2023-04-06 08:18:34,643 epoch 56 - iter 1488/3720 - loss 0.03554717 - time (sec): 252.43 - samples/sec: 4997.00 - lr: 0.100000 +2023-04-06 08:19:38,306 epoch 56 - iter 1860/3720 - loss 0.03543249 - time (sec): 316.10 - samples/sec: 4988.13 - lr: 0.100000 +2023-04-06 08:20:41,104 epoch 56 - iter 2232/3720 - loss 0.03532255 - time (sec): 378.90 - samples/sec: 4989.87 - lr: 0.100000 +2023-04-06 08:21:44,361 epoch 56 - iter 2604/3720 - loss 0.03531136 - time (sec): 442.15 - samples/sec: 4991.51 - lr: 0.100000 +2023-04-06 08:22:47,628 epoch 56 - iter 2976/3720 - loss 0.03552810 - time (sec): 505.42 - samples/sec: 4987.43 - lr: 0.100000 +2023-04-06 08:23:50,303 epoch 56 - iter 3348/3720 - loss 0.03562046 - time (sec): 568.09 - samples/sec: 4993.31 - lr: 0.100000 +2023-04-06 08:24:54,359 epoch 56 - iter 3720/3720 - loss 0.03579107 - time (sec): 632.15 - samples/sec: 4985.70 - lr: 0.100000 +2023-04-06 08:24:54,359 ---------------------------------------------------------------------------------------------------- +2023-04-06 08:24:54,359 EPOCH 56 done: loss 0.0358 - lr 0.100000 +2023-04-06 08:24:54,360 BAD EPOCHS (no improvement): 3 +2023-04-06 08:24:54,365 ---------------------------------------------------------------------------------------------------- +2023-04-06 08:25:58,233 epoch 57 - iter 372/3720 - loss 0.03522513 - time (sec): 63.87 - samples/sec: 4903.71 - lr: 0.100000 +2023-04-06 08:27:02,754 epoch 57 - iter 744/3720 - loss 0.03543756 - time (sec): 128.39 - samples/sec: 4900.92 - lr: 0.100000 +2023-04-06 08:28:06,253 epoch 57 - iter 1116/3720 - loss 0.03571462 - time (sec): 191.89 - samples/sec: 4914.12 - lr: 0.100000 +2023-04-06 08:29:10,700 epoch 57 - iter 1488/3720 - loss 0.03566904 - time (sec): 256.33 - samples/sec: 4913.95 - lr: 0.100000 +2023-04-06 08:30:14,899 epoch 57 - iter 1860/3720 - loss 0.03573546 - time (sec): 320.53 - samples/sec: 4908.38 - lr: 0.100000 +2023-04-06 08:31:19,151 epoch 57 - iter 2232/3720 - loss 0.03548699 - time (sec): 384.79 - samples/sec: 4914.70 - lr: 0.100000 +2023-04-06 08:32:23,916 epoch 57 - iter 2604/3720 - loss 0.03546777 - time (sec): 449.55 - samples/sec: 4909.01 - lr: 0.100000 +2023-04-06 08:33:27,136 epoch 57 - iter 2976/3720 - loss 0.03550752 - time (sec): 512.77 - samples/sec: 4915.96 - lr: 0.100000 +2023-04-06 08:34:29,964 epoch 57 - iter 3348/3720 - loss 0.03561924 - time (sec): 575.60 - samples/sec: 4927.39 - lr: 0.100000 +2023-04-06 08:35:32,600 epoch 57 - iter 3720/3720 - loss 0.03564062 - time (sec): 638.23 - samples/sec: 4938.17 - lr: 0.100000 +2023-04-06 08:35:32,600 ---------------------------------------------------------------------------------------------------- +2023-04-06 08:35:32,600 EPOCH 57 done: loss 0.0356 - lr 0.100000 +2023-04-06 08:35:32,600 BAD EPOCHS (no improvement): 0 +2023-04-06 08:35:32,603 ---------------------------------------------------------------------------------------------------- +2023-04-06 08:36:36,646 epoch 58 - iter 372/3720 - loss 0.03509077 - time (sec): 64.04 - samples/sec: 4929.77 - lr: 0.100000 +2023-04-06 08:37:39,835 epoch 58 - iter 744/3720 - loss 0.03566188 - time (sec): 127.23 - samples/sec: 4947.50 - lr: 0.100000 +2023-04-06 08:38:43,340 epoch 58 - iter 1116/3720 - loss 0.03548289 - time (sec): 190.74 - samples/sec: 4958.98 - lr: 0.100000 +2023-04-06 08:39:47,722 epoch 58 - iter 1488/3720 - loss 0.03546883 - time (sec): 255.12 - samples/sec: 4945.43 - lr: 0.100000 +2023-04-06 08:40:51,456 epoch 58 - iter 1860/3720 - loss 0.03546374 - time (sec): 318.85 - samples/sec: 4948.67 - lr: 0.100000 +2023-04-06 08:41:55,028 epoch 58 - iter 2232/3720 - loss 0.03558942 - time (sec): 382.42 - samples/sec: 4948.86 - lr: 0.100000 +2023-04-06 08:42:59,081 epoch 58 - iter 2604/3720 - loss 0.03561752 - time (sec): 446.48 - samples/sec: 4949.39 - lr: 0.100000 +2023-04-06 08:44:01,965 epoch 58 - iter 2976/3720 - loss 0.03565205 - time (sec): 509.36 - samples/sec: 4956.64 - lr: 0.100000 +2023-04-06 08:45:04,932 epoch 58 - iter 3348/3720 - loss 0.03555554 - time (sec): 572.33 - samples/sec: 4955.43 - lr: 0.100000 +2023-04-06 08:46:08,504 epoch 58 - iter 3720/3720 - loss 0.03565709 - time (sec): 635.90 - samples/sec: 4956.29 - lr: 0.100000 +2023-04-06 08:46:08,505 ---------------------------------------------------------------------------------------------------- +2023-04-06 08:46:08,505 EPOCH 58 done: loss 0.0357 - lr 0.100000 +2023-04-06 08:46:08,505 BAD EPOCHS (no improvement): 1 +2023-04-06 08:46:08,507 ---------------------------------------------------------------------------------------------------- +2023-04-06 08:47:10,580 epoch 59 - iter 372/3720 - loss 0.03472784 - time (sec): 62.07 - samples/sec: 5052.42 - lr: 0.100000 +2023-04-06 08:48:14,755 epoch 59 - iter 744/3720 - loss 0.03524033 - time (sec): 126.25 - samples/sec: 4975.16 - lr: 0.100000 +2023-04-06 08:49:18,120 epoch 59 - iter 1116/3720 - loss 0.03561557 - time (sec): 189.61 - samples/sec: 4966.12 - lr: 0.100000 +2023-04-06 08:50:20,947 epoch 59 - iter 1488/3720 - loss 0.03555656 - time (sec): 252.44 - samples/sec: 4975.37 - lr: 0.100000 +2023-04-06 08:51:25,738 epoch 59 - iter 1860/3720 - loss 0.03548465 - time (sec): 317.23 - samples/sec: 4959.79 - lr: 0.100000 +2023-04-06 08:52:30,049 epoch 59 - iter 2232/3720 - loss 0.03548318 - time (sec): 381.54 - samples/sec: 4950.57 - lr: 0.100000 +2023-04-06 08:53:34,190 epoch 59 - iter 2604/3720 - loss 0.03569103 - time (sec): 445.68 - samples/sec: 4948.31 - lr: 0.100000 +2023-04-06 08:54:37,949 epoch 59 - iter 2976/3720 - loss 0.03575223 - time (sec): 509.44 - samples/sec: 4951.91 - lr: 0.100000 +2023-04-06 08:55:41,386 epoch 59 - iter 3348/3720 - loss 0.03581366 - time (sec): 572.88 - samples/sec: 4952.70 - lr: 0.100000 +2023-04-06 08:56:45,986 epoch 59 - iter 3720/3720 - loss 0.03587479 - time (sec): 637.48 - samples/sec: 4944.03 - lr: 0.100000 +2023-04-06 08:56:45,987 ---------------------------------------------------------------------------------------------------- +2023-04-06 08:56:45,987 EPOCH 59 done: loss 0.0359 - lr 0.100000 +2023-04-06 08:56:45,987 BAD EPOCHS (no improvement): 2 +2023-04-06 08:56:45,989 ---------------------------------------------------------------------------------------------------- +2023-04-06 08:57:48,730 epoch 60 - iter 372/3720 - loss 0.03499679 - time (sec): 62.74 - samples/sec: 5000.59 - lr: 0.100000 +2023-04-06 08:58:52,636 epoch 60 - iter 744/3720 - loss 0.03512788 - time (sec): 126.65 - samples/sec: 4981.76 - lr: 0.100000 +2023-04-06 08:59:56,347 epoch 60 - iter 1116/3720 - loss 0.03529976 - time (sec): 190.36 - samples/sec: 4968.31 - lr: 0.100000 +2023-04-06 09:00:59,103 epoch 60 - iter 1488/3720 - loss 0.03560345 - time (sec): 253.11 - samples/sec: 4971.13 - lr: 0.100000 +2023-04-06 09:02:01,837 epoch 60 - iter 1860/3720 - loss 0.03565454 - time (sec): 315.85 - samples/sec: 4981.76 - lr: 0.100000 +2023-04-06 09:03:04,547 epoch 60 - iter 2232/3720 - loss 0.03556429 - time (sec): 378.56 - samples/sec: 4994.56 - lr: 0.100000 +2023-04-06 09:04:07,043 epoch 60 - iter 2604/3720 - loss 0.03559014 - time (sec): 441.05 - samples/sec: 5001.07 - lr: 0.100000 +2023-04-06 09:05:09,498 epoch 60 - iter 2976/3720 - loss 0.03561401 - time (sec): 503.51 - samples/sec: 5006.08 - lr: 0.100000 +2023-04-06 09:06:12,947 epoch 60 - iter 3348/3720 - loss 0.03585984 - time (sec): 566.96 - samples/sec: 5004.68 - lr: 0.100000 +2023-04-06 09:07:15,771 epoch 60 - iter 3720/3720 - loss 0.03574776 - time (sec): 629.78 - samples/sec: 5004.45 - lr: 0.100000 +2023-04-06 09:07:15,771 ---------------------------------------------------------------------------------------------------- +2023-04-06 09:07:15,771 EPOCH 60 done: loss 0.0357 - lr 0.100000 +2023-04-06 09:07:15,771 BAD EPOCHS (no improvement): 3 +2023-04-06 09:07:15,774 ---------------------------------------------------------------------------------------------------- +2023-04-06 09:08:19,663 epoch 61 - iter 372/3720 - loss 0.03401490 - time (sec): 63.89 - samples/sec: 4961.70 - lr: 0.100000 +2023-04-06 09:09:23,952 epoch 61 - iter 744/3720 - loss 0.03514973 - time (sec): 128.18 - samples/sec: 4943.16 - lr: 0.100000 +2023-04-06 09:10:28,106 epoch 61 - iter 1116/3720 - loss 0.03528165 - time (sec): 192.33 - samples/sec: 4931.53 - lr: 0.100000 +2023-04-06 09:11:31,644 epoch 61 - iter 1488/3720 - loss 0.03550286 - time (sec): 255.87 - samples/sec: 4940.67 - lr: 0.100000 +2023-04-06 09:12:36,190 epoch 61 - iter 1860/3720 - loss 0.03553016 - time (sec): 320.42 - samples/sec: 4925.97 - lr: 0.100000 +2023-04-06 09:13:40,262 epoch 61 - iter 2232/3720 - loss 0.03560856 - time (sec): 384.49 - samples/sec: 4923.30 - lr: 0.100000 +2023-04-06 09:14:41,795 epoch 61 - iter 2604/3720 - loss 0.03554887 - time (sec): 446.02 - samples/sec: 4945.73 - lr: 0.100000 +2023-04-06 09:15:45,261 epoch 61 - iter 2976/3720 - loss 0.03569112 - time (sec): 509.49 - samples/sec: 4945.71 - lr: 0.100000 +2023-04-06 09:16:49,312 epoch 61 - iter 3348/3720 - loss 0.03566798 - time (sec): 573.54 - samples/sec: 4945.05 - lr: 0.100000 +2023-04-06 09:17:53,366 epoch 61 - iter 3720/3720 - loss 0.03574582 - time (sec): 637.59 - samples/sec: 4943.15 - lr: 0.100000 +2023-04-06 09:17:53,366 ---------------------------------------------------------------------------------------------------- +2023-04-06 09:17:53,367 EPOCH 61 done: loss 0.0357 - lr 0.100000 +2023-04-06 09:17:53,367 Epoch 61: reducing learning rate of group 0 to 5.0000e-02. +2023-04-06 09:17:53,367 BAD EPOCHS (no improvement): 4 +2023-04-06 09:17:53,370 ---------------------------------------------------------------------------------------------------- +2023-04-06 09:18:57,578 epoch 62 - iter 372/3720 - loss 0.03497989 - time (sec): 64.21 - samples/sec: 4906.84 - lr: 0.050000 +2023-04-06 09:20:00,256 epoch 62 - iter 744/3720 - loss 0.03456611 - time (sec): 126.89 - samples/sec: 4962.01 - lr: 0.050000 +2023-04-06 09:21:04,208 epoch 62 - iter 1116/3720 - loss 0.03419942 - time (sec): 190.84 - samples/sec: 4956.90 - lr: 0.050000 +2023-04-06 09:22:08,550 epoch 62 - iter 1488/3720 - loss 0.03429432 - time (sec): 255.18 - samples/sec: 4947.79 - lr: 0.050000 +2023-04-06 09:23:12,615 epoch 62 - iter 1860/3720 - loss 0.03407697 - time (sec): 319.24 - samples/sec: 4942.36 - lr: 0.050000 +2023-04-06 09:24:16,266 epoch 62 - iter 2232/3720 - loss 0.03392393 - time (sec): 382.90 - samples/sec: 4943.70 - lr: 0.050000 +2023-04-06 09:25:19,468 epoch 62 - iter 2604/3720 - loss 0.03382584 - time (sec): 446.10 - samples/sec: 4945.27 - lr: 0.050000 +2023-04-06 09:26:23,186 epoch 62 - iter 2976/3720 - loss 0.03374750 - time (sec): 509.82 - samples/sec: 4948.55 - lr: 0.050000 +2023-04-06 09:27:26,185 epoch 62 - iter 3348/3720 - loss 0.03366302 - time (sec): 572.82 - samples/sec: 4952.68 - lr: 0.050000 +2023-04-06 09:28:30,000 epoch 62 - iter 3720/3720 - loss 0.03361755 - time (sec): 636.63 - samples/sec: 4950.62 - lr: 0.050000 +2023-04-06 09:28:30,000 ---------------------------------------------------------------------------------------------------- +2023-04-06 09:28:30,000 EPOCH 62 done: loss 0.0336 - lr 0.050000 +2023-04-06 09:28:30,000 BAD EPOCHS (no improvement): 0 +2023-04-06 09:28:30,003 ---------------------------------------------------------------------------------------------------- +2023-04-06 09:29:33,070 epoch 63 - iter 372/3720 - loss 0.03225239 - time (sec): 63.07 - samples/sec: 4993.12 - lr: 0.050000 +2023-04-06 09:30:36,787 epoch 63 - iter 744/3720 - loss 0.03250590 - time (sec): 126.78 - samples/sec: 4976.52 - lr: 0.050000 +2023-04-06 09:31:39,314 epoch 63 - iter 1116/3720 - loss 0.03295037 - time (sec): 189.31 - samples/sec: 4989.73 - lr: 0.050000 +2023-04-06 09:32:43,392 epoch 63 - iter 1488/3720 - loss 0.03312255 - time (sec): 253.39 - samples/sec: 4966.39 - lr: 0.050000 +2023-04-06 09:33:45,454 epoch 63 - iter 1860/3720 - loss 0.03310235 - time (sec): 315.45 - samples/sec: 4983.17 - lr: 0.050000 +2023-04-06 09:34:49,567 epoch 63 - iter 2232/3720 - loss 0.03292022 - time (sec): 379.56 - samples/sec: 4972.51 - lr: 0.050000 +2023-04-06 09:35:51,932 epoch 63 - iter 2604/3720 - loss 0.03302965 - time (sec): 441.93 - samples/sec: 4979.96 - lr: 0.050000 +2023-04-06 09:36:56,519 epoch 63 - iter 2976/3720 - loss 0.03279925 - time (sec): 506.52 - samples/sec: 4971.89 - lr: 0.050000 +2023-04-06 09:38:00,666 epoch 63 - iter 3348/3720 - loss 0.03265644 - time (sec): 570.66 - samples/sec: 4967.93 - lr: 0.050000 +2023-04-06 09:39:04,150 epoch 63 - iter 3720/3720 - loss 0.03264588 - time (sec): 634.15 - samples/sec: 4970.00 - lr: 0.050000 +2023-04-06 09:39:04,150 ---------------------------------------------------------------------------------------------------- +2023-04-06 09:39:04,150 EPOCH 63 done: loss 0.0326 - lr 0.050000 +2023-04-06 09:39:04,150 BAD EPOCHS (no improvement): 0 +2023-04-06 09:39:04,154 ---------------------------------------------------------------------------------------------------- +2023-04-06 09:40:07,911 epoch 64 - iter 372/3720 - loss 0.03273274 - time (sec): 63.76 - samples/sec: 4956.71 - lr: 0.050000 +2023-04-06 09:41:10,461 epoch 64 - iter 744/3720 - loss 0.03207882 - time (sec): 126.31 - samples/sec: 4991.07 - lr: 0.050000 +2023-04-06 09:42:14,418 epoch 64 - iter 1116/3720 - loss 0.03240069 - time (sec): 190.26 - samples/sec: 4966.45 - lr: 0.050000 +2023-04-06 09:43:17,666 epoch 64 - iter 1488/3720 - loss 0.03244033 - time (sec): 253.51 - samples/sec: 4966.85 - lr: 0.050000 +2023-04-06 09:44:20,296 epoch 64 - iter 1860/3720 - loss 0.03236251 - time (sec): 316.14 - samples/sec: 4974.35 - lr: 0.050000 +2023-04-06 09:45:25,031 epoch 64 - iter 2232/3720 - loss 0.03243121 - time (sec): 380.88 - samples/sec: 4963.60 - lr: 0.050000 +2023-04-06 09:46:28,885 epoch 64 - iter 2604/3720 - loss 0.03231516 - time (sec): 444.73 - samples/sec: 4960.12 - lr: 0.050000 +2023-04-06 09:47:32,235 epoch 64 - iter 2976/3720 - loss 0.03241879 - time (sec): 508.08 - samples/sec: 4964.27 - lr: 0.050000 +2023-04-06 09:48:36,050 epoch 64 - iter 3348/3720 - loss 0.03239816 - time (sec): 571.90 - samples/sec: 4961.55 - lr: 0.050000 +2023-04-06 09:49:39,630 epoch 64 - iter 3720/3720 - loss 0.03239631 - time (sec): 635.48 - samples/sec: 4959.61 - lr: 0.050000 +2023-04-06 09:49:39,630 ---------------------------------------------------------------------------------------------------- +2023-04-06 09:49:39,630 EPOCH 64 done: loss 0.0324 - lr 0.050000 +2023-04-06 09:49:39,630 BAD EPOCHS (no improvement): 0 +2023-04-06 09:49:39,633 ---------------------------------------------------------------------------------------------------- +2023-04-06 09:50:43,116 epoch 65 - iter 372/3720 - loss 0.03289786 - time (sec): 63.48 - samples/sec: 4957.24 - lr: 0.050000 +2023-04-06 09:51:46,500 epoch 65 - iter 744/3720 - loss 0.03221444 - time (sec): 126.87 - samples/sec: 4953.63 - lr: 0.050000 +2023-04-06 09:52:50,737 epoch 65 - iter 1116/3720 - loss 0.03234440 - time (sec): 191.10 - samples/sec: 4937.75 - lr: 0.050000 +2023-04-06 09:53:53,592 epoch 65 - iter 1488/3720 - loss 0.03225068 - time (sec): 253.96 - samples/sec: 4947.51 - lr: 0.050000 +2023-04-06 09:54:58,174 epoch 65 - iter 1860/3720 - loss 0.03220238 - time (sec): 318.54 - samples/sec: 4937.14 - lr: 0.050000 +2023-04-06 09:56:02,536 epoch 65 - iter 2232/3720 - loss 0.03211585 - time (sec): 382.90 - samples/sec: 4930.14 - lr: 0.050000 +2023-04-06 09:57:06,298 epoch 65 - iter 2604/3720 - loss 0.03212059 - time (sec): 446.67 - samples/sec: 4929.46 - lr: 0.050000 +2023-04-06 09:58:10,404 epoch 65 - iter 2976/3720 - loss 0.03209122 - time (sec): 510.77 - samples/sec: 4930.02 - lr: 0.050000 +2023-04-06 09:59:13,868 epoch 65 - iter 3348/3720 - loss 0.03201975 - time (sec): 574.24 - samples/sec: 4933.73 - lr: 0.050000 +2023-04-06 10:00:17,763 epoch 65 - iter 3720/3720 - loss 0.03191218 - time (sec): 638.13 - samples/sec: 4938.98 - lr: 0.050000 +2023-04-06 10:00:17,763 ---------------------------------------------------------------------------------------------------- +2023-04-06 10:00:17,763 EPOCH 65 done: loss 0.0319 - lr 0.050000 +2023-04-06 10:00:17,763 BAD EPOCHS (no improvement): 0 +2023-04-06 10:00:17,766 ---------------------------------------------------------------------------------------------------- +2023-04-06 10:01:20,365 epoch 66 - iter 372/3720 - loss 0.03180213 - time (sec): 62.60 - samples/sec: 4986.99 - lr: 0.050000 +2023-04-06 10:02:24,776 epoch 66 - iter 744/3720 - loss 0.03214387 - time (sec): 127.01 - samples/sec: 4974.10 - lr: 0.050000 +2023-04-06 10:03:26,943 epoch 66 - iter 1116/3720 - loss 0.03205532 - time (sec): 189.18 - samples/sec: 5006.82 - lr: 0.050000 +2023-04-06 10:04:30,066 epoch 66 - iter 1488/3720 - loss 0.03196585 - time (sec): 252.30 - samples/sec: 5001.92 - lr: 0.050000 +2023-04-06 10:05:33,207 epoch 66 - iter 1860/3720 - loss 0.03187393 - time (sec): 315.44 - samples/sec: 4998.37 - lr: 0.050000 +2023-04-06 10:06:36,121 epoch 66 - iter 2232/3720 - loss 0.03190732 - time (sec): 378.36 - samples/sec: 5000.72 - lr: 0.050000 +2023-04-06 10:07:39,422 epoch 66 - iter 2604/3720 - loss 0.03194692 - time (sec): 441.66 - samples/sec: 5000.81 - lr: 0.050000 +2023-04-06 10:08:42,308 epoch 66 - iter 2976/3720 - loss 0.03192703 - time (sec): 504.54 - samples/sec: 4998.84 - lr: 0.050000 +2023-04-06 10:09:45,643 epoch 66 - iter 3348/3720 - loss 0.03190535 - time (sec): 567.88 - samples/sec: 4995.70 - lr: 0.050000 +2023-04-06 10:10:48,607 epoch 66 - iter 3720/3720 - loss 0.03205002 - time (sec): 630.84 - samples/sec: 4996.05 - lr: 0.050000 +2023-04-06 10:10:48,608 ---------------------------------------------------------------------------------------------------- +2023-04-06 10:10:48,608 EPOCH 66 done: loss 0.0321 - lr 0.050000 +2023-04-06 10:10:48,608 BAD EPOCHS (no improvement): 1 +2023-04-06 10:10:48,611 ---------------------------------------------------------------------------------------------------- +2023-04-06 10:11:51,553 epoch 67 - iter 372/3720 - loss 0.03197003 - time (sec): 62.94 - samples/sec: 5006.72 - lr: 0.050000 +2023-04-06 10:12:55,384 epoch 67 - iter 744/3720 - loss 0.03167444 - time (sec): 126.77 - samples/sec: 4979.36 - lr: 0.050000 +2023-04-06 10:13:59,031 epoch 67 - iter 1116/3720 - loss 0.03179666 - time (sec): 190.42 - samples/sec: 4965.30 - lr: 0.050000 +2023-04-06 10:15:02,813 epoch 67 - iter 1488/3720 - loss 0.03166737 - time (sec): 254.20 - samples/sec: 4961.16 - lr: 0.050000 +2023-04-06 10:16:06,300 epoch 67 - iter 1860/3720 - loss 0.03170742 - time (sec): 317.69 - samples/sec: 4969.39 - lr: 0.050000 +2023-04-06 10:17:09,727 epoch 67 - iter 2232/3720 - loss 0.03181418 - time (sec): 381.12 - samples/sec: 4966.40 - lr: 0.050000 +2023-04-06 10:18:14,122 epoch 67 - iter 2604/3720 - loss 0.03163692 - time (sec): 445.51 - samples/sec: 4958.38 - lr: 0.050000 +2023-04-06 10:19:17,530 epoch 67 - iter 2976/3720 - loss 0.03167661 - time (sec): 508.92 - samples/sec: 4955.14 - lr: 0.050000 +2023-04-06 10:20:20,171 epoch 67 - iter 3348/3720 - loss 0.03166178 - time (sec): 571.56 - samples/sec: 4963.69 - lr: 0.050000 +2023-04-06 10:21:22,597 epoch 67 - iter 3720/3720 - loss 0.03171928 - time (sec): 633.99 - samples/sec: 4971.27 - lr: 0.050000 +2023-04-06 10:21:22,597 ---------------------------------------------------------------------------------------------------- +2023-04-06 10:21:22,597 EPOCH 67 done: loss 0.0317 - lr 0.050000 +2023-04-06 10:21:22,597 BAD EPOCHS (no improvement): 0 +2023-04-06 10:21:22,600 ---------------------------------------------------------------------------------------------------- +2023-04-06 10:22:26,310 epoch 68 - iter 372/3720 - loss 0.03161777 - time (sec): 63.71 - samples/sec: 4940.03 - lr: 0.050000 +2023-04-06 10:23:30,377 epoch 68 - iter 744/3720 - loss 0.03148526 - time (sec): 127.78 - samples/sec: 4928.76 - lr: 0.050000 +2023-04-06 10:24:33,195 epoch 68 - iter 1116/3720 - loss 0.03186291 - time (sec): 190.59 - samples/sec: 4956.30 - lr: 0.050000 +2023-04-06 10:25:36,342 epoch 68 - iter 1488/3720 - loss 0.03175793 - time (sec): 253.74 - samples/sec: 4966.81 - lr: 0.050000 +2023-04-06 10:26:41,348 epoch 68 - iter 1860/3720 - loss 0.03156923 - time (sec): 318.75 - samples/sec: 4945.81 - lr: 0.050000 +2023-04-06 10:27:45,571 epoch 68 - iter 2232/3720 - loss 0.03161897 - time (sec): 382.97 - samples/sec: 4940.10 - lr: 0.050000 +2023-04-06 10:28:49,262 epoch 68 - iter 2604/3720 - loss 0.03165787 - time (sec): 446.66 - samples/sec: 4942.58 - lr: 0.050000 +2023-04-06 10:29:53,924 epoch 68 - iter 2976/3720 - loss 0.03164836 - time (sec): 511.32 - samples/sec: 4934.19 - lr: 0.050000 +2023-04-06 10:30:57,633 epoch 68 - iter 3348/3720 - loss 0.03158081 - time (sec): 575.03 - samples/sec: 4935.44 - lr: 0.050000 +2023-04-06 10:32:00,786 epoch 68 - iter 3720/3720 - loss 0.03160046 - time (sec): 638.19 - samples/sec: 4938.55 - lr: 0.050000 +2023-04-06 10:32:00,786 ---------------------------------------------------------------------------------------------------- +2023-04-06 10:32:00,786 EPOCH 68 done: loss 0.0316 - lr 0.050000 +2023-04-06 10:32:00,786 BAD EPOCHS (no improvement): 0 +2023-04-06 10:32:00,789 ---------------------------------------------------------------------------------------------------- +2023-04-06 10:33:04,937 epoch 69 - iter 372/3720 - loss 0.03135092 - time (sec): 64.15 - samples/sec: 4939.21 - lr: 0.050000 +2023-04-06 10:34:07,030 epoch 69 - iter 744/3720 - loss 0.03094274 - time (sec): 126.24 - samples/sec: 4971.53 - lr: 0.050000 +2023-04-06 10:35:11,016 epoch 69 - iter 1116/3720 - loss 0.03116561 - time (sec): 190.23 - samples/sec: 4959.15 - lr: 0.050000 +2023-04-06 10:36:15,342 epoch 69 - iter 1488/3720 - loss 0.03126021 - time (sec): 254.55 - samples/sec: 4945.28 - lr: 0.050000 +2023-04-06 10:37:18,675 epoch 69 - iter 1860/3720 - loss 0.03134390 - time (sec): 317.89 - samples/sec: 4949.61 - lr: 0.050000 +2023-04-06 10:38:22,341 epoch 69 - iter 2232/3720 - loss 0.03134850 - time (sec): 381.55 - samples/sec: 4949.88 - lr: 0.050000 +2023-04-06 10:39:25,106 epoch 69 - iter 2604/3720 - loss 0.03142628 - time (sec): 444.32 - samples/sec: 4958.11 - lr: 0.050000 +2023-04-06 10:40:28,241 epoch 69 - iter 2976/3720 - loss 0.03136588 - time (sec): 507.45 - samples/sec: 4960.83 - lr: 0.050000 +2023-04-06 10:41:32,561 epoch 69 - iter 3348/3720 - loss 0.03130388 - time (sec): 571.77 - samples/sec: 4957.56 - lr: 0.050000 +2023-04-06 10:42:36,606 epoch 69 - iter 3720/3720 - loss 0.03130843 - time (sec): 635.82 - samples/sec: 4956.95 - lr: 0.050000 +2023-04-06 10:42:36,607 ---------------------------------------------------------------------------------------------------- +2023-04-06 10:42:36,607 EPOCH 69 done: loss 0.0313 - lr 0.050000 +2023-04-06 10:42:36,607 BAD EPOCHS (no improvement): 0 +2023-04-06 10:42:36,609 ---------------------------------------------------------------------------------------------------- +2023-04-06 10:43:40,981 epoch 70 - iter 372/3720 - loss 0.03116412 - time (sec): 64.37 - samples/sec: 4901.70 - lr: 0.050000 +2023-04-06 10:44:44,319 epoch 70 - iter 744/3720 - loss 0.03118096 - time (sec): 127.71 - samples/sec: 4940.06 - lr: 0.050000 +2023-04-06 10:45:48,485 epoch 70 - iter 1116/3720 - loss 0.03090943 - time (sec): 191.88 - samples/sec: 4929.28 - lr: 0.050000 +2023-04-06 10:46:52,519 epoch 70 - iter 1488/3720 - loss 0.03093912 - time (sec): 255.91 - samples/sec: 4927.35 - lr: 0.050000 +2023-04-06 10:47:55,740 epoch 70 - iter 1860/3720 - loss 0.03096841 - time (sec): 319.13 - samples/sec: 4924.15 - lr: 0.050000 +2023-04-06 10:48:59,477 epoch 70 - iter 2232/3720 - loss 0.03105662 - time (sec): 382.87 - samples/sec: 4924.60 - lr: 0.050000 +2023-04-06 10:50:02,531 epoch 70 - iter 2604/3720 - loss 0.03118693 - time (sec): 445.92 - samples/sec: 4940.22 - lr: 0.050000 +2023-04-06 10:51:06,113 epoch 70 - iter 2976/3720 - loss 0.03112537 - time (sec): 509.50 - samples/sec: 4946.77 - lr: 0.050000 +2023-04-06 10:52:09,431 epoch 70 - iter 3348/3720 - loss 0.03118119 - time (sec): 572.82 - samples/sec: 4951.62 - lr: 0.050000 +2023-04-06 10:53:14,212 epoch 70 - iter 3720/3720 - loss 0.03123392 - time (sec): 637.60 - samples/sec: 4943.06 - lr: 0.050000 +2023-04-06 10:53:14,213 ---------------------------------------------------------------------------------------------------- +2023-04-06 10:53:14,213 EPOCH 70 done: loss 0.0312 - lr 0.050000 +2023-04-06 10:53:14,213 BAD EPOCHS (no improvement): 0 +2023-04-06 10:53:14,216 ---------------------------------------------------------------------------------------------------- +2023-04-06 10:54:18,318 epoch 71 - iter 372/3720 - loss 0.03113377 - time (sec): 64.10 - samples/sec: 4917.96 - lr: 0.050000 +2023-04-06 10:55:20,822 epoch 71 - iter 744/3720 - loss 0.03099367 - time (sec): 126.61 - samples/sec: 4957.95 - lr: 0.050000 +2023-04-06 10:56:24,775 epoch 71 - iter 1116/3720 - loss 0.03123187 - time (sec): 190.56 - samples/sec: 4951.11 - lr: 0.050000 +2023-04-06 10:57:28,392 epoch 71 - iter 1488/3720 - loss 0.03104929 - time (sec): 254.18 - samples/sec: 4961.57 - lr: 0.050000 +2023-04-06 10:58:31,773 epoch 71 - iter 1860/3720 - loss 0.03090814 - time (sec): 317.56 - samples/sec: 4967.05 - lr: 0.050000 +2023-04-06 10:59:33,384 epoch 71 - iter 2232/3720 - loss 0.03101887 - time (sec): 379.17 - samples/sec: 4986.04 - lr: 0.050000 +2023-04-06 11:00:38,316 epoch 71 - iter 2604/3720 - loss 0.03107583 - time (sec): 444.10 - samples/sec: 4968.86 - lr: 0.050000 +2023-04-06 11:01:41,235 epoch 71 - iter 2976/3720 - loss 0.03110385 - time (sec): 507.02 - samples/sec: 4969.69 - lr: 0.050000 +2023-04-06 11:02:44,951 epoch 71 - iter 3348/3720 - loss 0.03109594 - time (sec): 570.74 - samples/sec: 4969.12 - lr: 0.050000 +2023-04-06 11:03:48,078 epoch 71 - iter 3720/3720 - loss 0.03099105 - time (sec): 633.86 - samples/sec: 4972.24 - lr: 0.050000 +2023-04-06 11:03:48,078 ---------------------------------------------------------------------------------------------------- +2023-04-06 11:03:48,078 EPOCH 71 done: loss 0.0310 - lr 0.050000 +2023-04-06 11:03:48,078 BAD EPOCHS (no improvement): 0 +2023-04-06 11:03:48,082 ---------------------------------------------------------------------------------------------------- +2023-04-06 11:04:51,421 epoch 72 - iter 372/3720 - loss 0.03013338 - time (sec): 63.34 - samples/sec: 4976.42 - lr: 0.050000 +2023-04-06 11:05:54,665 epoch 72 - iter 744/3720 - loss 0.03050364 - time (sec): 126.58 - samples/sec: 4975.09 - lr: 0.050000 +2023-04-06 11:06:56,685 epoch 72 - iter 1116/3720 - loss 0.03046667 - time (sec): 188.60 - samples/sec: 5008.99 - lr: 0.050000 +2023-04-06 11:07:59,410 epoch 72 - iter 1488/3720 - loss 0.03057755 - time (sec): 251.33 - samples/sec: 5009.60 - lr: 0.050000 +2023-04-06 11:09:00,391 epoch 72 - iter 1860/3720 - loss 0.03058173 - time (sec): 312.31 - samples/sec: 5038.96 - lr: 0.050000 +2023-04-06 11:10:04,729 epoch 72 - iter 2232/3720 - loss 0.03055907 - time (sec): 376.65 - samples/sec: 5020.39 - lr: 0.050000 +2023-04-06 11:11:08,809 epoch 72 - iter 2604/3720 - loss 0.03064763 - time (sec): 440.73 - samples/sec: 5003.90 - lr: 0.050000 +2023-04-06 11:12:12,462 epoch 72 - iter 2976/3720 - loss 0.03068538 - time (sec): 504.38 - samples/sec: 4997.32 - lr: 0.050000 +2023-04-06 11:13:16,757 epoch 72 - iter 3348/3720 - loss 0.03079806 - time (sec): 568.68 - samples/sec: 4985.31 - lr: 0.050000 +2023-04-06 11:14:20,977 epoch 72 - iter 3720/3720 - loss 0.03080137 - time (sec): 632.90 - samples/sec: 4979.83 - lr: 0.050000 +2023-04-06 11:14:20,978 ---------------------------------------------------------------------------------------------------- +2023-04-06 11:14:20,978 EPOCH 72 done: loss 0.0308 - lr 0.050000 +2023-04-06 11:14:20,978 BAD EPOCHS (no improvement): 0 +2023-04-06 11:14:20,982 ---------------------------------------------------------------------------------------------------- +2023-04-06 11:15:25,313 epoch 73 - iter 372/3720 - loss 0.03065767 - time (sec): 64.33 - samples/sec: 4924.92 - lr: 0.050000 +2023-04-06 11:16:29,963 epoch 73 - iter 744/3720 - loss 0.03055942 - time (sec): 128.98 - samples/sec: 4906.21 - lr: 0.050000 +2023-04-06 11:17:33,123 epoch 73 - iter 1116/3720 - loss 0.03072176 - time (sec): 192.14 - samples/sec: 4923.46 - lr: 0.050000 +2023-04-06 11:18:36,847 epoch 73 - iter 1488/3720 - loss 0.03048773 - time (sec): 255.87 - samples/sec: 4933.71 - lr: 0.050000 +2023-04-06 11:19:39,856 epoch 73 - iter 1860/3720 - loss 0.03055045 - time (sec): 318.87 - samples/sec: 4944.90 - lr: 0.050000 +2023-04-06 11:20:44,634 epoch 73 - iter 2232/3720 - loss 0.03045798 - time (sec): 383.65 - samples/sec: 4936.56 - lr: 0.050000 +2023-04-06 11:21:46,138 epoch 73 - iter 2604/3720 - loss 0.03051092 - time (sec): 445.16 - samples/sec: 4958.72 - lr: 0.050000 +2023-04-06 11:22:49,617 epoch 73 - iter 2976/3720 - loss 0.03058982 - time (sec): 508.63 - samples/sec: 4959.01 - lr: 0.050000 +2023-04-06 11:23:53,461 epoch 73 - iter 3348/3720 - loss 0.03067650 - time (sec): 572.48 - samples/sec: 4955.73 - lr: 0.050000 +2023-04-06 11:24:57,226 epoch 73 - iter 3720/3720 - loss 0.03066288 - time (sec): 636.24 - samples/sec: 4953.62 - lr: 0.050000 +2023-04-06 11:24:57,226 ---------------------------------------------------------------------------------------------------- +2023-04-06 11:24:57,226 EPOCH 73 done: loss 0.0307 - lr 0.050000 +2023-04-06 11:24:57,226 BAD EPOCHS (no improvement): 0 +2023-04-06 11:24:57,230 ---------------------------------------------------------------------------------------------------- +2023-04-06 11:25:59,629 epoch 74 - iter 372/3720 - loss 0.03113534 - time (sec): 62.40 - samples/sec: 5008.36 - lr: 0.050000 +2023-04-06 11:27:03,370 epoch 74 - iter 744/3720 - loss 0.03054291 - time (sec): 126.14 - samples/sec: 4994.88 - lr: 0.050000 +2023-04-06 11:28:07,338 epoch 74 - iter 1116/3720 - loss 0.03034973 - time (sec): 190.11 - samples/sec: 4982.07 - lr: 0.050000 +2023-04-06 11:29:10,508 epoch 74 - iter 1488/3720 - loss 0.03051028 - time (sec): 253.28 - samples/sec: 4981.10 - lr: 0.050000 +2023-04-06 11:30:14,732 epoch 74 - iter 1860/3720 - loss 0.03053525 - time (sec): 317.50 - samples/sec: 4962.14 - lr: 0.050000 +2023-04-06 11:31:18,305 epoch 74 - iter 2232/3720 - loss 0.03054710 - time (sec): 381.08 - samples/sec: 4954.37 - lr: 0.050000 +2023-04-06 11:32:22,559 epoch 74 - iter 2604/3720 - loss 0.03053230 - time (sec): 445.33 - samples/sec: 4952.66 - lr: 0.050000 +2023-04-06 11:33:25,938 epoch 74 - iter 2976/3720 - loss 0.03060414 - time (sec): 508.71 - samples/sec: 4952.37 - lr: 0.050000 +2023-04-06 11:34:28,978 epoch 74 - iter 3348/3720 - loss 0.03073909 - time (sec): 571.75 - samples/sec: 4956.25 - lr: 0.050000 +2023-04-06 11:35:33,510 epoch 74 - iter 3720/3720 - loss 0.03073551 - time (sec): 636.28 - samples/sec: 4953.34 - lr: 0.050000 +2023-04-06 11:35:33,510 ---------------------------------------------------------------------------------------------------- +2023-04-06 11:35:33,510 EPOCH 74 done: loss 0.0307 - lr 0.050000 +2023-04-06 11:35:33,510 BAD EPOCHS (no improvement): 1 +2023-04-06 11:35:33,514 ---------------------------------------------------------------------------------------------------- +2023-04-06 11:36:37,175 epoch 75 - iter 372/3720 - loss 0.02962953 - time (sec): 63.66 - samples/sec: 4984.36 - lr: 0.050000 +2023-04-06 11:37:41,521 epoch 75 - iter 744/3720 - loss 0.02998085 - time (sec): 128.01 - samples/sec: 4947.37 - lr: 0.050000 +2023-04-06 11:38:45,839 epoch 75 - iter 1116/3720 - loss 0.03047575 - time (sec): 192.33 - samples/sec: 4941.67 - lr: 0.050000 +2023-04-06 11:39:49,011 epoch 75 - iter 1488/3720 - loss 0.03015728 - time (sec): 255.50 - samples/sec: 4956.57 - lr: 0.050000 +2023-04-06 11:40:52,219 epoch 75 - iter 1860/3720 - loss 0.03017682 - time (sec): 318.70 - samples/sec: 4959.20 - lr: 0.050000 +2023-04-06 11:41:54,500 epoch 75 - iter 2232/3720 - loss 0.03046283 - time (sec): 380.99 - samples/sec: 4973.68 - lr: 0.050000 +2023-04-06 11:42:56,958 epoch 75 - iter 2604/3720 - loss 0.03051771 - time (sec): 443.44 - samples/sec: 4976.67 - lr: 0.050000 +2023-04-06 11:44:00,143 epoch 75 - iter 2976/3720 - loss 0.03053466 - time (sec): 506.63 - samples/sec: 4980.69 - lr: 0.050000 +2023-04-06 11:45:03,004 epoch 75 - iter 3348/3720 - loss 0.03053358 - time (sec): 569.49 - samples/sec: 4982.58 - lr: 0.050000 +2023-04-06 11:46:06,889 epoch 75 - iter 3720/3720 - loss 0.03052326 - time (sec): 633.37 - samples/sec: 4976.06 - lr: 0.050000 +2023-04-06 11:46:06,889 ---------------------------------------------------------------------------------------------------- +2023-04-06 11:46:06,889 EPOCH 75 done: loss 0.0305 - lr 0.050000 +2023-04-06 11:46:06,889 BAD EPOCHS (no improvement): 0 +2023-04-06 11:46:06,892 ---------------------------------------------------------------------------------------------------- +2023-04-06 11:47:10,468 epoch 76 - iter 372/3720 - loss 0.03043636 - time (sec): 63.58 - samples/sec: 4976.19 - lr: 0.050000 +2023-04-06 11:48:14,365 epoch 76 - iter 744/3720 - loss 0.03054553 - time (sec): 127.47 - samples/sec: 4949.69 - lr: 0.050000 +2023-04-06 11:49:18,478 epoch 76 - iter 1116/3720 - loss 0.03041469 - time (sec): 191.59 - samples/sec: 4946.42 - lr: 0.050000 +2023-04-06 11:50:20,803 epoch 76 - iter 1488/3720 - loss 0.03043815 - time (sec): 253.91 - samples/sec: 4961.30 - lr: 0.050000 +2023-04-06 11:51:24,769 epoch 76 - iter 1860/3720 - loss 0.03060184 - time (sec): 317.88 - samples/sec: 4949.65 - lr: 0.050000 +2023-04-06 11:52:28,905 epoch 76 - iter 2232/3720 - loss 0.03052971 - time (sec): 382.01 - samples/sec: 4945.22 - lr: 0.050000 +2023-04-06 11:53:32,705 epoch 76 - iter 2604/3720 - loss 0.03047486 - time (sec): 445.81 - samples/sec: 4944.69 - lr: 0.050000 +2023-04-06 11:54:36,541 epoch 76 - iter 2976/3720 - loss 0.03056677 - time (sec): 509.65 - samples/sec: 4945.04 - lr: 0.050000 +2023-04-06 11:55:41,564 epoch 76 - iter 3348/3720 - loss 0.03062374 - time (sec): 574.67 - samples/sec: 4938.42 - lr: 0.050000 +2023-04-06 11:56:45,199 epoch 76 - iter 3720/3720 - loss 0.03076034 - time (sec): 638.31 - samples/sec: 4937.61 - lr: 0.050000 +2023-04-06 11:56:45,199 ---------------------------------------------------------------------------------------------------- +2023-04-06 11:56:45,199 EPOCH 76 done: loss 0.0308 - lr 0.050000 +2023-04-06 11:56:45,199 BAD EPOCHS (no improvement): 1 +2023-04-06 11:56:45,203 ---------------------------------------------------------------------------------------------------- +2023-04-06 11:57:48,768 epoch 77 - iter 372/3720 - loss 0.02994766 - time (sec): 63.57 - samples/sec: 4970.58 - lr: 0.050000 +2023-04-06 11:58:52,262 epoch 77 - iter 744/3720 - loss 0.02974964 - time (sec): 127.06 - samples/sec: 4941.68 - lr: 0.050000 +2023-04-06 11:59:56,463 epoch 77 - iter 1116/3720 - loss 0.03004014 - time (sec): 191.26 - samples/sec: 4924.04 - lr: 0.050000 +2023-04-06 12:01:00,778 epoch 77 - iter 1488/3720 - loss 0.02998906 - time (sec): 255.57 - samples/sec: 4923.95 - lr: 0.050000 +2023-04-06 12:02:04,092 epoch 77 - iter 1860/3720 - loss 0.03021740 - time (sec): 318.89 - samples/sec: 4934.46 - lr: 0.050000 +2023-04-06 12:03:07,272 epoch 77 - iter 2232/3720 - loss 0.03039703 - time (sec): 382.07 - samples/sec: 4941.79 - lr: 0.050000 +2023-04-06 12:04:11,226 epoch 77 - iter 2604/3720 - loss 0.03051115 - time (sec): 446.02 - samples/sec: 4941.60 - lr: 0.050000 +2023-04-06 12:05:15,619 epoch 77 - iter 2976/3720 - loss 0.03050436 - time (sec): 510.42 - samples/sec: 4940.33 - lr: 0.050000 +2023-04-06 12:06:18,391 epoch 77 - iter 3348/3720 - loss 0.03054092 - time (sec): 573.19 - samples/sec: 4949.83 - lr: 0.050000 +2023-04-06 12:07:20,984 epoch 77 - iter 3720/3720 - loss 0.03059546 - time (sec): 635.78 - samples/sec: 4957.23 - lr: 0.050000 +2023-04-06 12:07:20,985 ---------------------------------------------------------------------------------------------------- +2023-04-06 12:07:20,985 EPOCH 77 done: loss 0.0306 - lr 0.050000 +2023-04-06 12:07:20,985 BAD EPOCHS (no improvement): 2 +2023-04-06 12:07:20,988 ---------------------------------------------------------------------------------------------------- +2023-04-06 12:08:24,842 epoch 78 - iter 372/3720 - loss 0.03085487 - time (sec): 63.85 - samples/sec: 4952.46 - lr: 0.050000 +2023-04-06 12:09:28,667 epoch 78 - iter 744/3720 - loss 0.03053833 - time (sec): 127.68 - samples/sec: 4940.54 - lr: 0.050000 +2023-04-06 12:10:31,054 epoch 78 - iter 1116/3720 - loss 0.03042577 - time (sec): 190.07 - samples/sec: 4975.15 - lr: 0.050000 +2023-04-06 12:11:35,363 epoch 78 - iter 1488/3720 - loss 0.03042125 - time (sec): 254.38 - samples/sec: 4961.07 - lr: 0.050000 +2023-04-06 12:12:37,842 epoch 78 - iter 1860/3720 - loss 0.03051081 - time (sec): 316.85 - samples/sec: 4978.06 - lr: 0.050000 +2023-04-06 12:13:40,485 epoch 78 - iter 2232/3720 - loss 0.03049864 - time (sec): 379.50 - samples/sec: 4987.83 - lr: 0.050000 +2023-04-06 12:14:43,634 epoch 78 - iter 2604/3720 - loss 0.03051224 - time (sec): 442.65 - samples/sec: 4983.42 - lr: 0.050000 +2023-04-06 12:15:45,797 epoch 78 - iter 2976/3720 - loss 0.03058829 - time (sec): 504.81 - samples/sec: 4991.41 - lr: 0.050000 +2023-04-06 12:16:48,842 epoch 78 - iter 3348/3720 - loss 0.03046737 - time (sec): 567.85 - samples/sec: 4992.96 - lr: 0.050000 +2023-04-06 12:17:52,755 epoch 78 - iter 3720/3720 - loss 0.03050550 - time (sec): 631.77 - samples/sec: 4988.72 - lr: 0.050000 +2023-04-06 12:17:52,756 ---------------------------------------------------------------------------------------------------- +2023-04-06 12:17:52,756 EPOCH 78 done: loss 0.0305 - lr 0.050000 +2023-04-06 12:17:52,756 BAD EPOCHS (no improvement): 0 +2023-04-06 12:17:52,759 ---------------------------------------------------------------------------------------------------- +2023-04-06 12:18:57,352 epoch 79 - iter 372/3720 - loss 0.02989969 - time (sec): 64.59 - samples/sec: 4938.78 - lr: 0.050000 +2023-04-06 12:20:00,863 epoch 79 - iter 744/3720 - loss 0.03037559 - time (sec): 128.10 - samples/sec: 4955.85 - lr: 0.050000 +2023-04-06 12:21:04,399 epoch 79 - iter 1116/3720 - loss 0.03013356 - time (sec): 191.64 - samples/sec: 4959.13 - lr: 0.050000 +2023-04-06 12:22:06,878 epoch 79 - iter 1488/3720 - loss 0.03009245 - time (sec): 254.12 - samples/sec: 4978.84 - lr: 0.050000 +2023-04-06 12:23:08,817 epoch 79 - iter 1860/3720 - loss 0.03002431 - time (sec): 316.06 - samples/sec: 4996.97 - lr: 0.050000 +2023-04-06 12:24:11,867 epoch 79 - iter 2232/3720 - loss 0.03013416 - time (sec): 379.11 - samples/sec: 4992.95 - lr: 0.050000 +2023-04-06 12:25:15,535 epoch 79 - iter 2604/3720 - loss 0.03017423 - time (sec): 442.78 - samples/sec: 4986.62 - lr: 0.050000 +2023-04-06 12:26:19,252 epoch 79 - iter 2976/3720 - loss 0.03027454 - time (sec): 506.49 - samples/sec: 4980.98 - lr: 0.050000 +2023-04-06 12:27:22,216 epoch 79 - iter 3348/3720 - loss 0.03035162 - time (sec): 569.46 - samples/sec: 4983.40 - lr: 0.050000 +2023-04-06 12:28:25,719 epoch 79 - iter 3720/3720 - loss 0.03040132 - time (sec): 632.96 - samples/sec: 4979.32 - lr: 0.050000 +2023-04-06 12:28:25,720 ---------------------------------------------------------------------------------------------------- +2023-04-06 12:28:25,720 EPOCH 79 done: loss 0.0304 - lr 0.050000 +2023-04-06 12:28:25,720 BAD EPOCHS (no improvement): 0 +2023-04-06 12:28:25,723 ---------------------------------------------------------------------------------------------------- +2023-04-06 12:29:29,741 epoch 80 - iter 372/3720 - loss 0.02967585 - time (sec): 64.02 - samples/sec: 4965.95 - lr: 0.050000 +2023-04-06 12:30:32,266 epoch 80 - iter 744/3720 - loss 0.02980327 - time (sec): 126.54 - samples/sec: 4992.19 - lr: 0.050000 +2023-04-06 12:31:35,831 epoch 80 - iter 1116/3720 - loss 0.02997426 - time (sec): 190.11 - samples/sec: 4983.89 - lr: 0.050000 +2023-04-06 12:32:39,623 epoch 80 - iter 1488/3720 - loss 0.03019761 - time (sec): 253.90 - samples/sec: 4973.92 - lr: 0.050000 +2023-04-06 12:33:42,193 epoch 80 - iter 1860/3720 - loss 0.03017472 - time (sec): 316.47 - samples/sec: 4988.34 - lr: 0.050000 +2023-04-06 12:34:45,880 epoch 80 - iter 2232/3720 - loss 0.03006042 - time (sec): 380.16 - samples/sec: 4982.57 - lr: 0.050000 +2023-04-06 12:35:50,163 epoch 80 - iter 2604/3720 - loss 0.03008109 - time (sec): 444.44 - samples/sec: 4974.44 - lr: 0.050000 +2023-04-06 12:36:53,578 epoch 80 - iter 2976/3720 - loss 0.03009367 - time (sec): 507.85 - samples/sec: 4971.11 - lr: 0.050000 +2023-04-06 12:37:56,594 epoch 80 - iter 3348/3720 - loss 0.03025149 - time (sec): 570.87 - samples/sec: 4973.91 - lr: 0.050000 +2023-04-06 12:38:58,959 epoch 80 - iter 3720/3720 - loss 0.03029803 - time (sec): 633.24 - samples/sec: 4977.15 - lr: 0.050000 +2023-04-06 12:38:58,959 ---------------------------------------------------------------------------------------------------- +2023-04-06 12:38:58,959 EPOCH 80 done: loss 0.0303 - lr 0.050000 +2023-04-06 12:38:58,959 BAD EPOCHS (no improvement): 0 +2023-04-06 12:38:58,962 ---------------------------------------------------------------------------------------------------- +2023-04-06 12:40:01,930 epoch 81 - iter 372/3720 - loss 0.02975027 - time (sec): 62.97 - samples/sec: 4999.89 - lr: 0.050000 +2023-04-06 12:41:04,302 epoch 81 - iter 744/3720 - loss 0.03051976 - time (sec): 125.34 - samples/sec: 5016.68 - lr: 0.050000 +2023-04-06 12:42:07,250 epoch 81 - iter 1116/3720 - loss 0.03076626 - time (sec): 188.29 - samples/sec: 5016.89 - lr: 0.050000 +2023-04-06 12:43:10,955 epoch 81 - iter 1488/3720 - loss 0.03052334 - time (sec): 251.99 - samples/sec: 5003.81 - lr: 0.050000 +2023-04-06 12:44:15,673 epoch 81 - iter 1860/3720 - loss 0.03042447 - time (sec): 316.71 - samples/sec: 4987.43 - lr: 0.050000 +2023-04-06 12:45:19,950 epoch 81 - iter 2232/3720 - loss 0.03036129 - time (sec): 380.99 - samples/sec: 4971.63 - lr: 0.050000 +2023-04-06 12:46:23,964 epoch 81 - iter 2604/3720 - loss 0.03039412 - time (sec): 445.00 - samples/sec: 4966.96 - lr: 0.050000 +2023-04-06 12:47:26,745 epoch 81 - iter 2976/3720 - loss 0.03030867 - time (sec): 507.78 - samples/sec: 4968.93 - lr: 0.050000 +2023-04-06 12:48:30,741 epoch 81 - iter 3348/3720 - loss 0.03025832 - time (sec): 571.78 - samples/sec: 4962.95 - lr: 0.050000 +2023-04-06 12:49:34,322 epoch 81 - iter 3720/3720 - loss 0.03027550 - time (sec): 635.36 - samples/sec: 4960.51 - lr: 0.050000 +2023-04-06 12:49:34,322 ---------------------------------------------------------------------------------------------------- +2023-04-06 12:49:34,322 EPOCH 81 done: loss 0.0303 - lr 0.050000 +2023-04-06 12:49:34,322 BAD EPOCHS (no improvement): 0 +2023-04-06 12:49:34,325 ---------------------------------------------------------------------------------------------------- +2023-04-06 12:50:37,764 epoch 82 - iter 372/3720 - loss 0.02977248 - time (sec): 63.44 - samples/sec: 4980.45 - lr: 0.050000 +2023-04-06 12:51:40,812 epoch 82 - iter 744/3720 - loss 0.02977672 - time (sec): 126.49 - samples/sec: 4972.33 - lr: 0.050000 +2023-04-06 12:52:43,768 epoch 82 - iter 1116/3720 - loss 0.02981920 - time (sec): 189.44 - samples/sec: 4986.93 - lr: 0.050000 +2023-04-06 12:53:47,696 epoch 82 - iter 1488/3720 - loss 0.02974237 - time (sec): 253.37 - samples/sec: 4987.24 - lr: 0.050000 +2023-04-06 12:54:51,401 epoch 82 - iter 1860/3720 - loss 0.02983702 - time (sec): 317.08 - samples/sec: 4971.99 - lr: 0.050000 +2023-04-06 12:55:55,682 epoch 82 - iter 2232/3720 - loss 0.02997370 - time (sec): 381.36 - samples/sec: 4963.87 - lr: 0.050000 +2023-04-06 12:56:58,728 epoch 82 - iter 2604/3720 - loss 0.03010291 - time (sec): 444.40 - samples/sec: 4967.19 - lr: 0.050000 +2023-04-06 12:58:01,531 epoch 82 - iter 2976/3720 - loss 0.03005695 - time (sec): 507.21 - samples/sec: 4974.33 - lr: 0.050000 +2023-04-06 12:59:05,659 epoch 82 - iter 3348/3720 - loss 0.03006183 - time (sec): 571.33 - samples/sec: 4965.83 - lr: 0.050000 +2023-04-06 13:00:08,499 epoch 82 - iter 3720/3720 - loss 0.03017237 - time (sec): 634.17 - samples/sec: 4969.80 - lr: 0.050000 +2023-04-06 13:00:08,499 ---------------------------------------------------------------------------------------------------- +2023-04-06 13:00:08,499 EPOCH 82 done: loss 0.0302 - lr 0.050000 +2023-04-06 13:00:08,499 BAD EPOCHS (no improvement): 0 +2023-04-06 13:00:08,502 ---------------------------------------------------------------------------------------------------- +2023-04-06 13:01:12,221 epoch 83 - iter 372/3720 - loss 0.03043908 - time (sec): 63.72 - samples/sec: 4951.87 - lr: 0.050000 +2023-04-06 13:02:16,000 epoch 83 - iter 744/3720 - loss 0.03032200 - time (sec): 127.50 - samples/sec: 4941.02 - lr: 0.050000 +2023-04-06 13:03:20,241 epoch 83 - iter 1116/3720 - loss 0.03014522 - time (sec): 191.74 - samples/sec: 4933.39 - lr: 0.050000 +2023-04-06 13:04:24,273 epoch 83 - iter 1488/3720 - loss 0.03036548 - time (sec): 255.77 - samples/sec: 4933.74 - lr: 0.050000 +2023-04-06 13:05:27,755 epoch 83 - iter 1860/3720 - loss 0.03029812 - time (sec): 319.25 - samples/sec: 4932.26 - lr: 0.050000 +2023-04-06 13:06:31,221 epoch 83 - iter 2232/3720 - loss 0.03030823 - time (sec): 382.72 - samples/sec: 4940.43 - lr: 0.050000 +2023-04-06 13:07:33,936 epoch 83 - iter 2604/3720 - loss 0.03029005 - time (sec): 445.43 - samples/sec: 4954.28 - lr: 0.050000 +2023-04-06 13:08:38,059 epoch 83 - iter 2976/3720 - loss 0.03027530 - time (sec): 509.56 - samples/sec: 4948.93 - lr: 0.050000 +2023-04-06 13:09:41,850 epoch 83 - iter 3348/3720 - loss 0.03022734 - time (sec): 573.35 - samples/sec: 4947.83 - lr: 0.050000 +2023-04-06 13:10:45,251 epoch 83 - iter 3720/3720 - loss 0.03015810 - time (sec): 636.75 - samples/sec: 4949.70 - lr: 0.050000 +2023-04-06 13:10:45,251 ---------------------------------------------------------------------------------------------------- +2023-04-06 13:10:45,251 EPOCH 83 done: loss 0.0302 - lr 0.050000 +2023-04-06 13:10:45,251 BAD EPOCHS (no improvement): 0 +2023-04-06 13:10:45,254 ---------------------------------------------------------------------------------------------------- +2023-04-06 13:11:48,427 epoch 84 - iter 372/3720 - loss 0.02908372 - time (sec): 63.17 - samples/sec: 4960.66 - lr: 0.050000 +2023-04-06 13:12:52,193 epoch 84 - iter 744/3720 - loss 0.02956119 - time (sec): 126.94 - samples/sec: 4942.69 - lr: 0.050000 +2023-04-06 13:13:56,791 epoch 84 - iter 1116/3720 - loss 0.02940072 - time (sec): 191.54 - samples/sec: 4934.39 - lr: 0.050000 +2023-04-06 13:14:59,569 epoch 84 - iter 1488/3720 - loss 0.02954165 - time (sec): 254.31 - samples/sec: 4952.96 - lr: 0.050000 +2023-04-06 13:16:01,106 epoch 84 - iter 1860/3720 - loss 0.02981238 - time (sec): 315.85 - samples/sec: 4978.97 - lr: 0.050000 +2023-04-06 13:17:04,334 epoch 84 - iter 2232/3720 - loss 0.02981780 - time (sec): 379.08 - samples/sec: 4984.31 - lr: 0.050000 +2023-04-06 13:18:08,919 epoch 84 - iter 2604/3720 - loss 0.02981041 - time (sec): 443.67 - samples/sec: 4975.37 - lr: 0.050000 +2023-04-06 13:19:12,215 epoch 84 - iter 2976/3720 - loss 0.02984617 - time (sec): 506.96 - samples/sec: 4976.52 - lr: 0.050000 +2023-04-06 13:20:14,762 epoch 84 - iter 3348/3720 - loss 0.02999180 - time (sec): 569.51 - samples/sec: 4981.50 - lr: 0.050000 +2023-04-06 13:21:18,532 epoch 84 - iter 3720/3720 - loss 0.03004575 - time (sec): 633.28 - samples/sec: 4976.83 - lr: 0.050000 +2023-04-06 13:21:18,532 ---------------------------------------------------------------------------------------------------- +2023-04-06 13:21:18,532 EPOCH 84 done: loss 0.0300 - lr 0.050000 +2023-04-06 13:21:18,532 BAD EPOCHS (no improvement): 0 +2023-04-06 13:21:18,535 ---------------------------------------------------------------------------------------------------- +2023-04-06 13:22:22,664 epoch 85 - iter 372/3720 - loss 0.02902546 - time (sec): 64.13 - samples/sec: 4936.46 - lr: 0.050000 +2023-04-06 13:23:26,348 epoch 85 - iter 744/3720 - loss 0.02949886 - time (sec): 127.81 - samples/sec: 4943.93 - lr: 0.050000 +2023-04-06 13:24:31,398 epoch 85 - iter 1116/3720 - loss 0.02952757 - time (sec): 192.86 - samples/sec: 4916.08 - lr: 0.050000 +2023-04-06 13:25:35,221 epoch 85 - iter 1488/3720 - loss 0.02998131 - time (sec): 256.69 - samples/sec: 4911.89 - lr: 0.050000 +2023-04-06 13:26:39,389 epoch 85 - iter 1860/3720 - loss 0.02996414 - time (sec): 320.85 - samples/sec: 4908.02 - lr: 0.050000 +2023-04-06 13:27:43,083 epoch 85 - iter 2232/3720 - loss 0.03001694 - time (sec): 384.55 - samples/sec: 4915.96 - lr: 0.050000 +2023-04-06 13:28:47,258 epoch 85 - iter 2604/3720 - loss 0.02993371 - time (sec): 448.72 - samples/sec: 4918.72 - lr: 0.050000 +2023-04-06 13:29:51,792 epoch 85 - iter 2976/3720 - loss 0.02987828 - time (sec): 513.26 - samples/sec: 4912.85 - lr: 0.050000 +2023-04-06 13:30:55,747 epoch 85 - iter 3348/3720 - loss 0.02983418 - time (sec): 577.21 - samples/sec: 4912.32 - lr: 0.050000 +2023-04-06 13:31:59,736 epoch 85 - iter 3720/3720 - loss 0.02986079 - time (sec): 641.20 - samples/sec: 4915.33 - lr: 0.050000 +2023-04-06 13:31:59,737 ---------------------------------------------------------------------------------------------------- +2023-04-06 13:31:59,737 EPOCH 85 done: loss 0.0299 - lr 0.050000 +2023-04-06 13:31:59,737 BAD EPOCHS (no improvement): 0 +2023-04-06 13:31:59,740 ---------------------------------------------------------------------------------------------------- +2023-04-06 13:33:03,757 epoch 86 - iter 372/3720 - loss 0.02923677 - time (sec): 64.02 - samples/sec: 4934.86 - lr: 0.050000 +2023-04-06 13:34:06,935 epoch 86 - iter 744/3720 - loss 0.02950851 - time (sec): 127.20 - samples/sec: 4968.11 - lr: 0.050000 +2023-04-06 13:35:09,973 epoch 86 - iter 1116/3720 - loss 0.02994130 - time (sec): 190.23 - samples/sec: 4981.61 - lr: 0.050000 +2023-04-06 13:36:12,083 epoch 86 - iter 1488/3720 - loss 0.03002814 - time (sec): 252.34 - samples/sec: 5004.61 - lr: 0.050000 +2023-04-06 13:37:14,901 epoch 86 - iter 1860/3720 - loss 0.02999422 - time (sec): 315.16 - samples/sec: 5009.75 - lr: 0.050000 +2023-04-06 13:38:17,771 epoch 86 - iter 2232/3720 - loss 0.02999098 - time (sec): 378.03 - samples/sec: 5010.54 - lr: 0.050000 +2023-04-06 13:39:21,085 epoch 86 - iter 2604/3720 - loss 0.02992430 - time (sec): 441.34 - samples/sec: 5001.78 - lr: 0.050000 +2023-04-06 13:40:25,116 epoch 86 - iter 2976/3720 - loss 0.02990109 - time (sec): 505.38 - samples/sec: 4993.15 - lr: 0.050000 +2023-04-06 13:41:27,680 epoch 86 - iter 3348/3720 - loss 0.02995638 - time (sec): 567.94 - samples/sec: 4993.61 - lr: 0.050000 +2023-04-06 13:42:30,937 epoch 86 - iter 3720/3720 - loss 0.02997383 - time (sec): 631.20 - samples/sec: 4993.23 - lr: 0.050000 +2023-04-06 13:42:30,937 ---------------------------------------------------------------------------------------------------- +2023-04-06 13:42:30,937 EPOCH 86 done: loss 0.0300 - lr 0.050000 +2023-04-06 13:42:30,937 BAD EPOCHS (no improvement): 1 +2023-04-06 13:42:30,940 ---------------------------------------------------------------------------------------------------- +2023-04-06 13:43:34,861 epoch 87 - iter 372/3720 - loss 0.02955950 - time (sec): 63.92 - samples/sec: 4928.74 - lr: 0.050000 +2023-04-06 13:44:39,653 epoch 87 - iter 744/3720 - loss 0.02946349 - time (sec): 128.71 - samples/sec: 4932.74 - lr: 0.050000 +2023-04-06 13:45:43,726 epoch 87 - iter 1116/3720 - loss 0.02977305 - time (sec): 192.79 - samples/sec: 4932.02 - lr: 0.050000 +2023-04-06 13:46:47,650 epoch 87 - iter 1488/3720 - loss 0.02979529 - time (sec): 256.71 - samples/sec: 4923.84 - lr: 0.050000 +2023-04-06 13:47:51,153 epoch 87 - iter 1860/3720 - loss 0.02988215 - time (sec): 320.21 - samples/sec: 4927.51 - lr: 0.050000 +2023-04-06 13:48:55,054 epoch 87 - iter 2232/3720 - loss 0.02994461 - time (sec): 384.11 - samples/sec: 4926.85 - lr: 0.050000 +2023-04-06 13:50:00,227 epoch 87 - iter 2604/3720 - loss 0.02983321 - time (sec): 449.29 - samples/sec: 4915.60 - lr: 0.050000 +2023-04-06 13:51:03,744 epoch 87 - iter 2976/3720 - loss 0.02987213 - time (sec): 512.80 - samples/sec: 4916.68 - lr: 0.050000 +2023-04-06 13:52:07,890 epoch 87 - iter 3348/3720 - loss 0.02979281 - time (sec): 576.95 - samples/sec: 4916.04 - lr: 0.050000 +2023-04-06 13:53:12,302 epoch 87 - iter 3720/3720 - loss 0.02979169 - time (sec): 641.36 - samples/sec: 4914.10 - lr: 0.050000 +2023-04-06 13:53:12,302 ---------------------------------------------------------------------------------------------------- +2023-04-06 13:53:12,302 EPOCH 87 done: loss 0.0298 - lr 0.050000 +2023-04-06 13:53:12,302 BAD EPOCHS (no improvement): 0 +2023-04-06 13:53:12,305 ---------------------------------------------------------------------------------------------------- +2023-04-06 13:54:16,223 epoch 88 - iter 372/3720 - loss 0.02878423 - time (sec): 63.92 - samples/sec: 4925.16 - lr: 0.050000 +2023-04-06 13:55:19,407 epoch 88 - iter 744/3720 - loss 0.02900817 - time (sec): 127.10 - samples/sec: 4931.56 - lr: 0.050000 +2023-04-06 13:56:22,766 epoch 88 - iter 1116/3720 - loss 0.02934331 - time (sec): 190.46 - samples/sec: 4943.01 - lr: 0.050000 +2023-04-06 13:57:25,382 epoch 88 - iter 1488/3720 - loss 0.02947376 - time (sec): 253.08 - samples/sec: 4964.91 - lr: 0.050000 +2023-04-06 13:58:29,104 epoch 88 - iter 1860/3720 - loss 0.02954726 - time (sec): 316.80 - samples/sec: 4968.14 - lr: 0.050000 +2023-04-06 13:59:31,746 epoch 88 - iter 2232/3720 - loss 0.02971221 - time (sec): 379.44 - samples/sec: 4981.73 - lr: 0.050000 +2023-04-06 14:00:35,645 epoch 88 - iter 2604/3720 - loss 0.02971017 - time (sec): 443.34 - samples/sec: 4973.40 - lr: 0.050000 +2023-04-06 14:01:39,863 epoch 88 - iter 2976/3720 - loss 0.02969125 - time (sec): 507.56 - samples/sec: 4969.18 - lr: 0.050000 +2023-04-06 14:02:43,882 epoch 88 - iter 3348/3720 - loss 0.02979260 - time (sec): 571.58 - samples/sec: 4965.68 - lr: 0.050000 +2023-04-06 14:03:46,446 epoch 88 - iter 3720/3720 - loss 0.02979054 - time (sec): 634.14 - samples/sec: 4970.05 - lr: 0.050000 +2023-04-06 14:03:46,447 ---------------------------------------------------------------------------------------------------- +2023-04-06 14:03:46,447 EPOCH 88 done: loss 0.0298 - lr 0.050000 +2023-04-06 14:03:46,447 BAD EPOCHS (no improvement): 0 +2023-04-06 14:03:46,451 ---------------------------------------------------------------------------------------------------- +2023-04-06 14:04:49,702 epoch 89 - iter 372/3720 - loss 0.02946297 - time (sec): 63.25 - samples/sec: 4971.61 - lr: 0.050000 +2023-04-06 14:05:54,264 epoch 89 - iter 744/3720 - loss 0.03008024 - time (sec): 127.81 - samples/sec: 4928.31 - lr: 0.050000 +2023-04-06 14:06:59,024 epoch 89 - iter 1116/3720 - loss 0.02983486 - time (sec): 192.57 - samples/sec: 4923.71 - lr: 0.050000 +2023-04-06 14:08:03,409 epoch 89 - iter 1488/3720 - loss 0.02967858 - time (sec): 256.96 - samples/sec: 4917.98 - lr: 0.050000 +2023-04-06 14:09:06,664 epoch 89 - iter 1860/3720 - loss 0.02955772 - time (sec): 320.21 - samples/sec: 4928.70 - lr: 0.050000 +2023-04-06 14:10:09,000 epoch 89 - iter 2232/3720 - loss 0.02962135 - time (sec): 382.55 - samples/sec: 4948.27 - lr: 0.050000 +2023-04-06 14:11:11,921 epoch 89 - iter 2604/3720 - loss 0.02959664 - time (sec): 445.47 - samples/sec: 4951.07 - lr: 0.050000 +2023-04-06 14:12:16,345 epoch 89 - iter 2976/3720 - loss 0.02970072 - time (sec): 509.89 - samples/sec: 4944.29 - lr: 0.050000 +2023-04-06 14:13:21,194 epoch 89 - iter 3348/3720 - loss 0.02971199 - time (sec): 574.74 - samples/sec: 4938.18 - lr: 0.050000 +2023-04-06 14:14:25,101 epoch 89 - iter 3720/3720 - loss 0.02974746 - time (sec): 638.65 - samples/sec: 4934.96 - lr: 0.050000 +2023-04-06 14:14:25,101 ---------------------------------------------------------------------------------------------------- +2023-04-06 14:14:25,101 EPOCH 89 done: loss 0.0297 - lr 0.050000 +2023-04-06 14:14:25,101 BAD EPOCHS (no improvement): 0 +2023-04-06 14:14:25,104 ---------------------------------------------------------------------------------------------------- +2023-04-06 14:15:29,312 epoch 90 - iter 372/3720 - loss 0.02967709 - time (sec): 64.21 - samples/sec: 4935.27 - lr: 0.050000 +2023-04-06 14:16:33,686 epoch 90 - iter 744/3720 - loss 0.02956470 - time (sec): 128.58 - samples/sec: 4924.76 - lr: 0.050000 +2023-04-06 14:17:37,387 epoch 90 - iter 1116/3720 - loss 0.02956805 - time (sec): 192.28 - samples/sec: 4929.26 - lr: 0.050000 +2023-04-06 14:18:40,952 epoch 90 - iter 1488/3720 - loss 0.02963412 - time (sec): 255.85 - samples/sec: 4934.68 - lr: 0.050000 +2023-04-06 14:19:45,152 epoch 90 - iter 1860/3720 - loss 0.02984104 - time (sec): 320.05 - samples/sec: 4927.35 - lr: 0.050000 +2023-04-06 14:20:49,368 epoch 90 - iter 2232/3720 - loss 0.02978023 - time (sec): 384.26 - samples/sec: 4924.98 - lr: 0.050000 +2023-04-06 14:21:53,220 epoch 90 - iter 2604/3720 - loss 0.02980348 - time (sec): 448.12 - samples/sec: 4929.15 - lr: 0.050000 +2023-04-06 14:22:57,003 epoch 90 - iter 2976/3720 - loss 0.02980065 - time (sec): 511.90 - samples/sec: 4926.88 - lr: 0.050000 +2023-04-06 14:24:00,692 epoch 90 - iter 3348/3720 - loss 0.02970333 - time (sec): 575.59 - samples/sec: 4929.03 - lr: 0.050000 +2023-04-06 14:25:05,523 epoch 90 - iter 3720/3720 - loss 0.02968234 - time (sec): 640.42 - samples/sec: 4921.34 - lr: 0.050000 +2023-04-06 14:25:05,523 ---------------------------------------------------------------------------------------------------- +2023-04-06 14:25:05,523 EPOCH 90 done: loss 0.0297 - lr 0.050000 +2023-04-06 14:25:05,523 BAD EPOCHS (no improvement): 0 +2023-04-06 14:25:05,527 ---------------------------------------------------------------------------------------------------- +2023-04-06 14:26:09,538 epoch 91 - iter 372/3720 - loss 0.02855779 - time (sec): 64.01 - samples/sec: 4950.08 - lr: 0.050000 +2023-04-06 14:27:12,559 epoch 91 - iter 744/3720 - loss 0.02911246 - time (sec): 127.03 - samples/sec: 4970.09 - lr: 0.050000 +2023-04-06 14:28:15,052 epoch 91 - iter 1116/3720 - loss 0.02935122 - time (sec): 189.52 - samples/sec: 4994.77 - lr: 0.050000 +2023-04-06 14:29:18,974 epoch 91 - iter 1488/3720 - loss 0.02941200 - time (sec): 253.45 - samples/sec: 4983.38 - lr: 0.050000 +2023-04-06 14:30:23,126 epoch 91 - iter 1860/3720 - loss 0.02947597 - time (sec): 317.60 - samples/sec: 4966.61 - lr: 0.050000 +2023-04-06 14:31:25,350 epoch 91 - iter 2232/3720 - loss 0.02953269 - time (sec): 379.82 - samples/sec: 4975.14 - lr: 0.050000 +2023-04-06 14:32:28,560 epoch 91 - iter 2604/3720 - loss 0.02945525 - time (sec): 443.03 - samples/sec: 4977.74 - lr: 0.050000 +2023-04-06 14:33:32,497 epoch 91 - iter 2976/3720 - loss 0.02944464 - time (sec): 506.97 - samples/sec: 4974.91 - lr: 0.050000 +2023-04-06 14:34:35,915 epoch 91 - iter 3348/3720 - loss 0.02957418 - time (sec): 570.39 - samples/sec: 4974.90 - lr: 0.050000 +2023-04-06 14:35:39,277 epoch 91 - iter 3720/3720 - loss 0.02955067 - time (sec): 633.75 - samples/sec: 4973.12 - lr: 0.050000 +2023-04-06 14:35:39,278 ---------------------------------------------------------------------------------------------------- +2023-04-06 14:35:39,278 EPOCH 91 done: loss 0.0296 - lr 0.050000 +2023-04-06 14:35:39,278 BAD EPOCHS (no improvement): 0 +2023-04-06 14:35:39,281 ---------------------------------------------------------------------------------------------------- +2023-04-06 14:36:42,207 epoch 92 - iter 372/3720 - loss 0.03000054 - time (sec): 62.93 - samples/sec: 5009.41 - lr: 0.050000 +2023-04-06 14:37:46,192 epoch 92 - iter 744/3720 - loss 0.03046749 - time (sec): 126.91 - samples/sec: 4947.57 - lr: 0.050000 +2023-04-06 14:38:50,601 epoch 92 - iter 1116/3720 - loss 0.03014072 - time (sec): 191.32 - samples/sec: 4938.82 - lr: 0.050000 +2023-04-06 14:39:54,783 epoch 92 - iter 1488/3720 - loss 0.03012977 - time (sec): 255.50 - samples/sec: 4934.32 - lr: 0.050000 +2023-04-06 14:40:58,658 epoch 92 - iter 1860/3720 - loss 0.03005794 - time (sec): 319.38 - samples/sec: 4933.31 - lr: 0.050000 +2023-04-06 14:42:01,560 epoch 92 - iter 2232/3720 - loss 0.03000857 - time (sec): 382.28 - samples/sec: 4937.17 - lr: 0.050000 +2023-04-06 14:43:05,835 epoch 92 - iter 2604/3720 - loss 0.02985341 - time (sec): 446.55 - samples/sec: 4938.38 - lr: 0.050000 +2023-04-06 14:44:11,044 epoch 92 - iter 2976/3720 - loss 0.02979932 - time (sec): 511.76 - samples/sec: 4931.23 - lr: 0.050000 +2023-04-06 14:45:14,862 epoch 92 - iter 3348/3720 - loss 0.02979041 - time (sec): 575.58 - samples/sec: 4931.62 - lr: 0.050000 +2023-04-06 14:46:18,753 epoch 92 - iter 3720/3720 - loss 0.02961658 - time (sec): 639.47 - samples/sec: 4928.61 - lr: 0.050000 +2023-04-06 14:46:18,754 ---------------------------------------------------------------------------------------------------- +2023-04-06 14:46:18,754 EPOCH 92 done: loss 0.0296 - lr 0.050000 +2023-04-06 14:46:18,754 BAD EPOCHS (no improvement): 1 +2023-04-06 14:46:18,757 ---------------------------------------------------------------------------------------------------- +2023-04-06 14:47:22,362 epoch 93 - iter 372/3720 - loss 0.02949013 - time (sec): 63.61 - samples/sec: 4934.02 - lr: 0.050000 +2023-04-06 14:48:27,004 epoch 93 - iter 744/3720 - loss 0.02954477 - time (sec): 128.25 - samples/sec: 4908.90 - lr: 0.050000 +2023-04-06 14:49:31,369 epoch 93 - iter 1116/3720 - loss 0.02954577 - time (sec): 192.61 - samples/sec: 4900.16 - lr: 0.050000 +2023-04-06 14:50:32,931 epoch 93 - iter 1488/3720 - loss 0.02958463 - time (sec): 254.17 - samples/sec: 4945.72 - lr: 0.050000 +2023-04-06 14:51:35,509 epoch 93 - iter 1860/3720 - loss 0.02962799 - time (sec): 316.75 - samples/sec: 4967.73 - lr: 0.050000 +2023-04-06 14:52:38,620 epoch 93 - iter 2232/3720 - loss 0.02969660 - time (sec): 379.86 - samples/sec: 4974.26 - lr: 0.050000 +2023-04-06 14:53:41,162 epoch 93 - iter 2604/3720 - loss 0.02972034 - time (sec): 442.41 - samples/sec: 4985.21 - lr: 0.050000 +2023-04-06 14:54:44,347 epoch 93 - iter 2976/3720 - loss 0.02969130 - time (sec): 505.59 - samples/sec: 4988.07 - lr: 0.050000 +2023-04-06 14:55:47,388 epoch 93 - iter 3348/3720 - loss 0.02971463 - time (sec): 568.63 - samples/sec: 4989.28 - lr: 0.050000 +2023-04-06 14:56:49,677 epoch 93 - iter 3720/3720 - loss 0.02968347 - time (sec): 630.92 - samples/sec: 4995.42 - lr: 0.050000 +2023-04-06 14:56:49,678 ---------------------------------------------------------------------------------------------------- +2023-04-06 14:56:49,678 EPOCH 93 done: loss 0.0297 - lr 0.050000 +2023-04-06 14:56:49,678 BAD EPOCHS (no improvement): 2 +2023-04-06 14:56:49,681 ---------------------------------------------------------------------------------------------------- +2023-04-06 14:57:51,883 epoch 94 - iter 372/3720 - loss 0.02924225 - time (sec): 62.20 - samples/sec: 5024.92 - lr: 0.050000 +2023-04-06 14:58:55,243 epoch 94 - iter 744/3720 - loss 0.02917742 - time (sec): 125.56 - samples/sec: 5018.20 - lr: 0.050000 +2023-04-06 14:59:58,387 epoch 94 - iter 1116/3720 - loss 0.02940144 - time (sec): 188.71 - samples/sec: 5015.68 - lr: 0.050000 +2023-04-06 15:01:02,165 epoch 94 - iter 1488/3720 - loss 0.02928628 - time (sec): 252.48 - samples/sec: 4995.52 - lr: 0.050000 +2023-04-06 15:02:06,720 epoch 94 - iter 1860/3720 - loss 0.02954478 - time (sec): 317.04 - samples/sec: 4973.97 - lr: 0.050000 +2023-04-06 15:03:11,366 epoch 94 - iter 2232/3720 - loss 0.02944295 - time (sec): 381.68 - samples/sec: 4957.13 - lr: 0.050000 +2023-04-06 15:04:14,372 epoch 94 - iter 2604/3720 - loss 0.02932206 - time (sec): 444.69 - samples/sec: 4961.61 - lr: 0.050000 +2023-04-06 15:05:17,643 epoch 94 - iter 2976/3720 - loss 0.02934208 - time (sec): 507.96 - samples/sec: 4962.62 - lr: 0.050000 +2023-04-06 15:06:20,427 epoch 94 - iter 3348/3720 - loss 0.02945435 - time (sec): 570.75 - samples/sec: 4965.75 - lr: 0.050000 +2023-04-06 15:07:24,884 epoch 94 - iter 3720/3720 - loss 0.02951776 - time (sec): 635.20 - samples/sec: 4961.74 - lr: 0.050000 +2023-04-06 15:07:24,884 ---------------------------------------------------------------------------------------------------- +2023-04-06 15:07:24,884 EPOCH 94 done: loss 0.0295 - lr 0.050000 +2023-04-06 15:07:24,884 BAD EPOCHS (no improvement): 0 +2023-04-06 15:07:24,888 ---------------------------------------------------------------------------------------------------- +2023-04-06 15:08:27,171 epoch 95 - iter 372/3720 - loss 0.02936498 - time (sec): 62.28 - samples/sec: 5039.08 - lr: 0.050000 +2023-04-06 15:09:30,536 epoch 95 - iter 744/3720 - loss 0.02887280 - time (sec): 125.65 - samples/sec: 5008.77 - lr: 0.050000 +2023-04-06 15:10:33,863 epoch 95 - iter 1116/3720 - loss 0.02894426 - time (sec): 188.97 - samples/sec: 5005.54 - lr: 0.050000 +2023-04-06 15:11:38,073 epoch 95 - iter 1488/3720 - loss 0.02927178 - time (sec): 253.19 - samples/sec: 4972.78 - lr: 0.050000 +2023-04-06 15:12:42,544 epoch 95 - iter 1860/3720 - loss 0.02919982 - time (sec): 317.66 - samples/sec: 4950.72 - lr: 0.050000 +2023-04-06 15:13:47,007 epoch 95 - iter 2232/3720 - loss 0.02912063 - time (sec): 382.12 - samples/sec: 4946.09 - lr: 0.050000 +2023-04-06 15:14:50,719 epoch 95 - iter 2604/3720 - loss 0.02914057 - time (sec): 445.83 - samples/sec: 4950.06 - lr: 0.050000 +2023-04-06 15:15:54,115 epoch 95 - iter 2976/3720 - loss 0.02914541 - time (sec): 509.23 - samples/sec: 4951.91 - lr: 0.050000 +2023-04-06 15:16:57,568 epoch 95 - iter 3348/3720 - loss 0.02916951 - time (sec): 572.68 - samples/sec: 4954.18 - lr: 0.050000 +2023-04-06 15:18:01,117 epoch 95 - iter 3720/3720 - loss 0.02926558 - time (sec): 636.23 - samples/sec: 4953.74 - lr: 0.050000 +2023-04-06 15:18:01,117 ---------------------------------------------------------------------------------------------------- +2023-04-06 15:18:01,117 EPOCH 95 done: loss 0.0293 - lr 0.050000 +2023-04-06 15:18:01,117 BAD EPOCHS (no improvement): 0 +2023-04-06 15:18:01,124 ---------------------------------------------------------------------------------------------------- +2023-04-06 15:19:05,315 epoch 96 - iter 372/3720 - loss 0.02967119 - time (sec): 64.19 - samples/sec: 4927.13 - lr: 0.050000 +2023-04-06 15:20:09,775 epoch 96 - iter 744/3720 - loss 0.02946338 - time (sec): 128.65 - samples/sec: 4914.75 - lr: 0.050000 +2023-04-06 15:21:12,527 epoch 96 - iter 1116/3720 - loss 0.02952667 - time (sec): 191.40 - samples/sec: 4943.59 - lr: 0.050000 +2023-04-06 15:22:15,935 epoch 96 - iter 1488/3720 - loss 0.02925585 - time (sec): 254.81 - samples/sec: 4957.78 - lr: 0.050000 +2023-04-06 15:23:19,925 epoch 96 - iter 1860/3720 - loss 0.02927701 - time (sec): 318.80 - samples/sec: 4946.03 - lr: 0.050000 +2023-04-06 15:24:23,982 epoch 96 - iter 2232/3720 - loss 0.02911695 - time (sec): 382.86 - samples/sec: 4940.62 - lr: 0.050000 +2023-04-06 15:25:27,385 epoch 96 - iter 2604/3720 - loss 0.02923169 - time (sec): 446.26 - samples/sec: 4939.68 - lr: 0.050000 +2023-04-06 15:26:31,221 epoch 96 - iter 2976/3720 - loss 0.02936122 - time (sec): 510.10 - samples/sec: 4939.62 - lr: 0.050000 +2023-04-06 15:27:34,688 epoch 96 - iter 3348/3720 - loss 0.02930831 - time (sec): 573.56 - samples/sec: 4941.02 - lr: 0.050000 +2023-04-06 15:28:38,474 epoch 96 - iter 3720/3720 - loss 0.02929948 - time (sec): 637.35 - samples/sec: 4945.03 - lr: 0.050000 +2023-04-06 15:28:38,474 ---------------------------------------------------------------------------------------------------- +2023-04-06 15:28:38,474 EPOCH 96 done: loss 0.0293 - lr 0.050000 +2023-04-06 15:28:38,474 BAD EPOCHS (no improvement): 1 +2023-04-06 15:28:38,477 ---------------------------------------------------------------------------------------------------- +2023-04-06 15:29:41,896 epoch 97 - iter 372/3720 - loss 0.02846987 - time (sec): 63.42 - samples/sec: 4964.38 - lr: 0.050000 +2023-04-06 15:30:45,520 epoch 97 - iter 744/3720 - loss 0.02902019 - time (sec): 127.04 - samples/sec: 4956.62 - lr: 0.050000 +2023-04-06 15:31:48,172 epoch 97 - iter 1116/3720 - loss 0.02921452 - time (sec): 189.69 - samples/sec: 4971.69 - lr: 0.050000 +2023-04-06 15:32:51,629 epoch 97 - iter 1488/3720 - loss 0.02924840 - time (sec): 253.15 - samples/sec: 4974.23 - lr: 0.050000 +2023-04-06 15:33:53,890 epoch 97 - iter 1860/3720 - loss 0.02927003 - time (sec): 315.41 - samples/sec: 4985.37 - lr: 0.050000 +2023-04-06 15:34:57,913 epoch 97 - iter 2232/3720 - loss 0.02925115 - time (sec): 379.44 - samples/sec: 4981.77 - lr: 0.050000 +2023-04-06 15:36:01,517 epoch 97 - iter 2604/3720 - loss 0.02926837 - time (sec): 443.04 - samples/sec: 4979.62 - lr: 0.050000 +2023-04-06 15:37:05,820 epoch 97 - iter 2976/3720 - loss 0.02929307 - time (sec): 507.34 - samples/sec: 4967.57 - lr: 0.050000 +2023-04-06 15:38:09,978 epoch 97 - iter 3348/3720 - loss 0.02928203 - time (sec): 571.50 - samples/sec: 4964.43 - lr: 0.050000 +2023-04-06 15:39:13,882 epoch 97 - iter 3720/3720 - loss 0.02929182 - time (sec): 635.41 - samples/sec: 4960.16 - lr: 0.050000 +2023-04-06 15:39:13,883 ---------------------------------------------------------------------------------------------------- +2023-04-06 15:39:13,883 EPOCH 97 done: loss 0.0293 - lr 0.050000 +2023-04-06 15:39:13,883 BAD EPOCHS (no improvement): 2 +2023-04-06 15:39:13,886 ---------------------------------------------------------------------------------------------------- +2023-04-06 15:40:18,041 epoch 98 - iter 372/3720 - loss 0.02915454 - time (sec): 64.16 - samples/sec: 4892.46 - lr: 0.050000 +2023-04-06 15:41:21,546 epoch 98 - iter 744/3720 - loss 0.02918277 - time (sec): 127.66 - samples/sec: 4924.41 - lr: 0.050000 +2023-04-06 15:42:25,001 epoch 98 - iter 1116/3720 - loss 0.02909367 - time (sec): 191.11 - samples/sec: 4932.07 - lr: 0.050000 +2023-04-06 15:43:27,908 epoch 98 - iter 1488/3720 - loss 0.02927396 - time (sec): 254.02 - samples/sec: 4949.97 - lr: 0.050000 +2023-04-06 15:44:31,820 epoch 98 - iter 1860/3720 - loss 0.02931938 - time (sec): 317.93 - samples/sec: 4954.28 - lr: 0.050000 +2023-04-06 15:45:35,712 epoch 98 - iter 2232/3720 - loss 0.02927944 - time (sec): 381.83 - samples/sec: 4948.43 - lr: 0.050000 +2023-04-06 15:46:39,824 epoch 98 - iter 2604/3720 - loss 0.02925248 - time (sec): 445.94 - samples/sec: 4939.69 - lr: 0.050000 +2023-04-06 15:47:43,650 epoch 98 - iter 2976/3720 - loss 0.02905909 - time (sec): 509.76 - samples/sec: 4942.76 - lr: 0.050000 +2023-04-06 15:48:47,900 epoch 98 - iter 3348/3720 - loss 0.02912807 - time (sec): 574.01 - samples/sec: 4940.40 - lr: 0.050000 +2023-04-06 15:49:52,162 epoch 98 - iter 3720/3720 - loss 0.02928766 - time (sec): 638.28 - samples/sec: 4937.85 - lr: 0.050000 +2023-04-06 15:49:52,163 ---------------------------------------------------------------------------------------------------- +2023-04-06 15:49:52,163 EPOCH 98 done: loss 0.0293 - lr 0.050000 +2023-04-06 15:49:52,163 BAD EPOCHS (no improvement): 3 +2023-04-06 15:49:52,167 ---------------------------------------------------------------------------------------------------- +2023-04-06 15:50:57,014 epoch 99 - iter 372/3720 - loss 0.02846481 - time (sec): 64.85 - samples/sec: 4883.70 - lr: 0.050000 +2023-04-06 15:52:01,104 epoch 99 - iter 744/3720 - loss 0.02860222 - time (sec): 128.94 - samples/sec: 4905.84 - lr: 0.050000 +2023-04-06 15:53:04,755 epoch 99 - iter 1116/3720 - loss 0.02893728 - time (sec): 192.59 - samples/sec: 4921.85 - lr: 0.050000 +2023-04-06 15:54:08,776 epoch 99 - iter 1488/3720 - loss 0.02911058 - time (sec): 256.61 - samples/sec: 4929.96 - lr: 0.050000 +2023-04-06 15:55:13,006 epoch 99 - iter 1860/3720 - loss 0.02900851 - time (sec): 320.84 - samples/sec: 4925.42 - lr: 0.050000 +2023-04-06 15:56:15,908 epoch 99 - iter 2232/3720 - loss 0.02918873 - time (sec): 383.74 - samples/sec: 4933.64 - lr: 0.050000 +2023-04-06 15:57:19,760 epoch 99 - iter 2604/3720 - loss 0.02922697 - time (sec): 447.59 - samples/sec: 4935.96 - lr: 0.050000 +2023-04-06 15:58:23,155 epoch 99 - iter 2976/3720 - loss 0.02929975 - time (sec): 510.99 - samples/sec: 4937.80 - lr: 0.050000 +2023-04-06 15:59:27,525 epoch 99 - iter 3348/3720 - loss 0.02925750 - time (sec): 575.36 - samples/sec: 4931.22 - lr: 0.050000 +2023-04-06 16:00:31,230 epoch 99 - iter 3720/3720 - loss 0.02926185 - time (sec): 639.06 - samples/sec: 4931.77 - lr: 0.050000 +2023-04-06 16:00:31,230 ---------------------------------------------------------------------------------------------------- +2023-04-06 16:00:31,230 EPOCH 99 done: loss 0.0293 - lr 0.050000 +2023-04-06 16:00:31,231 BAD EPOCHS (no improvement): 0 +2023-04-06 16:00:31,234 ---------------------------------------------------------------------------------------------------- +2023-04-06 16:01:35,409 epoch 100 - iter 372/3720 - loss 0.02926741 - time (sec): 64.17 - samples/sec: 4891.41 - lr: 0.050000 +2023-04-06 16:02:38,622 epoch 100 - iter 744/3720 - loss 0.02886811 - time (sec): 127.39 - samples/sec: 4938.32 - lr: 0.050000 +2023-04-06 16:03:42,243 epoch 100 - iter 1116/3720 - loss 0.02903872 - time (sec): 191.01 - samples/sec: 4928.43 - lr: 0.050000 +2023-04-06 16:04:47,341 epoch 100 - iter 1488/3720 - loss 0.02897199 - time (sec): 256.11 - samples/sec: 4910.73 - lr: 0.050000 +2023-04-06 16:05:52,173 epoch 100 - iter 1860/3720 - loss 0.02898875 - time (sec): 320.94 - samples/sec: 4911.30 - lr: 0.050000 +2023-04-06 16:06:57,196 epoch 100 - iter 2232/3720 - loss 0.02908536 - time (sec): 385.96 - samples/sec: 4902.11 - lr: 0.050000 +2023-04-06 16:08:01,001 epoch 100 - iter 2604/3720 - loss 0.02905924 - time (sec): 449.77 - samples/sec: 4908.45 - lr: 0.050000 +2023-04-06 16:09:04,671 epoch 100 - iter 2976/3720 - loss 0.02908040 - time (sec): 513.44 - samples/sec: 4909.42 - lr: 0.050000 +2023-04-06 16:10:08,680 epoch 100 - iter 3348/3720 - loss 0.02912874 - time (sec): 577.45 - samples/sec: 4909.75 - lr: 0.050000 +2023-04-06 16:11:13,261 epoch 100 - iter 3720/3720 - loss 0.02917659 - time (sec): 642.03 - samples/sec: 4909.01 - lr: 0.050000 +2023-04-06 16:11:13,261 ---------------------------------------------------------------------------------------------------- +2023-04-06 16:11:13,261 EPOCH 100 done: loss 0.0292 - lr 0.050000 +2023-04-06 16:11:13,261 BAD EPOCHS (no improvement): 0 +2023-04-06 16:11:13,264 ---------------------------------------------------------------------------------------------------- +2023-04-06 16:12:16,908 epoch 101 - iter 372/3720 - loss 0.02868550 - time (sec): 63.64 - samples/sec: 4939.62 - lr: 0.050000 +2023-04-06 16:13:19,781 epoch 101 - iter 744/3720 - loss 0.02869803 - time (sec): 126.52 - samples/sec: 4977.98 - lr: 0.050000 +2023-04-06 16:14:23,407 epoch 101 - iter 1116/3720 - loss 0.02879305 - time (sec): 190.14 - samples/sec: 4968.58 - lr: 0.050000 +2023-04-06 16:15:26,705 epoch 101 - iter 1488/3720 - loss 0.02877063 - time (sec): 253.44 - samples/sec: 4962.77 - lr: 0.050000 +2023-04-06 16:16:31,576 epoch 101 - iter 1860/3720 - loss 0.02879079 - time (sec): 318.31 - samples/sec: 4948.32 - lr: 0.050000 +2023-04-06 16:17:34,756 epoch 101 - iter 2232/3720 - loss 0.02890731 - time (sec): 381.49 - samples/sec: 4952.85 - lr: 0.050000 +2023-04-06 16:18:38,963 epoch 101 - iter 2604/3720 - loss 0.02894713 - time (sec): 445.70 - samples/sec: 4949.01 - lr: 0.050000 +2023-04-06 16:19:42,548 epoch 101 - iter 2976/3720 - loss 0.02882801 - time (sec): 509.28 - samples/sec: 4951.83 - lr: 0.050000 +2023-04-06 16:20:45,613 epoch 101 - iter 3348/3720 - loss 0.02892971 - time (sec): 572.35 - samples/sec: 4956.44 - lr: 0.050000 +2023-04-06 16:21:48,377 epoch 101 - iter 3720/3720 - loss 0.02896954 - time (sec): 635.11 - samples/sec: 4962.44 - lr: 0.050000 +2023-04-06 16:21:48,378 ---------------------------------------------------------------------------------------------------- +2023-04-06 16:21:48,378 EPOCH 101 done: loss 0.0290 - lr 0.050000 +2023-04-06 16:21:48,378 BAD EPOCHS (no improvement): 0 +2023-04-06 16:21:48,381 ---------------------------------------------------------------------------------------------------- +2023-04-06 16:22:50,215 epoch 102 - iter 372/3720 - loss 0.02881203 - time (sec): 61.83 - samples/sec: 5072.57 - lr: 0.050000 +2023-04-06 16:23:52,864 epoch 102 - iter 744/3720 - loss 0.02944004 - time (sec): 124.48 - samples/sec: 5049.06 - lr: 0.050000 +2023-04-06 16:24:55,607 epoch 102 - iter 1116/3720 - loss 0.02928611 - time (sec): 187.23 - samples/sec: 5042.76 - lr: 0.050000 +2023-04-06 16:25:58,472 epoch 102 - iter 1488/3720 - loss 0.02928647 - time (sec): 250.09 - samples/sec: 5047.97 - lr: 0.050000 +2023-04-06 16:27:00,669 epoch 102 - iter 1860/3720 - loss 0.02933067 - time (sec): 312.29 - samples/sec: 5047.54 - lr: 0.050000 +2023-04-06 16:28:03,582 epoch 102 - iter 2232/3720 - loss 0.02924074 - time (sec): 375.20 - samples/sec: 5040.48 - lr: 0.050000 +2023-04-06 16:29:06,368 epoch 102 - iter 2604/3720 - loss 0.02923811 - time (sec): 437.99 - samples/sec: 5040.36 - lr: 0.050000 +2023-04-06 16:30:09,324 epoch 102 - iter 2976/3720 - loss 0.02921632 - time (sec): 500.94 - samples/sec: 5031.45 - lr: 0.050000 +2023-04-06 16:31:12,993 epoch 102 - iter 3348/3720 - loss 0.02929971 - time (sec): 564.61 - samples/sec: 5020.45 - lr: 0.050000 +2023-04-06 16:32:17,716 epoch 102 - iter 3720/3720 - loss 0.02929986 - time (sec): 629.34 - samples/sec: 5008.00 - lr: 0.050000 +2023-04-06 16:32:17,717 ---------------------------------------------------------------------------------------------------- +2023-04-06 16:32:17,717 EPOCH 102 done: loss 0.0293 - lr 0.050000 +2023-04-06 16:32:17,717 BAD EPOCHS (no improvement): 1 +2023-04-06 16:32:17,720 ---------------------------------------------------------------------------------------------------- +2023-04-06 16:33:21,203 epoch 103 - iter 372/3720 - loss 0.02976637 - time (sec): 63.48 - samples/sec: 4940.11 - lr: 0.050000 +2023-04-06 16:34:26,238 epoch 103 - iter 744/3720 - loss 0.02902686 - time (sec): 128.52 - samples/sec: 4916.39 - lr: 0.050000 +2023-04-06 16:35:30,502 epoch 103 - iter 1116/3720 - loss 0.02884190 - time (sec): 192.78 - samples/sec: 4923.55 - lr: 0.050000 +2023-04-06 16:36:34,348 epoch 103 - iter 1488/3720 - loss 0.02859953 - time (sec): 256.63 - samples/sec: 4923.70 - lr: 0.050000 +2023-04-06 16:37:39,158 epoch 103 - iter 1860/3720 - loss 0.02871555 - time (sec): 321.44 - samples/sec: 4916.14 - lr: 0.050000 +2023-04-06 16:38:43,747 epoch 103 - iter 2232/3720 - loss 0.02871976 - time (sec): 386.03 - samples/sec: 4915.45 - lr: 0.050000 +2023-04-06 16:39:46,948 epoch 103 - iter 2604/3720 - loss 0.02895213 - time (sec): 449.23 - samples/sec: 4918.80 - lr: 0.050000 +2023-04-06 16:40:51,473 epoch 103 - iter 2976/3720 - loss 0.02903915 - time (sec): 513.75 - samples/sec: 4910.60 - lr: 0.050000 +2023-04-06 16:41:56,334 epoch 103 - iter 3348/3720 - loss 0.02908869 - time (sec): 578.61 - samples/sec: 4905.48 - lr: 0.050000 +2023-04-06 16:42:59,655 epoch 103 - iter 3720/3720 - loss 0.02912004 - time (sec): 641.93 - samples/sec: 4909.71 - lr: 0.050000 +2023-04-06 16:42:59,655 ---------------------------------------------------------------------------------------------------- +2023-04-06 16:42:59,655 EPOCH 103 done: loss 0.0291 - lr 0.050000 +2023-04-06 16:42:59,655 BAD EPOCHS (no improvement): 2 +2023-04-06 16:42:59,659 ---------------------------------------------------------------------------------------------------- +2023-04-06 16:44:03,164 epoch 104 - iter 372/3720 - loss 0.02794056 - time (sec): 63.51 - samples/sec: 4940.25 - lr: 0.050000 +2023-04-06 16:45:07,071 epoch 104 - iter 744/3720 - loss 0.02836150 - time (sec): 127.41 - samples/sec: 4938.79 - lr: 0.050000 +2023-04-06 16:46:11,702 epoch 104 - iter 1116/3720 - loss 0.02825259 - time (sec): 192.04 - samples/sec: 4924.08 - lr: 0.050000 +2023-04-06 16:47:16,459 epoch 104 - iter 1488/3720 - loss 0.02828719 - time (sec): 256.80 - samples/sec: 4919.51 - lr: 0.050000 +2023-04-06 16:48:20,799 epoch 104 - iter 1860/3720 - loss 0.02850305 - time (sec): 321.14 - samples/sec: 4920.31 - lr: 0.050000 +2023-04-06 16:49:23,570 epoch 104 - iter 2232/3720 - loss 0.02876834 - time (sec): 383.91 - samples/sec: 4932.68 - lr: 0.050000 +2023-04-06 16:50:26,233 epoch 104 - iter 2604/3720 - loss 0.02885298 - time (sec): 446.57 - samples/sec: 4941.14 - lr: 0.050000 +2023-04-06 16:51:28,962 epoch 104 - iter 2976/3720 - loss 0.02894524 - time (sec): 509.30 - samples/sec: 4952.59 - lr: 0.050000 +2023-04-06 16:52:31,609 epoch 104 - iter 3348/3720 - loss 0.02896460 - time (sec): 571.95 - samples/sec: 4960.15 - lr: 0.050000 +2023-04-06 16:53:34,519 epoch 104 - iter 3720/3720 - loss 0.02897805 - time (sec): 634.86 - samples/sec: 4964.42 - lr: 0.050000 +2023-04-06 16:53:34,519 ---------------------------------------------------------------------------------------------------- +2023-04-06 16:53:34,519 EPOCH 104 done: loss 0.0290 - lr 0.050000 +2023-04-06 16:53:34,519 BAD EPOCHS (no improvement): 3 +2023-04-06 16:53:34,522 ---------------------------------------------------------------------------------------------------- +2023-04-06 16:54:37,908 epoch 105 - iter 372/3720 - loss 0.02848474 - time (sec): 63.39 - samples/sec: 5004.69 - lr: 0.050000 +2023-04-06 16:55:41,910 epoch 105 - iter 744/3720 - loss 0.02891930 - time (sec): 127.39 - samples/sec: 4959.30 - lr: 0.050000 +2023-04-06 16:56:45,614 epoch 105 - iter 1116/3720 - loss 0.02886648 - time (sec): 191.09 - samples/sec: 4952.09 - lr: 0.050000 +2023-04-06 16:57:49,847 epoch 105 - iter 1488/3720 - loss 0.02888613 - time (sec): 255.32 - samples/sec: 4943.68 - lr: 0.050000 +2023-04-06 16:58:53,006 epoch 105 - iter 1860/3720 - loss 0.02877241 - time (sec): 318.48 - samples/sec: 4952.26 - lr: 0.050000 +2023-04-06 16:59:55,569 epoch 105 - iter 2232/3720 - loss 0.02866175 - time (sec): 381.05 - samples/sec: 4960.30 - lr: 0.050000 +2023-04-06 17:01:00,023 epoch 105 - iter 2604/3720 - loss 0.02864414 - time (sec): 445.50 - samples/sec: 4957.09 - lr: 0.050000 +2023-04-06 17:02:03,781 epoch 105 - iter 2976/3720 - loss 0.02863500 - time (sec): 509.26 - samples/sec: 4953.44 - lr: 0.050000 +2023-04-06 17:03:08,218 epoch 105 - iter 3348/3720 - loss 0.02883981 - time (sec): 573.70 - samples/sec: 4948.87 - lr: 0.050000 +2023-04-06 17:04:11,931 epoch 105 - iter 3720/3720 - loss 0.02885578 - time (sec): 637.41 - samples/sec: 4944.57 - lr: 0.050000 +2023-04-06 17:04:11,931 ---------------------------------------------------------------------------------------------------- +2023-04-06 17:04:11,931 EPOCH 105 done: loss 0.0289 - lr 0.050000 +2023-04-06 17:04:11,931 BAD EPOCHS (no improvement): 0 +2023-04-06 17:04:11,934 ---------------------------------------------------------------------------------------------------- +2023-04-06 17:05:16,709 epoch 106 - iter 372/3720 - loss 0.02956074 - time (sec): 64.77 - samples/sec: 4910.20 - lr: 0.050000 +2023-04-06 17:06:20,970 epoch 106 - iter 744/3720 - loss 0.02964768 - time (sec): 129.04 - samples/sec: 4902.56 - lr: 0.050000 +2023-04-06 17:07:24,282 epoch 106 - iter 1116/3720 - loss 0.02933871 - time (sec): 192.35 - samples/sec: 4921.90 - lr: 0.050000 +2023-04-06 17:08:27,831 epoch 106 - iter 1488/3720 - loss 0.02917584 - time (sec): 255.90 - samples/sec: 4936.52 - lr: 0.050000 +2023-04-06 17:09:31,094 epoch 106 - iter 1860/3720 - loss 0.02921854 - time (sec): 319.16 - samples/sec: 4944.81 - lr: 0.050000 +2023-04-06 17:10:35,149 epoch 106 - iter 2232/3720 - loss 0.02913248 - time (sec): 383.21 - samples/sec: 4944.33 - lr: 0.050000 +2023-04-06 17:11:38,271 epoch 106 - iter 2604/3720 - loss 0.02899441 - time (sec): 446.34 - samples/sec: 4948.91 - lr: 0.050000 +2023-04-06 17:12:41,927 epoch 106 - iter 2976/3720 - loss 0.02900669 - time (sec): 509.99 - samples/sec: 4948.51 - lr: 0.050000 +2023-04-06 17:13:45,552 epoch 106 - iter 3348/3720 - loss 0.02900425 - time (sec): 573.62 - samples/sec: 4948.92 - lr: 0.050000 +2023-04-06 17:14:49,765 epoch 106 - iter 3720/3720 - loss 0.02890924 - time (sec): 637.83 - samples/sec: 4941.30 - lr: 0.050000 +2023-04-06 17:14:49,765 ---------------------------------------------------------------------------------------------------- +2023-04-06 17:14:49,765 EPOCH 106 done: loss 0.0289 - lr 0.050000 +2023-04-06 17:14:49,765 BAD EPOCHS (no improvement): 1 +2023-04-06 17:14:49,768 ---------------------------------------------------------------------------------------------------- +2023-04-06 17:15:53,842 epoch 107 - iter 372/3720 - loss 0.02800491 - time (sec): 64.07 - samples/sec: 4922.91 - lr: 0.050000 +2023-04-06 17:16:57,412 epoch 107 - iter 744/3720 - loss 0.02823637 - time (sec): 127.64 - samples/sec: 4953.94 - lr: 0.050000 +2023-04-06 17:18:01,167 epoch 107 - iter 1116/3720 - loss 0.02861287 - time (sec): 191.40 - samples/sec: 4941.07 - lr: 0.050000 +2023-04-06 17:19:04,321 epoch 107 - iter 1488/3720 - loss 0.02881320 - time (sec): 254.55 - samples/sec: 4950.35 - lr: 0.050000 +2023-04-06 17:20:07,174 epoch 107 - iter 1860/3720 - loss 0.02872406 - time (sec): 317.41 - samples/sec: 4970.37 - lr: 0.050000 +2023-04-06 17:21:08,908 epoch 107 - iter 2232/3720 - loss 0.02882268 - time (sec): 379.14 - samples/sec: 4983.42 - lr: 0.050000 +2023-04-06 17:22:12,336 epoch 107 - iter 2604/3720 - loss 0.02883334 - time (sec): 442.57 - samples/sec: 4990.61 - lr: 0.050000 +2023-04-06 17:23:14,935 epoch 107 - iter 2976/3720 - loss 0.02889807 - time (sec): 505.17 - samples/sec: 4997.02 - lr: 0.050000 +2023-04-06 17:24:18,198 epoch 107 - iter 3348/3720 - loss 0.02887444 - time (sec): 568.43 - samples/sec: 4996.30 - lr: 0.050000 +2023-04-06 17:25:20,301 epoch 107 - iter 3720/3720 - loss 0.02885701 - time (sec): 630.53 - samples/sec: 4998.50 - lr: 0.050000 +2023-04-06 17:25:20,301 ---------------------------------------------------------------------------------------------------- +2023-04-06 17:25:20,301 EPOCH 107 done: loss 0.0289 - lr 0.050000 +2023-04-06 17:25:20,301 BAD EPOCHS (no improvement): 2 +2023-04-06 17:25:20,304 ---------------------------------------------------------------------------------------------------- +2023-04-06 17:26:24,279 epoch 108 - iter 372/3720 - loss 0.02834232 - time (sec): 63.97 - samples/sec: 4943.86 - lr: 0.050000 +2023-04-06 17:27:28,148 epoch 108 - iter 744/3720 - loss 0.02839086 - time (sec): 127.84 - samples/sec: 4948.53 - lr: 0.050000 +2023-04-06 17:28:30,736 epoch 108 - iter 1116/3720 - loss 0.02874352 - time (sec): 190.43 - samples/sec: 4975.68 - lr: 0.050000 +2023-04-06 17:29:33,820 epoch 108 - iter 1488/3720 - loss 0.02865885 - time (sec): 253.52 - samples/sec: 4973.58 - lr: 0.050000 +2023-04-06 17:30:37,432 epoch 108 - iter 1860/3720 - loss 0.02861584 - time (sec): 317.13 - samples/sec: 4974.93 - lr: 0.050000 +2023-04-06 17:31:40,947 epoch 108 - iter 2232/3720 - loss 0.02873260 - time (sec): 380.64 - samples/sec: 4970.76 - lr: 0.050000 +2023-04-06 17:32:45,352 epoch 108 - iter 2604/3720 - loss 0.02887913 - time (sec): 445.05 - samples/sec: 4959.96 - lr: 0.050000 +2023-04-06 17:33:48,857 epoch 108 - iter 2976/3720 - loss 0.02884463 - time (sec): 508.55 - samples/sec: 4962.67 - lr: 0.050000 +2023-04-06 17:34:52,541 epoch 108 - iter 3348/3720 - loss 0.02882512 - time (sec): 572.24 - samples/sec: 4960.26 - lr: 0.050000 +2023-04-06 17:35:56,493 epoch 108 - iter 3720/3720 - loss 0.02876946 - time (sec): 636.19 - samples/sec: 4954.05 - lr: 0.050000 +2023-04-06 17:35:56,493 ---------------------------------------------------------------------------------------------------- +2023-04-06 17:35:56,493 EPOCH 108 done: loss 0.0288 - lr 0.050000 +2023-04-06 17:35:56,493 BAD EPOCHS (no improvement): 0 +2023-04-06 17:35:56,497 ---------------------------------------------------------------------------------------------------- +2023-04-06 17:37:00,572 epoch 109 - iter 372/3720 - loss 0.02841398 - time (sec): 64.08 - samples/sec: 4929.69 - lr: 0.050000 +2023-04-06 17:38:04,019 epoch 109 - iter 744/3720 - loss 0.02850382 - time (sec): 127.52 - samples/sec: 4930.02 - lr: 0.050000 +2023-04-06 17:39:07,991 epoch 109 - iter 1116/3720 - loss 0.02852396 - time (sec): 191.49 - samples/sec: 4924.26 - lr: 0.050000 +2023-04-06 17:40:11,467 epoch 109 - iter 1488/3720 - loss 0.02871293 - time (sec): 254.97 - samples/sec: 4932.80 - lr: 0.050000 +2023-04-06 17:41:15,598 epoch 109 - iter 1860/3720 - loss 0.02880669 - time (sec): 319.10 - samples/sec: 4924.26 - lr: 0.050000 +2023-04-06 17:42:19,664 epoch 109 - iter 2232/3720 - loss 0.02881068 - time (sec): 383.17 - samples/sec: 4923.89 - lr: 0.050000 +2023-04-06 17:43:24,228 epoch 109 - iter 2604/3720 - loss 0.02874266 - time (sec): 447.73 - samples/sec: 4923.06 - lr: 0.050000 +2023-04-06 17:44:28,013 epoch 109 - iter 2976/3720 - loss 0.02866993 - time (sec): 511.52 - samples/sec: 4926.17 - lr: 0.050000 +2023-04-06 17:45:32,387 epoch 109 - iter 3348/3720 - loss 0.02868024 - time (sec): 575.89 - samples/sec: 4924.73 - lr: 0.050000 +2023-04-06 17:46:35,281 epoch 109 - iter 3720/3720 - loss 0.02876157 - time (sec): 638.78 - samples/sec: 4933.93 - lr: 0.050000 +2023-04-06 17:46:35,281 ---------------------------------------------------------------------------------------------------- +2023-04-06 17:46:35,281 EPOCH 109 done: loss 0.0288 - lr 0.050000 +2023-04-06 17:46:35,281 BAD EPOCHS (no improvement): 0 +2023-04-06 17:46:35,284 ---------------------------------------------------------------------------------------------------- +2023-04-06 17:47:38,550 epoch 110 - iter 372/3720 - loss 0.02880920 - time (sec): 63.27 - samples/sec: 4986.03 - lr: 0.050000 +2023-04-06 17:48:41,087 epoch 110 - iter 744/3720 - loss 0.02851942 - time (sec): 125.80 - samples/sec: 5023.90 - lr: 0.050000 +2023-04-06 17:49:43,649 epoch 110 - iter 1116/3720 - loss 0.02866770 - time (sec): 188.37 - samples/sec: 5031.15 - lr: 0.050000 +2023-04-06 17:50:47,594 epoch 110 - iter 1488/3720 - loss 0.02865069 - time (sec): 252.31 - samples/sec: 5007.43 - lr: 0.050000 +2023-04-06 17:51:51,188 epoch 110 - iter 1860/3720 - loss 0.02875658 - time (sec): 315.90 - samples/sec: 4995.56 - lr: 0.050000 +2023-04-06 17:52:54,789 epoch 110 - iter 2232/3720 - loss 0.02890267 - time (sec): 379.51 - samples/sec: 4987.81 - lr: 0.050000 +2023-04-06 17:53:58,537 epoch 110 - iter 2604/3720 - loss 0.02886673 - time (sec): 443.25 - samples/sec: 4982.66 - lr: 0.050000 +2023-04-06 17:55:01,522 epoch 110 - iter 2976/3720 - loss 0.02893921 - time (sec): 506.24 - samples/sec: 4979.73 - lr: 0.050000 +2023-04-06 17:56:04,715 epoch 110 - iter 3348/3720 - loss 0.02887197 - time (sec): 569.43 - samples/sec: 4978.46 - lr: 0.050000 +2023-04-06 17:57:08,428 epoch 110 - iter 3720/3720 - loss 0.02879770 - time (sec): 633.14 - samples/sec: 4977.88 - lr: 0.050000 +2023-04-06 17:57:08,429 ---------------------------------------------------------------------------------------------------- +2023-04-06 17:57:08,429 EPOCH 110 done: loss 0.0288 - lr 0.050000 +2023-04-06 17:57:08,429 BAD EPOCHS (no improvement): 1 +2023-04-06 17:57:08,432 ---------------------------------------------------------------------------------------------------- +2023-04-06 17:58:12,516 epoch 111 - iter 372/3720 - loss 0.02936568 - time (sec): 64.08 - samples/sec: 4901.69 - lr: 0.050000 +2023-04-06 17:59:16,303 epoch 111 - iter 744/3720 - loss 0.02922799 - time (sec): 127.87 - samples/sec: 4923.93 - lr: 0.050000 +2023-04-06 18:00:19,984 epoch 111 - iter 1116/3720 - loss 0.02903980 - time (sec): 191.55 - samples/sec: 4933.88 - lr: 0.050000 +2023-04-06 18:01:23,853 epoch 111 - iter 1488/3720 - loss 0.02886305 - time (sec): 255.42 - samples/sec: 4937.56 - lr: 0.050000 +2023-04-06 18:02:26,911 epoch 111 - iter 1860/3720 - loss 0.02869059 - time (sec): 318.48 - samples/sec: 4949.74 - lr: 0.050000 +2023-04-06 18:03:30,898 epoch 111 - iter 2232/3720 - loss 0.02861122 - time (sec): 382.47 - samples/sec: 4949.67 - lr: 0.050000 +2023-04-06 18:04:34,183 epoch 111 - iter 2604/3720 - loss 0.02857775 - time (sec): 445.75 - samples/sec: 4957.08 - lr: 0.050000 +2023-04-06 18:05:37,359 epoch 111 - iter 2976/3720 - loss 0.02851697 - time (sec): 508.93 - samples/sec: 4959.08 - lr: 0.050000 +2023-04-06 18:06:40,417 epoch 111 - iter 3348/3720 - loss 0.02854522 - time (sec): 571.99 - samples/sec: 4962.24 - lr: 0.050000 +2023-04-06 18:07:43,144 epoch 111 - iter 3720/3720 - loss 0.02853782 - time (sec): 634.71 - samples/sec: 4965.58 - lr: 0.050000 +2023-04-06 18:07:43,144 ---------------------------------------------------------------------------------------------------- +2023-04-06 18:07:43,144 EPOCH 111 done: loss 0.0285 - lr 0.050000 +2023-04-06 18:07:43,144 BAD EPOCHS (no improvement): 0 +2023-04-06 18:07:43,148 ---------------------------------------------------------------------------------------------------- +2023-04-06 18:08:46,599 epoch 112 - iter 372/3720 - loss 0.02813126 - time (sec): 63.45 - samples/sec: 4954.53 - lr: 0.050000 +2023-04-06 18:09:50,216 epoch 112 - iter 744/3720 - loss 0.02845559 - time (sec): 127.07 - samples/sec: 4945.79 - lr: 0.050000 +2023-04-06 18:10:53,807 epoch 112 - iter 1116/3720 - loss 0.02883468 - time (sec): 190.66 - samples/sec: 4958.64 - lr: 0.050000 +2023-04-06 18:11:56,054 epoch 112 - iter 1488/3720 - loss 0.02885031 - time (sec): 252.91 - samples/sec: 4981.53 - lr: 0.050000 +2023-04-06 18:12:59,597 epoch 112 - iter 1860/3720 - loss 0.02889557 - time (sec): 316.45 - samples/sec: 4978.80 - lr: 0.050000 +2023-04-06 18:14:02,666 epoch 112 - iter 2232/3720 - loss 0.02903618 - time (sec): 379.52 - samples/sec: 4981.14 - lr: 0.050000 +2023-04-06 18:15:06,074 epoch 112 - iter 2604/3720 - loss 0.02892502 - time (sec): 442.93 - samples/sec: 4979.15 - lr: 0.050000 +2023-04-06 18:16:10,092 epoch 112 - iter 2976/3720 - loss 0.02892389 - time (sec): 506.94 - samples/sec: 4973.78 - lr: 0.050000 +2023-04-06 18:17:12,681 epoch 112 - iter 3348/3720 - loss 0.02894698 - time (sec): 569.53 - samples/sec: 4977.99 - lr: 0.050000 +2023-04-06 18:18:15,880 epoch 112 - iter 3720/3720 - loss 0.02887480 - time (sec): 632.73 - samples/sec: 4981.11 - lr: 0.050000 +2023-04-06 18:18:15,880 ---------------------------------------------------------------------------------------------------- +2023-04-06 18:18:15,880 EPOCH 112 done: loss 0.0289 - lr 0.050000 +2023-04-06 18:18:15,881 BAD EPOCHS (no improvement): 1 +2023-04-06 18:18:15,884 ---------------------------------------------------------------------------------------------------- +2023-04-06 18:19:18,187 epoch 113 - iter 372/3720 - loss 0.02880723 - time (sec): 62.30 - samples/sec: 5060.44 - lr: 0.050000 +2023-04-06 18:20:20,784 epoch 113 - iter 744/3720 - loss 0.02876553 - time (sec): 124.90 - samples/sec: 5052.58 - lr: 0.050000 +2023-04-06 18:21:23,750 epoch 113 - iter 1116/3720 - loss 0.02897645 - time (sec): 187.87 - samples/sec: 5034.04 - lr: 0.050000 +2023-04-06 18:22:27,003 epoch 113 - iter 1488/3720 - loss 0.02887117 - time (sec): 251.12 - samples/sec: 5011.98 - lr: 0.050000 +2023-04-06 18:23:31,298 epoch 113 - iter 1860/3720 - loss 0.02877149 - time (sec): 315.41 - samples/sec: 4997.95 - lr: 0.050000 +2023-04-06 18:24:35,282 epoch 113 - iter 2232/3720 - loss 0.02885075 - time (sec): 379.40 - samples/sec: 4984.55 - lr: 0.050000 +2023-04-06 18:25:39,092 epoch 113 - iter 2604/3720 - loss 0.02885398 - time (sec): 443.21 - samples/sec: 4976.09 - lr: 0.050000 +2023-04-06 18:26:43,751 epoch 113 - iter 2976/3720 - loss 0.02884556 - time (sec): 507.87 - samples/sec: 4962.23 - lr: 0.050000 +2023-04-06 18:27:47,317 epoch 113 - iter 3348/3720 - loss 0.02883566 - time (sec): 571.43 - samples/sec: 4964.05 - lr: 0.050000 +2023-04-06 18:28:51,157 epoch 113 - iter 3720/3720 - loss 0.02883942 - time (sec): 635.27 - samples/sec: 4961.20 - lr: 0.050000 +2023-04-06 18:28:51,157 ---------------------------------------------------------------------------------------------------- +2023-04-06 18:28:51,157 EPOCH 113 done: loss 0.0288 - lr 0.050000 +2023-04-06 18:28:51,157 BAD EPOCHS (no improvement): 2 +2023-04-06 18:28:51,160 ---------------------------------------------------------------------------------------------------- +2023-04-06 18:29:54,191 epoch 114 - iter 372/3720 - loss 0.02825922 - time (sec): 63.03 - samples/sec: 4952.07 - lr: 0.050000 +2023-04-06 18:30:57,550 epoch 114 - iter 744/3720 - loss 0.02827768 - time (sec): 126.39 - samples/sec: 4955.43 - lr: 0.050000 +2023-04-06 18:32:02,440 epoch 114 - iter 1116/3720 - loss 0.02832827 - time (sec): 191.28 - samples/sec: 4940.26 - lr: 0.050000 +2023-04-06 18:33:07,304 epoch 114 - iter 1488/3720 - loss 0.02853831 - time (sec): 256.14 - samples/sec: 4926.31 - lr: 0.050000 +2023-04-06 18:34:11,156 epoch 114 - iter 1860/3720 - loss 0.02855166 - time (sec): 320.00 - samples/sec: 4933.45 - lr: 0.050000 +2023-04-06 18:35:13,342 epoch 114 - iter 2232/3720 - loss 0.02859716 - time (sec): 382.18 - samples/sec: 4954.20 - lr: 0.050000 +2023-04-06 18:36:16,232 epoch 114 - iter 2604/3720 - loss 0.02862590 - time (sec): 445.07 - samples/sec: 4962.55 - lr: 0.050000 +2023-04-06 18:37:19,883 epoch 114 - iter 2976/3720 - loss 0.02860909 - time (sec): 508.72 - samples/sec: 4962.97 - lr: 0.050000 +2023-04-06 18:38:23,770 epoch 114 - iter 3348/3720 - loss 0.02871705 - time (sec): 572.61 - samples/sec: 4956.31 - lr: 0.050000 +2023-04-06 18:39:26,389 epoch 114 - iter 3720/3720 - loss 0.02871430 - time (sec): 635.23 - samples/sec: 4961.54 - lr: 0.050000 +2023-04-06 18:39:26,389 ---------------------------------------------------------------------------------------------------- +2023-04-06 18:39:26,389 EPOCH 114 done: loss 0.0287 - lr 0.050000 +2023-04-06 18:39:26,389 BAD EPOCHS (no improvement): 3 +2023-04-06 18:39:26,392 ---------------------------------------------------------------------------------------------------- +2023-04-06 18:40:29,860 epoch 115 - iter 372/3720 - loss 0.02911821 - time (sec): 63.47 - samples/sec: 4927.30 - lr: 0.050000 +2023-04-06 18:41:33,450 epoch 115 - iter 744/3720 - loss 0.02882231 - time (sec): 127.06 - samples/sec: 4941.74 - lr: 0.050000 +2023-04-06 18:42:37,355 epoch 115 - iter 1116/3720 - loss 0.02867095 - time (sec): 190.96 - samples/sec: 4947.90 - lr: 0.050000 +2023-04-06 18:43:41,391 epoch 115 - iter 1488/3720 - loss 0.02861315 - time (sec): 255.00 - samples/sec: 4942.20 - lr: 0.050000 +2023-04-06 18:44:44,772 epoch 115 - iter 1860/3720 - loss 0.02848779 - time (sec): 318.38 - samples/sec: 4944.27 - lr: 0.050000 +2023-04-06 18:45:49,487 epoch 115 - iter 2232/3720 - loss 0.02855081 - time (sec): 383.09 - samples/sec: 4935.84 - lr: 0.050000 +2023-04-06 18:46:53,533 epoch 115 - iter 2604/3720 - loss 0.02856081 - time (sec): 447.14 - samples/sec: 4935.65 - lr: 0.050000 +2023-04-06 18:47:56,484 epoch 115 - iter 2976/3720 - loss 0.02863237 - time (sec): 510.09 - samples/sec: 4944.03 - lr: 0.050000 +2023-04-06 18:49:00,712 epoch 115 - iter 3348/3720 - loss 0.02869631 - time (sec): 574.32 - samples/sec: 4939.07 - lr: 0.050000 +2023-04-06 18:50:04,554 epoch 115 - iter 3720/3720 - loss 0.02869026 - time (sec): 638.16 - samples/sec: 4938.74 - lr: 0.050000 +2023-04-06 18:50:04,554 ---------------------------------------------------------------------------------------------------- +2023-04-06 18:50:04,554 EPOCH 115 done: loss 0.0287 - lr 0.050000 +2023-04-06 18:50:04,554 Epoch 115: reducing learning rate of group 0 to 2.5000e-02. +2023-04-06 18:50:04,554 BAD EPOCHS (no improvement): 4 +2023-04-06 18:50:04,557 ---------------------------------------------------------------------------------------------------- +2023-04-06 18:51:07,957 epoch 116 - iter 372/3720 - loss 0.02821545 - time (sec): 63.40 - samples/sec: 4960.45 - lr: 0.025000 +2023-04-06 18:52:12,265 epoch 116 - iter 744/3720 - loss 0.02796080 - time (sec): 127.71 - samples/sec: 4930.76 - lr: 0.025000 +2023-04-06 18:53:16,249 epoch 116 - iter 1116/3720 - loss 0.02784636 - time (sec): 191.69 - samples/sec: 4923.98 - lr: 0.025000 +2023-04-06 18:54:20,407 epoch 116 - iter 1488/3720 - loss 0.02793204 - time (sec): 255.85 - samples/sec: 4934.67 - lr: 0.025000 +2023-04-06 18:55:24,127 epoch 116 - iter 1860/3720 - loss 0.02790313 - time (sec): 319.57 - samples/sec: 4934.35 - lr: 0.025000 +2023-04-06 18:56:26,817 epoch 116 - iter 2232/3720 - loss 0.02773606 - time (sec): 382.26 - samples/sec: 4950.67 - lr: 0.025000 +2023-04-06 18:57:29,417 epoch 116 - iter 2604/3720 - loss 0.02764451 - time (sec): 444.86 - samples/sec: 4963.13 - lr: 0.025000 +2023-04-06 18:58:31,527 epoch 116 - iter 2976/3720 - loss 0.02765926 - time (sec): 506.97 - samples/sec: 4974.90 - lr: 0.025000 +2023-04-06 18:59:34,328 epoch 116 - iter 3348/3720 - loss 0.02768845 - time (sec): 569.77 - samples/sec: 4980.06 - lr: 0.025000 +2023-04-06 19:00:36,591 epoch 116 - iter 3720/3720 - loss 0.02772749 - time (sec): 632.03 - samples/sec: 4986.62 - lr: 0.025000 +2023-04-06 19:00:36,592 ---------------------------------------------------------------------------------------------------- +2023-04-06 19:00:36,592 EPOCH 116 done: loss 0.0277 - lr 0.025000 +2023-04-06 19:00:36,592 BAD EPOCHS (no improvement): 0 +2023-04-06 19:00:36,595 ---------------------------------------------------------------------------------------------------- +2023-04-06 19:01:38,677 epoch 117 - iter 372/3720 - loss 0.02675697 - time (sec): 62.08 - samples/sec: 5051.78 - lr: 0.025000 +2023-04-06 19:02:41,867 epoch 117 - iter 744/3720 - loss 0.02663327 - time (sec): 125.27 - samples/sec: 5015.39 - lr: 0.025000 +2023-04-06 19:03:45,084 epoch 117 - iter 1116/3720 - loss 0.02706868 - time (sec): 188.49 - samples/sec: 5008.26 - lr: 0.025000 +2023-04-06 19:04:48,764 epoch 117 - iter 1488/3720 - loss 0.02706415 - time (sec): 252.17 - samples/sec: 5003.54 - lr: 0.025000 +2023-04-06 19:05:50,662 epoch 117 - iter 1860/3720 - loss 0.02719994 - time (sec): 314.07 - samples/sec: 5013.20 - lr: 0.025000 +2023-04-06 19:06:53,396 epoch 117 - iter 2232/3720 - loss 0.02713182 - time (sec): 376.80 - samples/sec: 5012.63 - lr: 0.025000 +2023-04-06 19:07:57,352 epoch 117 - iter 2604/3720 - loss 0.02707887 - time (sec): 440.76 - samples/sec: 5006.54 - lr: 0.025000 +2023-04-06 19:08:59,908 epoch 117 - iter 2976/3720 - loss 0.02710851 - time (sec): 503.31 - samples/sec: 5005.35 - lr: 0.025000 +2023-04-06 19:10:02,971 epoch 117 - iter 3348/3720 - loss 0.02721646 - time (sec): 566.38 - samples/sec: 5004.31 - lr: 0.025000 +2023-04-06 19:11:07,259 epoch 117 - iter 3720/3720 - loss 0.02713624 - time (sec): 630.66 - samples/sec: 4997.45 - lr: 0.025000 +2023-04-06 19:11:07,259 ---------------------------------------------------------------------------------------------------- +2023-04-06 19:11:07,259 EPOCH 117 done: loss 0.0271 - lr 0.025000 +2023-04-06 19:11:07,259 BAD EPOCHS (no improvement): 0 +2023-04-06 19:11:07,263 ---------------------------------------------------------------------------------------------------- +2023-04-06 19:12:10,966 epoch 118 - iter 372/3720 - loss 0.02669724 - time (sec): 63.70 - samples/sec: 4937.62 - lr: 0.025000 +2023-04-06 19:13:14,278 epoch 118 - iter 744/3720 - loss 0.02721880 - time (sec): 127.02 - samples/sec: 4945.51 - lr: 0.025000 +2023-04-06 19:14:19,061 epoch 118 - iter 1116/3720 - loss 0.02706087 - time (sec): 191.80 - samples/sec: 4920.94 - lr: 0.025000 +2023-04-06 19:15:21,193 epoch 118 - iter 1488/3720 - loss 0.02716530 - time (sec): 253.93 - samples/sec: 4945.84 - lr: 0.025000 +2023-04-06 19:16:25,556 epoch 118 - iter 1860/3720 - loss 0.02716783 - time (sec): 318.29 - samples/sec: 4945.42 - lr: 0.025000 +2023-04-06 19:17:29,322 epoch 118 - iter 2232/3720 - loss 0.02706879 - time (sec): 382.06 - samples/sec: 4947.43 - lr: 0.025000 +2023-04-06 19:18:34,509 epoch 118 - iter 2604/3720 - loss 0.02708168 - time (sec): 447.25 - samples/sec: 4934.76 - lr: 0.025000 +2023-04-06 19:19:38,213 epoch 118 - iter 2976/3720 - loss 0.02703912 - time (sec): 510.95 - samples/sec: 4937.91 - lr: 0.025000 +2023-04-06 19:20:41,819 epoch 118 - iter 3348/3720 - loss 0.02707908 - time (sec): 574.56 - samples/sec: 4938.99 - lr: 0.025000 +2023-04-06 19:21:45,197 epoch 118 - iter 3720/3720 - loss 0.02702579 - time (sec): 637.93 - samples/sec: 4940.50 - lr: 0.025000 +2023-04-06 19:21:45,197 ---------------------------------------------------------------------------------------------------- +2023-04-06 19:21:45,197 EPOCH 118 done: loss 0.0270 - lr 0.025000 +2023-04-06 19:21:45,197 BAD EPOCHS (no improvement): 0 +2023-04-06 19:21:45,200 ---------------------------------------------------------------------------------------------------- +2023-04-06 19:22:48,238 epoch 119 - iter 372/3720 - loss 0.02718127 - time (sec): 63.04 - samples/sec: 5003.14 - lr: 0.025000 +2023-04-06 19:23:50,912 epoch 119 - iter 744/3720 - loss 0.02726518 - time (sec): 125.71 - samples/sec: 4994.01 - lr: 0.025000 +2023-04-06 19:24:54,097 epoch 119 - iter 1116/3720 - loss 0.02701256 - time (sec): 188.90 - samples/sec: 4997.19 - lr: 0.025000 +2023-04-06 19:25:56,821 epoch 119 - iter 1488/3720 - loss 0.02697041 - time (sec): 251.62 - samples/sec: 4998.53 - lr: 0.025000 +2023-04-06 19:26:58,741 epoch 119 - iter 1860/3720 - loss 0.02697449 - time (sec): 313.54 - samples/sec: 5009.34 - lr: 0.025000 +2023-04-06 19:28:02,318 epoch 119 - iter 2232/3720 - loss 0.02707016 - time (sec): 377.12 - samples/sec: 5001.18 - lr: 0.025000 +2023-04-06 19:29:05,727 epoch 119 - iter 2604/3720 - loss 0.02701127 - time (sec): 440.53 - samples/sec: 4996.73 - lr: 0.025000 +2023-04-06 19:30:10,360 epoch 119 - iter 2976/3720 - loss 0.02697199 - time (sec): 505.16 - samples/sec: 4983.04 - lr: 0.025000 +2023-04-06 19:31:14,922 epoch 119 - iter 3348/3720 - loss 0.02700429 - time (sec): 569.72 - samples/sec: 4975.14 - lr: 0.025000 +2023-04-06 19:32:19,639 epoch 119 - iter 3720/3720 - loss 0.02696087 - time (sec): 634.44 - samples/sec: 4967.72 - lr: 0.025000 +2023-04-06 19:32:19,639 ---------------------------------------------------------------------------------------------------- +2023-04-06 19:32:19,639 EPOCH 119 done: loss 0.0270 - lr 0.025000 +2023-04-06 19:32:19,639 BAD EPOCHS (no improvement): 0 +2023-04-06 19:32:19,642 ---------------------------------------------------------------------------------------------------- +2023-04-06 19:33:23,815 epoch 120 - iter 372/3720 - loss 0.02680386 - time (sec): 64.17 - samples/sec: 4922.23 - lr: 0.025000 +2023-04-06 19:34:27,141 epoch 120 - iter 744/3720 - loss 0.02695026 - time (sec): 127.50 - samples/sec: 4940.91 - lr: 0.025000 +2023-04-06 19:35:29,995 epoch 120 - iter 1116/3720 - loss 0.02687993 - time (sec): 190.35 - samples/sec: 4961.80 - lr: 0.025000 +2023-04-06 19:36:34,191 epoch 120 - iter 1488/3720 - loss 0.02712338 - time (sec): 254.55 - samples/sec: 4956.47 - lr: 0.025000 +2023-04-06 19:37:38,294 epoch 120 - iter 1860/3720 - loss 0.02702479 - time (sec): 318.65 - samples/sec: 4944.56 - lr: 0.025000 +2023-04-06 19:38:41,655 epoch 120 - iter 2232/3720 - loss 0.02690621 - time (sec): 382.01 - samples/sec: 4949.55 - lr: 0.025000 +2023-04-06 19:39:45,334 epoch 120 - iter 2604/3720 - loss 0.02694464 - time (sec): 445.69 - samples/sec: 4947.86 - lr: 0.025000 +2023-04-06 19:40:48,440 epoch 120 - iter 2976/3720 - loss 0.02695253 - time (sec): 508.80 - samples/sec: 4949.23 - lr: 0.025000 +2023-04-06 19:41:52,934 epoch 120 - iter 3348/3720 - loss 0.02695106 - time (sec): 573.29 - samples/sec: 4946.11 - lr: 0.025000 +2023-04-06 19:42:56,744 epoch 120 - iter 3720/3720 - loss 0.02691680 - time (sec): 637.10 - samples/sec: 4946.96 - lr: 0.025000 +2023-04-06 19:42:56,744 ---------------------------------------------------------------------------------------------------- +2023-04-06 19:42:56,744 EPOCH 120 done: loss 0.0269 - lr 0.025000 +2023-04-06 19:42:56,744 BAD EPOCHS (no improvement): 0 +2023-04-06 19:42:56,747 ---------------------------------------------------------------------------------------------------- +2023-04-06 19:44:00,181 epoch 121 - iter 372/3720 - loss 0.02731040 - time (sec): 63.43 - samples/sec: 4975.67 - lr: 0.025000 +2023-04-06 19:45:03,502 epoch 121 - iter 744/3720 - loss 0.02731590 - time (sec): 126.76 - samples/sec: 4993.30 - lr: 0.025000 +2023-04-06 19:46:08,061 epoch 121 - iter 1116/3720 - loss 0.02689033 - time (sec): 191.31 - samples/sec: 4955.16 - lr: 0.025000 +2023-04-06 19:47:12,064 epoch 121 - iter 1488/3720 - loss 0.02672188 - time (sec): 255.32 - samples/sec: 4944.92 - lr: 0.025000 +2023-04-06 19:48:15,567 epoch 121 - iter 1860/3720 - loss 0.02666091 - time (sec): 318.82 - samples/sec: 4945.28 - lr: 0.025000 +2023-04-06 19:49:19,854 epoch 121 - iter 2232/3720 - loss 0.02663124 - time (sec): 383.11 - samples/sec: 4937.49 - lr: 0.025000 +2023-04-06 19:50:23,225 epoch 121 - iter 2604/3720 - loss 0.02671111 - time (sec): 446.48 - samples/sec: 4940.58 - lr: 0.025000 +2023-04-06 19:51:26,327 epoch 121 - iter 2976/3720 - loss 0.02669765 - time (sec): 509.58 - samples/sec: 4947.35 - lr: 0.025000 +2023-04-06 19:52:29,926 epoch 121 - iter 3348/3720 - loss 0.02670859 - time (sec): 573.18 - samples/sec: 4948.39 - lr: 0.025000 +2023-04-06 19:53:33,415 epoch 121 - iter 3720/3720 - loss 0.02670706 - time (sec): 636.67 - samples/sec: 4950.33 - lr: 0.025000 +2023-04-06 19:53:33,415 ---------------------------------------------------------------------------------------------------- +2023-04-06 19:53:33,415 EPOCH 121 done: loss 0.0267 - lr 0.025000 +2023-04-06 19:53:33,415 BAD EPOCHS (no improvement): 0 +2023-04-06 19:53:33,419 ---------------------------------------------------------------------------------------------------- +2023-04-06 19:54:37,754 epoch 122 - iter 372/3720 - loss 0.02598740 - time (sec): 64.34 - samples/sec: 4905.80 - lr: 0.025000 +2023-04-06 19:55:42,681 epoch 122 - iter 744/3720 - loss 0.02656373 - time (sec): 129.26 - samples/sec: 4897.77 - lr: 0.025000 +2023-04-06 19:56:45,612 epoch 122 - iter 1116/3720 - loss 0.02656848 - time (sec): 192.19 - samples/sec: 4931.86 - lr: 0.025000 +2023-04-06 19:57:48,664 epoch 122 - iter 1488/3720 - loss 0.02669494 - time (sec): 255.25 - samples/sec: 4950.96 - lr: 0.025000 +2023-04-06 19:58:52,574 epoch 122 - iter 1860/3720 - loss 0.02665255 - time (sec): 319.16 - samples/sec: 4939.30 - lr: 0.025000 +2023-04-06 19:59:55,997 epoch 122 - iter 2232/3720 - loss 0.02664812 - time (sec): 382.58 - samples/sec: 4940.88 - lr: 0.025000 +2023-04-06 20:00:59,794 epoch 122 - iter 2604/3720 - loss 0.02669736 - time (sec): 446.38 - samples/sec: 4942.45 - lr: 0.025000 +2023-04-06 20:02:03,761 epoch 122 - iter 2976/3720 - loss 0.02676921 - time (sec): 510.34 - samples/sec: 4943.11 - lr: 0.025000 +2023-04-06 20:03:07,085 epoch 122 - iter 3348/3720 - loss 0.02673274 - time (sec): 573.67 - samples/sec: 4945.82 - lr: 0.025000 +2023-04-06 20:04:10,240 epoch 122 - iter 3720/3720 - loss 0.02670126 - time (sec): 636.82 - samples/sec: 4949.13 - lr: 0.025000 +2023-04-06 20:04:10,240 ---------------------------------------------------------------------------------------------------- +2023-04-06 20:04:10,240 EPOCH 122 done: loss 0.0267 - lr 0.025000 +2023-04-06 20:04:10,240 BAD EPOCHS (no improvement): 0 +2023-04-06 20:04:10,245 ---------------------------------------------------------------------------------------------------- +2023-04-06 20:05:12,932 epoch 123 - iter 372/3720 - loss 0.02653286 - time (sec): 62.69 - samples/sec: 5036.53 - lr: 0.025000 +2023-04-06 20:06:15,120 epoch 123 - iter 744/3720 - loss 0.02689535 - time (sec): 124.88 - samples/sec: 5041.14 - lr: 0.025000 +2023-04-06 20:07:18,745 epoch 123 - iter 1116/3720 - loss 0.02664607 - time (sec): 188.50 - samples/sec: 5013.66 - lr: 0.025000 +2023-04-06 20:08:22,419 epoch 123 - iter 1488/3720 - loss 0.02660883 - time (sec): 252.17 - samples/sec: 5008.11 - lr: 0.025000 +2023-04-06 20:09:25,423 epoch 123 - iter 1860/3720 - loss 0.02656737 - time (sec): 315.18 - samples/sec: 5001.03 - lr: 0.025000 +2023-04-06 20:10:29,678 epoch 123 - iter 2232/3720 - loss 0.02659796 - time (sec): 379.43 - samples/sec: 4988.49 - lr: 0.025000 +2023-04-06 20:11:32,277 epoch 123 - iter 2604/3720 - loss 0.02662924 - time (sec): 442.03 - samples/sec: 4996.37 - lr: 0.025000 +2023-04-06 20:12:35,036 epoch 123 - iter 2976/3720 - loss 0.02662029 - time (sec): 504.79 - samples/sec: 4998.47 - lr: 0.025000 +2023-04-06 20:13:38,977 epoch 123 - iter 3348/3720 - loss 0.02656031 - time (sec): 568.73 - samples/sec: 4991.21 - lr: 0.025000 +2023-04-06 20:14:42,417 epoch 123 - iter 3720/3720 - loss 0.02662917 - time (sec): 632.17 - samples/sec: 4985.53 - lr: 0.025000 +2023-04-06 20:14:42,417 ---------------------------------------------------------------------------------------------------- +2023-04-06 20:14:42,417 EPOCH 123 done: loss 0.0266 - lr 0.025000 +2023-04-06 20:14:42,417 BAD EPOCHS (no improvement): 0 +2023-04-06 20:14:42,420 ---------------------------------------------------------------------------------------------------- +2023-04-06 20:15:45,805 epoch 124 - iter 372/3720 - loss 0.02646290 - time (sec): 63.38 - samples/sec: 4951.31 - lr: 0.025000 +2023-04-06 20:16:49,805 epoch 124 - iter 744/3720 - loss 0.02640494 - time (sec): 127.38 - samples/sec: 4934.70 - lr: 0.025000 +2023-04-06 20:17:53,126 epoch 124 - iter 1116/3720 - loss 0.02628842 - time (sec): 190.71 - samples/sec: 4954.98 - lr: 0.025000 +2023-04-06 20:18:55,135 epoch 124 - iter 1488/3720 - loss 0.02636300 - time (sec): 252.71 - samples/sec: 4989.83 - lr: 0.025000 +2023-04-06 20:19:56,619 epoch 124 - iter 1860/3720 - loss 0.02630184 - time (sec): 314.20 - samples/sec: 5008.32 - lr: 0.025000 +2023-04-06 20:20:59,211 epoch 124 - iter 2232/3720 - loss 0.02626940 - time (sec): 376.79 - samples/sec: 5016.94 - lr: 0.025000 +2023-04-06 20:22:01,999 epoch 124 - iter 2604/3720 - loss 0.02638424 - time (sec): 439.58 - samples/sec: 5015.96 - lr: 0.025000 +2023-04-06 20:23:04,829 epoch 124 - iter 2976/3720 - loss 0.02649910 - time (sec): 502.41 - samples/sec: 5018.66 - lr: 0.025000 +2023-04-06 20:24:07,211 epoch 124 - iter 3348/3720 - loss 0.02653918 - time (sec): 564.79 - samples/sec: 5023.01 - lr: 0.025000 +2023-04-06 20:25:11,504 epoch 124 - iter 3720/3720 - loss 0.02663640 - time (sec): 629.08 - samples/sec: 5010.00 - lr: 0.025000 +2023-04-06 20:25:11,505 ---------------------------------------------------------------------------------------------------- +2023-04-06 20:25:11,505 EPOCH 124 done: loss 0.0266 - lr 0.025000 +2023-04-06 20:25:11,505 BAD EPOCHS (no improvement): 1 +2023-04-06 20:25:11,508 ---------------------------------------------------------------------------------------------------- +2023-04-06 20:26:15,531 epoch 125 - iter 372/3720 - loss 0.02534478 - time (sec): 64.02 - samples/sec: 4932.33 - lr: 0.025000 +2023-04-06 20:27:19,395 epoch 125 - iter 744/3720 - loss 0.02581998 - time (sec): 127.89 - samples/sec: 4926.68 - lr: 0.025000 +2023-04-06 20:28:23,262 epoch 125 - iter 1116/3720 - loss 0.02624280 - time (sec): 191.75 - samples/sec: 4932.38 - lr: 0.025000 +2023-04-06 20:29:26,429 epoch 125 - iter 1488/3720 - loss 0.02628706 - time (sec): 254.92 - samples/sec: 4947.10 - lr: 0.025000 +2023-04-06 20:30:30,237 epoch 125 - iter 1860/3720 - loss 0.02624753 - time (sec): 318.73 - samples/sec: 4945.07 - lr: 0.025000 +2023-04-06 20:31:34,859 epoch 125 - iter 2232/3720 - loss 0.02628655 - time (sec): 383.35 - samples/sec: 4939.29 - lr: 0.025000 +2023-04-06 20:32:38,569 epoch 125 - iter 2604/3720 - loss 0.02633956 - time (sec): 447.06 - samples/sec: 4933.77 - lr: 0.025000 +2023-04-06 20:33:42,777 epoch 125 - iter 2976/3720 - loss 0.02634226 - time (sec): 511.27 - samples/sec: 4930.17 - lr: 0.025000 +2023-04-06 20:34:46,447 epoch 125 - iter 3348/3720 - loss 0.02642968 - time (sec): 574.94 - samples/sec: 4932.09 - lr: 0.025000 +2023-04-06 20:35:51,005 epoch 125 - iter 3720/3720 - loss 0.02641503 - time (sec): 639.50 - samples/sec: 4928.42 - lr: 0.025000 +2023-04-06 20:35:51,005 ---------------------------------------------------------------------------------------------------- +2023-04-06 20:35:51,005 EPOCH 125 done: loss 0.0264 - lr 0.025000 +2023-04-06 20:35:51,005 BAD EPOCHS (no improvement): 0 +2023-04-06 20:35:51,009 ---------------------------------------------------------------------------------------------------- +2023-04-06 20:36:55,001 epoch 126 - iter 372/3720 - loss 0.02531438 - time (sec): 63.99 - samples/sec: 4911.63 - lr: 0.025000 +2023-04-06 20:37:58,546 epoch 126 - iter 744/3720 - loss 0.02554386 - time (sec): 127.54 - samples/sec: 4928.08 - lr: 0.025000 +2023-04-06 20:39:02,530 epoch 126 - iter 1116/3720 - loss 0.02568486 - time (sec): 191.52 - samples/sec: 4926.48 - lr: 0.025000 +2023-04-06 20:40:06,252 epoch 126 - iter 1488/3720 - loss 0.02567360 - time (sec): 255.24 - samples/sec: 4930.82 - lr: 0.025000 +2023-04-06 20:41:08,786 epoch 126 - iter 1860/3720 - loss 0.02587454 - time (sec): 317.78 - samples/sec: 4952.65 - lr: 0.025000 +2023-04-06 20:42:11,901 epoch 126 - iter 2232/3720 - loss 0.02600226 - time (sec): 380.89 - samples/sec: 4964.09 - lr: 0.025000 +2023-04-06 20:43:14,515 epoch 126 - iter 2604/3720 - loss 0.02608638 - time (sec): 443.51 - samples/sec: 4975.03 - lr: 0.025000 +2023-04-06 20:44:16,686 epoch 126 - iter 2976/3720 - loss 0.02612202 - time (sec): 505.68 - samples/sec: 4983.84 - lr: 0.025000 +2023-04-06 20:45:19,444 epoch 126 - iter 3348/3720 - loss 0.02619542 - time (sec): 568.44 - samples/sec: 4990.47 - lr: 0.025000 +2023-04-06 20:46:23,292 epoch 126 - iter 3720/3720 - loss 0.02624532 - time (sec): 632.28 - samples/sec: 4984.65 - lr: 0.025000 +2023-04-06 20:46:23,292 ---------------------------------------------------------------------------------------------------- +2023-04-06 20:46:23,292 EPOCH 126 done: loss 0.0262 - lr 0.025000 +2023-04-06 20:46:23,292 BAD EPOCHS (no improvement): 0 +2023-04-06 20:46:23,295 ---------------------------------------------------------------------------------------------------- +2023-04-06 20:47:27,596 epoch 127 - iter 372/3720 - loss 0.02579680 - time (sec): 64.30 - samples/sec: 4904.80 - lr: 0.025000 +2023-04-06 20:48:31,740 epoch 127 - iter 744/3720 - loss 0.02596528 - time (sec): 128.44 - samples/sec: 4907.61 - lr: 0.025000 +2023-04-06 20:49:36,560 epoch 127 - iter 1116/3720 - loss 0.02608173 - time (sec): 193.26 - samples/sec: 4904.64 - lr: 0.025000 +2023-04-06 20:50:40,080 epoch 127 - iter 1488/3720 - loss 0.02601741 - time (sec): 256.78 - samples/sec: 4922.38 - lr: 0.025000 +2023-04-06 20:51:42,737 epoch 127 - iter 1860/3720 - loss 0.02604764 - time (sec): 319.44 - samples/sec: 4942.99 - lr: 0.025000 +2023-04-06 20:52:45,980 epoch 127 - iter 2232/3720 - loss 0.02608747 - time (sec): 382.68 - samples/sec: 4948.80 - lr: 0.025000 +2023-04-06 20:53:49,492 epoch 127 - iter 2604/3720 - loss 0.02615918 - time (sec): 446.20 - samples/sec: 4952.40 - lr: 0.025000 +2023-04-06 20:54:53,390 epoch 127 - iter 2976/3720 - loss 0.02624227 - time (sec): 510.09 - samples/sec: 4945.33 - lr: 0.025000 +2023-04-06 20:55:58,069 epoch 127 - iter 3348/3720 - loss 0.02620766 - time (sec): 574.77 - samples/sec: 4939.41 - lr: 0.025000 +2023-04-06 20:57:00,176 epoch 127 - iter 3720/3720 - loss 0.02619732 - time (sec): 636.88 - samples/sec: 4948.67 - lr: 0.025000 +2023-04-06 20:57:00,177 ---------------------------------------------------------------------------------------------------- +2023-04-06 20:57:00,177 EPOCH 127 done: loss 0.0262 - lr 0.025000 +2023-04-06 20:57:00,177 BAD EPOCHS (no improvement): 0 +2023-04-06 20:57:00,180 ---------------------------------------------------------------------------------------------------- +2023-04-06 20:58:03,014 epoch 128 - iter 372/3720 - loss 0.02628506 - time (sec): 62.83 - samples/sec: 4991.67 - lr: 0.025000 +2023-04-06 20:59:05,789 epoch 128 - iter 744/3720 - loss 0.02647100 - time (sec): 125.61 - samples/sec: 4990.64 - lr: 0.025000 +2023-04-06 21:00:11,004 epoch 128 - iter 1116/3720 - loss 0.02659542 - time (sec): 190.82 - samples/sec: 4946.11 - lr: 0.025000 +2023-04-06 21:01:16,208 epoch 128 - iter 1488/3720 - loss 0.02650373 - time (sec): 256.03 - samples/sec: 4932.21 - lr: 0.025000 +2023-04-06 21:02:19,235 epoch 128 - iter 1860/3720 - loss 0.02648294 - time (sec): 319.06 - samples/sec: 4937.35 - lr: 0.025000 +2023-04-06 21:03:23,840 epoch 128 - iter 2232/3720 - loss 0.02646224 - time (sec): 383.66 - samples/sec: 4930.41 - lr: 0.025000 +2023-04-06 21:04:27,528 epoch 128 - iter 2604/3720 - loss 0.02654571 - time (sec): 447.35 - samples/sec: 4931.29 - lr: 0.025000 +2023-04-06 21:05:31,354 epoch 128 - iter 2976/3720 - loss 0.02643899 - time (sec): 511.17 - samples/sec: 4932.34 - lr: 0.025000 +2023-04-06 21:06:35,909 epoch 128 - iter 3348/3720 - loss 0.02642192 - time (sec): 575.73 - samples/sec: 4929.00 - lr: 0.025000 +2023-04-06 21:07:39,186 epoch 128 - iter 3720/3720 - loss 0.02639418 - time (sec): 639.01 - samples/sec: 4932.21 - lr: 0.025000 +2023-04-06 21:07:39,186 ---------------------------------------------------------------------------------------------------- +2023-04-06 21:07:39,186 EPOCH 128 done: loss 0.0264 - lr 0.025000 +2023-04-06 21:07:39,186 BAD EPOCHS (no improvement): 1 +2023-04-06 21:07:39,189 ---------------------------------------------------------------------------------------------------- +2023-04-06 21:08:42,876 epoch 129 - iter 372/3720 - loss 0.02643114 - time (sec): 63.69 - samples/sec: 4904.80 - lr: 0.025000 +2023-04-06 21:09:47,140 epoch 129 - iter 744/3720 - loss 0.02633930 - time (sec): 127.95 - samples/sec: 4917.39 - lr: 0.025000 +2023-04-06 21:10:50,200 epoch 129 - iter 1116/3720 - loss 0.02634387 - time (sec): 191.01 - samples/sec: 4942.11 - lr: 0.025000 +2023-04-06 21:11:53,293 epoch 129 - iter 1488/3720 - loss 0.02641411 - time (sec): 254.10 - samples/sec: 4952.45 - lr: 0.025000 +2023-04-06 21:12:55,714 epoch 129 - iter 1860/3720 - loss 0.02637481 - time (sec): 316.53 - samples/sec: 4975.52 - lr: 0.025000 +2023-04-06 21:14:00,163 epoch 129 - iter 2232/3720 - loss 0.02623052 - time (sec): 380.97 - samples/sec: 4973.52 - lr: 0.025000 +2023-04-06 21:15:03,340 epoch 129 - iter 2604/3720 - loss 0.02630420 - time (sec): 444.15 - samples/sec: 4974.64 - lr: 0.025000 +2023-04-06 21:16:06,768 epoch 129 - iter 2976/3720 - loss 0.02640706 - time (sec): 507.58 - samples/sec: 4970.72 - lr: 0.025000 +2023-04-06 21:17:10,516 epoch 129 - iter 3348/3720 - loss 0.02638523 - time (sec): 571.33 - samples/sec: 4966.94 - lr: 0.025000 +2023-04-06 21:18:15,192 epoch 129 - iter 3720/3720 - loss 0.02632172 - time (sec): 636.00 - samples/sec: 4955.50 - lr: 0.025000 +2023-04-06 21:18:15,192 ---------------------------------------------------------------------------------------------------- +2023-04-06 21:18:15,192 EPOCH 129 done: loss 0.0263 - lr 0.025000 +2023-04-06 21:18:15,192 BAD EPOCHS (no improvement): 2 +2023-04-06 21:18:15,199 ---------------------------------------------------------------------------------------------------- +2023-04-06 21:19:18,502 epoch 130 - iter 372/3720 - loss 0.02577645 - time (sec): 63.30 - samples/sec: 4955.91 - lr: 0.025000 +2023-04-06 21:20:21,849 epoch 130 - iter 744/3720 - loss 0.02608502 - time (sec): 126.65 - samples/sec: 4970.02 - lr: 0.025000 +2023-04-06 21:21:25,546 epoch 130 - iter 1116/3720 - loss 0.02598848 - time (sec): 190.35 - samples/sec: 4965.13 - lr: 0.025000 +2023-04-06 21:22:27,917 epoch 130 - iter 1488/3720 - loss 0.02586645 - time (sec): 252.72 - samples/sec: 4985.07 - lr: 0.025000 +2023-04-06 21:23:31,506 epoch 130 - iter 1860/3720 - loss 0.02590813 - time (sec): 316.31 - samples/sec: 4981.76 - lr: 0.025000 +2023-04-06 21:24:34,761 epoch 130 - iter 2232/3720 - loss 0.02608655 - time (sec): 379.56 - samples/sec: 4981.43 - lr: 0.025000 +2023-04-06 21:25:37,983 epoch 130 - iter 2604/3720 - loss 0.02619504 - time (sec): 442.78 - samples/sec: 4980.55 - lr: 0.025000 +2023-04-06 21:26:40,873 epoch 130 - iter 2976/3720 - loss 0.02619835 - time (sec): 505.67 - samples/sec: 4984.34 - lr: 0.025000 +2023-04-06 21:27:42,738 epoch 130 - iter 3348/3720 - loss 0.02622439 - time (sec): 567.54 - samples/sec: 4997.30 - lr: 0.025000 +2023-04-06 21:28:45,512 epoch 130 - iter 3720/3720 - loss 0.02614202 - time (sec): 630.31 - samples/sec: 5000.24 - lr: 0.025000 +2023-04-06 21:28:45,512 ---------------------------------------------------------------------------------------------------- +2023-04-06 21:28:45,512 EPOCH 130 done: loss 0.0261 - lr 0.025000 +2023-04-06 21:28:45,512 BAD EPOCHS (no improvement): 0 +2023-04-06 21:28:45,518 ---------------------------------------------------------------------------------------------------- +2023-04-06 21:29:48,226 epoch 131 - iter 372/3720 - loss 0.02583416 - time (sec): 62.71 - samples/sec: 5029.38 - lr: 0.025000 +2023-04-06 21:30:50,711 epoch 131 - iter 744/3720 - loss 0.02579379 - time (sec): 125.19 - samples/sec: 5035.47 - lr: 0.025000 +2023-04-06 21:31:53,354 epoch 131 - iter 1116/3720 - loss 0.02578966 - time (sec): 187.84 - samples/sec: 5043.32 - lr: 0.025000 +2023-04-06 21:32:56,132 epoch 131 - iter 1488/3720 - loss 0.02576554 - time (sec): 250.61 - samples/sec: 5044.14 - lr: 0.025000 +2023-04-06 21:33:58,300 epoch 131 - iter 1860/3720 - loss 0.02566748 - time (sec): 312.78 - samples/sec: 5045.38 - lr: 0.025000 +2023-04-06 21:35:02,035 epoch 131 - iter 2232/3720 - loss 0.02583357 - time (sec): 376.52 - samples/sec: 5028.45 - lr: 0.025000 +2023-04-06 21:36:04,422 epoch 131 - iter 2604/3720 - loss 0.02604849 - time (sec): 438.90 - samples/sec: 5026.52 - lr: 0.025000 +2023-04-06 21:37:08,289 epoch 131 - iter 2976/3720 - loss 0.02610628 - time (sec): 502.77 - samples/sec: 5013.34 - lr: 0.025000 +2023-04-06 21:38:11,661 epoch 131 - iter 3348/3720 - loss 0.02608858 - time (sec): 566.14 - samples/sec: 5005.48 - lr: 0.025000 +2023-04-06 21:39:16,384 epoch 131 - iter 3720/3720 - loss 0.02614340 - time (sec): 630.87 - samples/sec: 4995.85 - lr: 0.025000 +2023-04-06 21:39:16,384 ---------------------------------------------------------------------------------------------------- +2023-04-06 21:39:16,384 EPOCH 131 done: loss 0.0261 - lr 0.025000 +2023-04-06 21:39:16,384 BAD EPOCHS (no improvement): 1 +2023-04-06 21:39:16,388 ---------------------------------------------------------------------------------------------------- +2023-04-06 21:40:19,287 epoch 132 - iter 372/3720 - loss 0.02608236 - time (sec): 62.90 - samples/sec: 4969.94 - lr: 0.025000 +2023-04-06 21:41:23,718 epoch 132 - iter 744/3720 - loss 0.02601802 - time (sec): 127.33 - samples/sec: 4945.46 - lr: 0.025000 +2023-04-06 21:42:27,863 epoch 132 - iter 1116/3720 - loss 0.02631864 - time (sec): 191.48 - samples/sec: 4937.69 - lr: 0.025000 +2023-04-06 21:43:32,268 epoch 132 - iter 1488/3720 - loss 0.02620156 - time (sec): 255.88 - samples/sec: 4933.57 - lr: 0.025000 +2023-04-06 21:44:37,090 epoch 132 - iter 1860/3720 - loss 0.02619527 - time (sec): 320.70 - samples/sec: 4920.44 - lr: 0.025000 +2023-04-06 21:45:40,680 epoch 132 - iter 2232/3720 - loss 0.02618574 - time (sec): 384.29 - samples/sec: 4921.06 - lr: 0.025000 +2023-04-06 21:46:44,513 epoch 132 - iter 2604/3720 - loss 0.02604139 - time (sec): 448.12 - samples/sec: 4917.79 - lr: 0.025000 +2023-04-06 21:47:49,229 epoch 132 - iter 2976/3720 - loss 0.02614251 - time (sec): 512.84 - samples/sec: 4913.54 - lr: 0.025000 +2023-04-06 21:48:51,742 epoch 132 - iter 3348/3720 - loss 0.02614245 - time (sec): 575.35 - samples/sec: 4925.30 - lr: 0.025000 +2023-04-06 21:49:55,623 epoch 132 - iter 3720/3720 - loss 0.02612145 - time (sec): 639.24 - samples/sec: 4930.44 - lr: 0.025000 +2023-04-06 21:49:55,623 ---------------------------------------------------------------------------------------------------- +2023-04-06 21:49:55,623 EPOCH 132 done: loss 0.0261 - lr 0.025000 +2023-04-06 21:49:55,623 BAD EPOCHS (no improvement): 0 +2023-04-06 21:49:55,627 ---------------------------------------------------------------------------------------------------- +2023-04-06 21:50:58,443 epoch 133 - iter 372/3720 - loss 0.02553210 - time (sec): 62.82 - samples/sec: 5011.88 - lr: 0.025000 +2023-04-06 21:52:02,486 epoch 133 - iter 744/3720 - loss 0.02560492 - time (sec): 126.86 - samples/sec: 4979.06 - lr: 0.025000 +2023-04-06 21:53:04,156 epoch 133 - iter 1116/3720 - loss 0.02608778 - time (sec): 188.53 - samples/sec: 5017.29 - lr: 0.025000 +2023-04-06 21:54:07,561 epoch 133 - iter 1488/3720 - loss 0.02616909 - time (sec): 251.93 - samples/sec: 5004.50 - lr: 0.025000 +2023-04-06 21:55:12,056 epoch 133 - iter 1860/3720 - loss 0.02626976 - time (sec): 316.43 - samples/sec: 4980.32 - lr: 0.025000 +2023-04-06 21:56:15,780 epoch 133 - iter 2232/3720 - loss 0.02615927 - time (sec): 380.15 - samples/sec: 4974.76 - lr: 0.025000 +2023-04-06 21:57:19,597 epoch 133 - iter 2604/3720 - loss 0.02605486 - time (sec): 443.97 - samples/sec: 4969.11 - lr: 0.025000 +2023-04-06 21:58:23,279 epoch 133 - iter 2976/3720 - loss 0.02617783 - time (sec): 507.65 - samples/sec: 4967.51 - lr: 0.025000 +2023-04-06 21:59:27,050 epoch 133 - iter 3348/3720 - loss 0.02620108 - time (sec): 571.42 - samples/sec: 4963.89 - lr: 0.025000 +2023-04-06 22:00:30,946 epoch 133 - iter 3720/3720 - loss 0.02611399 - time (sec): 635.32 - samples/sec: 4960.83 - lr: 0.025000 +2023-04-06 22:00:30,946 ---------------------------------------------------------------------------------------------------- +2023-04-06 22:00:30,946 EPOCH 133 done: loss 0.0261 - lr 0.025000 +2023-04-06 22:00:30,946 BAD EPOCHS (no improvement): 0 +2023-04-06 22:00:30,950 ---------------------------------------------------------------------------------------------------- +2023-04-06 22:01:35,438 epoch 134 - iter 372/3720 - loss 0.02583291 - time (sec): 64.49 - samples/sec: 4920.43 - lr: 0.025000 +2023-04-06 22:02:40,061 epoch 134 - iter 744/3720 - loss 0.02600139 - time (sec): 129.11 - samples/sec: 4909.15 - lr: 0.025000 +2023-04-06 22:03:44,224 epoch 134 - iter 1116/3720 - loss 0.02617786 - time (sec): 193.27 - samples/sec: 4915.91 - lr: 0.025000 +2023-04-06 22:04:48,602 epoch 134 - iter 1488/3720 - loss 0.02603403 - time (sec): 257.65 - samples/sec: 4911.66 - lr: 0.025000 +2023-04-06 22:05:52,644 epoch 134 - iter 1860/3720 - loss 0.02626694 - time (sec): 321.69 - samples/sec: 4921.62 - lr: 0.025000 +2023-04-06 22:06:54,744 epoch 134 - iter 2232/3720 - loss 0.02613598 - time (sec): 383.79 - samples/sec: 4937.22 - lr: 0.025000 +2023-04-06 22:07:57,460 epoch 134 - iter 2604/3720 - loss 0.02610478 - time (sec): 446.51 - samples/sec: 4951.08 - lr: 0.025000 +2023-04-06 22:08:59,147 epoch 134 - iter 2976/3720 - loss 0.02603591 - time (sec): 508.20 - samples/sec: 4967.64 - lr: 0.025000 +2023-04-06 22:10:01,299 epoch 134 - iter 3348/3720 - loss 0.02596891 - time (sec): 570.35 - samples/sec: 4975.07 - lr: 0.025000 +2023-04-06 22:11:05,089 epoch 134 - iter 3720/3720 - loss 0.02599401 - time (sec): 634.14 - samples/sec: 4970.06 - lr: 0.025000 +2023-04-06 22:11:05,089 ---------------------------------------------------------------------------------------------------- +2023-04-06 22:11:05,089 EPOCH 134 done: loss 0.0260 - lr 0.025000 +2023-04-06 22:11:05,089 BAD EPOCHS (no improvement): 0 +2023-04-06 22:11:05,119 ---------------------------------------------------------------------------------------------------- +2023-04-06 22:12:09,174 epoch 135 - iter 372/3720 - loss 0.02566066 - time (sec): 64.05 - samples/sec: 4883.81 - lr: 0.025000 +2023-04-06 22:13:13,125 epoch 135 - iter 744/3720 - loss 0.02587147 - time (sec): 128.01 - samples/sec: 4891.86 - lr: 0.025000 +2023-04-06 22:14:16,754 epoch 135 - iter 1116/3720 - loss 0.02587474 - time (sec): 191.63 - samples/sec: 4907.99 - lr: 0.025000 +2023-04-06 22:15:21,193 epoch 135 - iter 1488/3720 - loss 0.02595556 - time (sec): 256.07 - samples/sec: 4911.45 - lr: 0.025000 +2023-04-06 22:16:24,594 epoch 135 - iter 1860/3720 - loss 0.02582688 - time (sec): 319.47 - samples/sec: 4928.54 - lr: 0.025000 +2023-04-06 22:17:28,680 epoch 135 - iter 2232/3720 - loss 0.02583154 - time (sec): 383.56 - samples/sec: 4931.94 - lr: 0.025000 +2023-04-06 22:18:33,286 epoch 135 - iter 2604/3720 - loss 0.02586650 - time (sec): 448.17 - samples/sec: 4928.42 - lr: 0.025000 +2023-04-06 22:19:36,631 epoch 135 - iter 2976/3720 - loss 0.02592220 - time (sec): 511.51 - samples/sec: 4930.47 - lr: 0.025000 +2023-04-06 22:20:40,501 epoch 135 - iter 3348/3720 - loss 0.02587278 - time (sec): 575.38 - samples/sec: 4930.62 - lr: 0.025000 +2023-04-06 22:21:44,435 epoch 135 - iter 3720/3720 - loss 0.02590732 - time (sec): 639.32 - samples/sec: 4929.82 - lr: 0.025000 +2023-04-06 22:21:44,435 ---------------------------------------------------------------------------------------------------- +2023-04-06 22:21:44,435 EPOCH 135 done: loss 0.0259 - lr 0.025000 +2023-04-06 22:21:44,435 BAD EPOCHS (no improvement): 0 +2023-04-06 22:21:44,439 ---------------------------------------------------------------------------------------------------- +2023-04-06 22:22:48,281 epoch 136 - iter 372/3720 - loss 0.02723063 - time (sec): 63.84 - samples/sec: 4950.72 - lr: 0.025000 +2023-04-06 22:23:52,174 epoch 136 - iter 744/3720 - loss 0.02611622 - time (sec): 127.74 - samples/sec: 4951.16 - lr: 0.025000 +2023-04-06 22:24:56,334 epoch 136 - iter 1116/3720 - loss 0.02612083 - time (sec): 191.90 - samples/sec: 4946.21 - lr: 0.025000 +2023-04-06 22:25:59,241 epoch 136 - iter 1488/3720 - loss 0.02621783 - time (sec): 254.80 - samples/sec: 4957.76 - lr: 0.025000 +2023-04-06 22:27:02,838 epoch 136 - iter 1860/3720 - loss 0.02605925 - time (sec): 318.40 - samples/sec: 4953.83 - lr: 0.025000 +2023-04-06 22:28:06,527 epoch 136 - iter 2232/3720 - loss 0.02603578 - time (sec): 382.09 - samples/sec: 4955.32 - lr: 0.025000 +2023-04-06 22:29:09,400 epoch 136 - iter 2604/3720 - loss 0.02598420 - time (sec): 444.96 - samples/sec: 4960.21 - lr: 0.025000 +2023-04-06 22:30:12,756 epoch 136 - iter 2976/3720 - loss 0.02593483 - time (sec): 508.32 - samples/sec: 4960.75 - lr: 0.025000 +2023-04-06 22:31:16,277 epoch 136 - iter 3348/3720 - loss 0.02593681 - time (sec): 571.84 - samples/sec: 4960.80 - lr: 0.025000 +2023-04-06 22:32:19,806 epoch 136 - iter 3720/3720 - loss 0.02599687 - time (sec): 635.37 - samples/sec: 4960.46 - lr: 0.025000 +2023-04-06 22:32:19,806 ---------------------------------------------------------------------------------------------------- +2023-04-06 22:32:19,806 EPOCH 136 done: loss 0.0260 - lr 0.025000 +2023-04-06 22:32:19,806 BAD EPOCHS (no improvement): 1 +2023-04-06 22:32:19,809 ---------------------------------------------------------------------------------------------------- +2023-04-06 22:33:23,643 epoch 137 - iter 372/3720 - loss 0.02613913 - time (sec): 63.83 - samples/sec: 4924.51 - lr: 0.025000 +2023-04-06 22:34:29,340 epoch 137 - iter 744/3720 - loss 0.02598281 - time (sec): 129.53 - samples/sec: 4881.99 - lr: 0.025000 +2023-04-06 22:35:33,482 epoch 137 - iter 1116/3720 - loss 0.02592690 - time (sec): 193.67 - samples/sec: 4886.97 - lr: 0.025000 +2023-04-06 22:36:36,862 epoch 137 - iter 1488/3720 - loss 0.02599989 - time (sec): 257.05 - samples/sec: 4909.45 - lr: 0.025000 +2023-04-06 22:37:40,900 epoch 137 - iter 1860/3720 - loss 0.02584012 - time (sec): 321.09 - samples/sec: 4915.39 - lr: 0.025000 +2023-04-06 22:38:43,964 epoch 137 - iter 2232/3720 - loss 0.02583791 - time (sec): 384.15 - samples/sec: 4928.64 - lr: 0.025000 +2023-04-06 22:39:47,727 epoch 137 - iter 2604/3720 - loss 0.02584277 - time (sec): 447.92 - samples/sec: 4929.96 - lr: 0.025000 +2023-04-06 22:40:51,228 epoch 137 - iter 2976/3720 - loss 0.02588664 - time (sec): 511.42 - samples/sec: 4931.63 - lr: 0.025000 +2023-04-06 22:41:55,001 epoch 137 - iter 3348/3720 - loss 0.02585971 - time (sec): 575.19 - samples/sec: 4932.24 - lr: 0.025000 +2023-04-06 22:42:58,501 epoch 137 - iter 3720/3720 - loss 0.02583166 - time (sec): 638.69 - samples/sec: 4934.64 - lr: 0.025000 +2023-04-06 22:42:58,501 ---------------------------------------------------------------------------------------------------- +2023-04-06 22:42:58,501 EPOCH 137 done: loss 0.0258 - lr 0.025000 +2023-04-06 22:42:58,501 BAD EPOCHS (no improvement): 0 +2023-04-06 22:42:58,504 ---------------------------------------------------------------------------------------------------- +2023-04-06 22:44:02,262 epoch 138 - iter 372/3720 - loss 0.02638899 - time (sec): 63.76 - samples/sec: 4950.99 - lr: 0.025000 +2023-04-06 22:45:06,774 epoch 138 - iter 744/3720 - loss 0.02577679 - time (sec): 128.27 - samples/sec: 4924.26 - lr: 0.025000 +2023-04-06 22:46:11,548 epoch 138 - iter 1116/3720 - loss 0.02563858 - time (sec): 193.04 - samples/sec: 4906.53 - lr: 0.025000 +2023-04-06 22:47:17,012 epoch 138 - iter 1488/3720 - loss 0.02551228 - time (sec): 258.51 - samples/sec: 4890.39 - lr: 0.025000 +2023-04-06 22:48:21,572 epoch 138 - iter 1860/3720 - loss 0.02556028 - time (sec): 323.07 - samples/sec: 4886.61 - lr: 0.025000 +2023-04-06 22:49:24,678 epoch 138 - iter 2232/3720 - loss 0.02568383 - time (sec): 386.17 - samples/sec: 4907.24 - lr: 0.025000 +2023-04-06 22:50:27,797 epoch 138 - iter 2604/3720 - loss 0.02579370 - time (sec): 449.29 - samples/sec: 4917.43 - lr: 0.025000 +2023-04-06 22:51:30,979 epoch 138 - iter 2976/3720 - loss 0.02573020 - time (sec): 512.47 - samples/sec: 4923.16 - lr: 0.025000 +2023-04-06 22:52:33,807 epoch 138 - iter 3348/3720 - loss 0.02588175 - time (sec): 575.30 - samples/sec: 4934.35 - lr: 0.025000 +2023-04-06 22:53:36,022 epoch 138 - iter 3720/3720 - loss 0.02588153 - time (sec): 637.52 - samples/sec: 4943.73 - lr: 0.025000 +2023-04-06 22:53:36,022 ---------------------------------------------------------------------------------------------------- +2023-04-06 22:53:36,022 EPOCH 138 done: loss 0.0259 - lr 0.025000 +2023-04-06 22:53:36,022 BAD EPOCHS (no improvement): 1 +2023-04-06 22:53:36,026 ---------------------------------------------------------------------------------------------------- +2023-04-06 22:54:38,481 epoch 139 - iter 372/3720 - loss 0.02552485 - time (sec): 62.45 - samples/sec: 5022.53 - lr: 0.025000 +2023-04-06 22:55:41,481 epoch 139 - iter 744/3720 - loss 0.02553804 - time (sec): 125.46 - samples/sec: 5017.18 - lr: 0.025000 +2023-04-06 22:56:44,429 epoch 139 - iter 1116/3720 - loss 0.02573355 - time (sec): 188.40 - samples/sec: 5018.26 - lr: 0.025000 +2023-04-06 22:57:46,288 epoch 139 - iter 1488/3720 - loss 0.02583800 - time (sec): 250.26 - samples/sec: 5034.55 - lr: 0.025000 +2023-04-06 22:58:50,182 epoch 139 - iter 1860/3720 - loss 0.02573281 - time (sec): 314.16 - samples/sec: 5007.64 - lr: 0.025000 +2023-04-06 22:59:54,958 epoch 139 - iter 2232/3720 - loss 0.02593784 - time (sec): 378.93 - samples/sec: 4982.69 - lr: 0.025000 +2023-04-06 23:00:59,157 epoch 139 - iter 2604/3720 - loss 0.02592564 - time (sec): 443.13 - samples/sec: 4976.41 - lr: 0.025000 +2023-04-06 23:02:03,185 epoch 139 - iter 2976/3720 - loss 0.02590531 - time (sec): 507.16 - samples/sec: 4971.44 - lr: 0.025000 +2023-04-06 23:03:07,721 epoch 139 - iter 3348/3720 - loss 0.02590306 - time (sec): 571.69 - samples/sec: 4965.32 - lr: 0.025000 +2023-04-06 23:04:11,651 epoch 139 - iter 3720/3720 - loss 0.02592914 - time (sec): 635.63 - samples/sec: 4958.44 - lr: 0.025000 +2023-04-06 23:04:11,652 ---------------------------------------------------------------------------------------------------- +2023-04-06 23:04:11,652 EPOCH 139 done: loss 0.0259 - lr 0.025000 +2023-04-06 23:04:11,652 BAD EPOCHS (no improvement): 2 +2023-04-06 23:04:11,655 ---------------------------------------------------------------------------------------------------- +2023-04-06 23:05:15,980 epoch 140 - iter 372/3720 - loss 0.02533624 - time (sec): 64.32 - samples/sec: 4923.12 - lr: 0.025000 +2023-04-06 23:06:19,205 epoch 140 - iter 744/3720 - loss 0.02598887 - time (sec): 127.55 - samples/sec: 4940.86 - lr: 0.025000 +2023-04-06 23:07:23,079 epoch 140 - iter 1116/3720 - loss 0.02585332 - time (sec): 191.42 - samples/sec: 4950.32 - lr: 0.025000 +2023-04-06 23:08:26,418 epoch 140 - iter 1488/3720 - loss 0.02574556 - time (sec): 254.76 - samples/sec: 4964.48 - lr: 0.025000 +2023-04-06 23:09:30,357 epoch 140 - iter 1860/3720 - loss 0.02578041 - time (sec): 318.70 - samples/sec: 4957.90 - lr: 0.025000 +2023-04-06 23:10:33,812 epoch 140 - iter 2232/3720 - loss 0.02575237 - time (sec): 382.16 - samples/sec: 4957.11 - lr: 0.025000 +2023-04-06 23:11:37,488 epoch 140 - iter 2604/3720 - loss 0.02572028 - time (sec): 445.83 - samples/sec: 4954.54 - lr: 0.025000 +2023-04-06 23:12:40,708 epoch 140 - iter 2976/3720 - loss 0.02579612 - time (sec): 509.05 - samples/sec: 4956.48 - lr: 0.025000 +2023-04-06 23:13:44,271 epoch 140 - iter 3348/3720 - loss 0.02577860 - time (sec): 572.62 - samples/sec: 4955.38 - lr: 0.025000 +2023-04-06 23:14:47,348 epoch 140 - iter 3720/3720 - loss 0.02574111 - time (sec): 635.69 - samples/sec: 4957.92 - lr: 0.025000 +2023-04-06 23:14:47,348 ---------------------------------------------------------------------------------------------------- +2023-04-06 23:14:47,348 EPOCH 140 done: loss 0.0257 - lr 0.025000 +2023-04-06 23:14:47,348 BAD EPOCHS (no improvement): 0 +2023-04-06 23:14:47,352 ---------------------------------------------------------------------------------------------------- +2023-04-06 23:15:51,919 epoch 141 - iter 372/3720 - loss 0.02442453 - time (sec): 64.57 - samples/sec: 4882.76 - lr: 0.025000 +2023-04-06 23:16:55,411 epoch 141 - iter 744/3720 - loss 0.02513508 - time (sec): 128.06 - samples/sec: 4921.75 - lr: 0.025000 +2023-04-06 23:17:59,499 epoch 141 - iter 1116/3720 - loss 0.02526491 - time (sec): 192.15 - samples/sec: 4924.39 - lr: 0.025000 +2023-04-06 23:19:03,941 epoch 141 - iter 1488/3720 - loss 0.02534890 - time (sec): 256.59 - samples/sec: 4927.69 - lr: 0.025000 +2023-04-06 23:20:07,287 epoch 141 - iter 1860/3720 - loss 0.02549156 - time (sec): 319.94 - samples/sec: 4932.14 - lr: 0.025000 +2023-04-06 23:21:11,308 epoch 141 - iter 2232/3720 - loss 0.02555004 - time (sec): 383.96 - samples/sec: 4926.40 - lr: 0.025000 +2023-04-06 23:22:14,759 epoch 141 - iter 2604/3720 - loss 0.02561058 - time (sec): 447.41 - samples/sec: 4932.97 - lr: 0.025000 +2023-04-06 23:23:16,727 epoch 141 - iter 2976/3720 - loss 0.02566289 - time (sec): 509.38 - samples/sec: 4946.11 - lr: 0.025000 +2023-04-06 23:24:20,412 epoch 141 - iter 3348/3720 - loss 0.02566191 - time (sec): 573.06 - samples/sec: 4949.10 - lr: 0.025000 +2023-04-06 23:25:24,711 epoch 141 - iter 3720/3720 - loss 0.02572472 - time (sec): 637.36 - samples/sec: 4944.95 - lr: 0.025000 +2023-04-06 23:25:24,711 ---------------------------------------------------------------------------------------------------- +2023-04-06 23:25:24,711 EPOCH 141 done: loss 0.0257 - lr 0.025000 +2023-04-06 23:25:24,712 BAD EPOCHS (no improvement): 0 +2023-04-06 23:25:24,715 ---------------------------------------------------------------------------------------------------- +2023-04-06 23:26:28,871 epoch 142 - iter 372/3720 - loss 0.02454281 - time (sec): 64.16 - samples/sec: 4919.81 - lr: 0.025000 +2023-04-06 23:27:33,203 epoch 142 - iter 744/3720 - loss 0.02554346 - time (sec): 128.49 - samples/sec: 4916.30 - lr: 0.025000 +2023-04-06 23:28:38,013 epoch 142 - iter 1116/3720 - loss 0.02583124 - time (sec): 193.30 - samples/sec: 4895.76 - lr: 0.025000 +2023-04-06 23:29:42,387 epoch 142 - iter 1488/3720 - loss 0.02585711 - time (sec): 257.67 - samples/sec: 4901.13 - lr: 0.025000 +2023-04-06 23:30:45,098 epoch 142 - iter 1860/3720 - loss 0.02574555 - time (sec): 320.38 - samples/sec: 4915.59 - lr: 0.025000 +2023-04-06 23:31:49,118 epoch 142 - iter 2232/3720 - loss 0.02584393 - time (sec): 384.40 - samples/sec: 4915.32 - lr: 0.025000 +2023-04-06 23:32:52,542 epoch 142 - iter 2604/3720 - loss 0.02579463 - time (sec): 447.83 - samples/sec: 4920.97 - lr: 0.025000 +2023-04-06 23:33:55,836 epoch 142 - iter 2976/3720 - loss 0.02586720 - time (sec): 511.12 - samples/sec: 4928.60 - lr: 0.025000 +2023-04-06 23:35:00,469 epoch 142 - iter 3348/3720 - loss 0.02582206 - time (sec): 575.75 - samples/sec: 4926.09 - lr: 0.025000 +2023-04-06 23:36:04,441 epoch 142 - iter 3720/3720 - loss 0.02575175 - time (sec): 639.73 - samples/sec: 4926.66 - lr: 0.025000 +2023-04-06 23:36:04,441 ---------------------------------------------------------------------------------------------------- +2023-04-06 23:36:04,441 EPOCH 142 done: loss 0.0258 - lr 0.025000 +2023-04-06 23:36:04,441 BAD EPOCHS (no improvement): 1 +2023-04-06 23:36:04,445 ---------------------------------------------------------------------------------------------------- +2023-04-06 23:37:08,262 epoch 143 - iter 372/3720 - loss 0.02531212 - time (sec): 63.82 - samples/sec: 4952.41 - lr: 0.025000 +2023-04-06 23:38:12,616 epoch 143 - iter 744/3720 - loss 0.02551014 - time (sec): 128.17 - samples/sec: 4931.40 - lr: 0.025000 +2023-04-06 23:39:16,962 epoch 143 - iter 1116/3720 - loss 0.02552322 - time (sec): 192.52 - samples/sec: 4926.55 - lr: 0.025000 +2023-04-06 23:40:20,555 epoch 143 - iter 1488/3720 - loss 0.02556579 - time (sec): 256.11 - samples/sec: 4932.25 - lr: 0.025000 +2023-04-06 23:41:24,062 epoch 143 - iter 1860/3720 - loss 0.02581501 - time (sec): 319.62 - samples/sec: 4934.83 - lr: 0.025000 +2023-04-06 23:42:27,208 epoch 143 - iter 2232/3720 - loss 0.02578200 - time (sec): 382.76 - samples/sec: 4945.20 - lr: 0.025000 +2023-04-06 23:43:31,595 epoch 143 - iter 2604/3720 - loss 0.02572099 - time (sec): 447.15 - samples/sec: 4935.20 - lr: 0.025000 +2023-04-06 23:44:35,952 epoch 143 - iter 2976/3720 - loss 0.02558884 - time (sec): 511.51 - samples/sec: 4927.93 - lr: 0.025000 +2023-04-06 23:45:40,135 epoch 143 - iter 3348/3720 - loss 0.02559362 - time (sec): 575.69 - samples/sec: 4929.64 - lr: 0.025000 +2023-04-06 23:46:43,409 epoch 143 - iter 3720/3720 - loss 0.02562851 - time (sec): 638.96 - samples/sec: 4932.53 - lr: 0.025000 +2023-04-06 23:46:43,410 ---------------------------------------------------------------------------------------------------- +2023-04-06 23:46:43,410 EPOCH 143 done: loss 0.0256 - lr 0.025000 +2023-04-06 23:46:43,410 BAD EPOCHS (no improvement): 0 +2023-04-06 23:46:43,413 ---------------------------------------------------------------------------------------------------- +2023-04-06 23:47:47,065 epoch 144 - iter 372/3720 - loss 0.02503982 - time (sec): 63.65 - samples/sec: 4937.81 - lr: 0.025000 +2023-04-06 23:48:50,955 epoch 144 - iter 744/3720 - loss 0.02565553 - time (sec): 127.54 - samples/sec: 4928.72 - lr: 0.025000 +2023-04-06 23:49:55,285 epoch 144 - iter 1116/3720 - loss 0.02550931 - time (sec): 191.87 - samples/sec: 4924.62 - lr: 0.025000 +2023-04-06 23:50:59,428 epoch 144 - iter 1488/3720 - loss 0.02547788 - time (sec): 256.02 - samples/sec: 4923.84 - lr: 0.025000 +2023-04-06 23:52:02,385 epoch 144 - iter 1860/3720 - loss 0.02544773 - time (sec): 318.97 - samples/sec: 4939.46 - lr: 0.025000 +2023-04-06 23:53:05,940 epoch 144 - iter 2232/3720 - loss 0.02567112 - time (sec): 382.53 - samples/sec: 4940.52 - lr: 0.025000 +2023-04-06 23:54:10,215 epoch 144 - iter 2604/3720 - loss 0.02565937 - time (sec): 446.80 - samples/sec: 4937.55 - lr: 0.025000 +2023-04-06 23:55:14,241 epoch 144 - iter 2976/3720 - loss 0.02566799 - time (sec): 510.83 - samples/sec: 4931.94 - lr: 0.025000 +2023-04-06 23:56:18,506 epoch 144 - iter 3348/3720 - loss 0.02562112 - time (sec): 575.09 - samples/sec: 4931.61 - lr: 0.025000 +2023-04-06 23:57:21,784 epoch 144 - iter 3720/3720 - loss 0.02559035 - time (sec): 638.37 - samples/sec: 4937.12 - lr: 0.025000 +2023-04-06 23:57:21,785 ---------------------------------------------------------------------------------------------------- +2023-04-06 23:57:21,785 EPOCH 144 done: loss 0.0256 - lr 0.025000 +2023-04-06 23:57:21,785 BAD EPOCHS (no improvement): 0 +2023-04-06 23:57:21,788 ---------------------------------------------------------------------------------------------------- +2023-04-06 23:58:24,501 epoch 145 - iter 372/3720 - loss 0.02545164 - time (sec): 62.71 - samples/sec: 5042.47 - lr: 0.025000 +2023-04-06 23:59:28,252 epoch 145 - iter 744/3720 - loss 0.02574462 - time (sec): 126.46 - samples/sec: 5001.06 - lr: 0.025000 +2023-04-07 00:00:32,273 epoch 145 - iter 1116/3720 - loss 0.02563708 - time (sec): 190.48 - samples/sec: 4972.09 - lr: 0.025000 +2023-04-07 00:01:34,593 epoch 145 - iter 1488/3720 - loss 0.02546344 - time (sec): 252.80 - samples/sec: 4993.69 - lr: 0.025000 +2023-04-07 00:02:36,830 epoch 145 - iter 1860/3720 - loss 0.02561387 - time (sec): 315.04 - samples/sec: 4997.70 - lr: 0.025000 +2023-04-07 00:03:39,276 epoch 145 - iter 2232/3720 - loss 0.02561802 - time (sec): 377.49 - samples/sec: 5002.92 - lr: 0.025000 +2023-04-07 00:04:43,702 epoch 145 - iter 2604/3720 - loss 0.02560137 - time (sec): 441.91 - samples/sec: 4985.64 - lr: 0.025000 +2023-04-07 00:05:47,108 epoch 145 - iter 2976/3720 - loss 0.02570301 - time (sec): 505.32 - samples/sec: 4982.07 - lr: 0.025000 +2023-04-07 00:06:51,444 epoch 145 - iter 3348/3720 - loss 0.02567101 - time (sec): 569.66 - samples/sec: 4971.75 - lr: 0.025000 +2023-04-07 00:07:56,444 epoch 145 - iter 3720/3720 - loss 0.02563443 - time (sec): 634.66 - samples/sec: 4966.02 - lr: 0.025000 +2023-04-07 00:07:56,444 ---------------------------------------------------------------------------------------------------- +2023-04-07 00:07:56,444 EPOCH 145 done: loss 0.0256 - lr 0.025000 +2023-04-07 00:07:56,445 BAD EPOCHS (no improvement): 1 +2023-04-07 00:07:56,448 ---------------------------------------------------------------------------------------------------- +2023-04-07 00:08:59,126 epoch 146 - iter 372/3720 - loss 0.02589090 - time (sec): 62.68 - samples/sec: 5008.35 - lr: 0.025000 +2023-04-07 00:10:03,439 epoch 146 - iter 744/3720 - loss 0.02526705 - time (sec): 126.99 - samples/sec: 4952.15 - lr: 0.025000 +2023-04-07 00:11:07,046 epoch 146 - iter 1116/3720 - loss 0.02550601 - time (sec): 190.60 - samples/sec: 4958.67 - lr: 0.025000 +2023-04-07 00:12:10,548 epoch 146 - iter 1488/3720 - loss 0.02536717 - time (sec): 254.10 - samples/sec: 4959.25 - lr: 0.025000 +2023-04-07 00:13:14,382 epoch 146 - iter 1860/3720 - loss 0.02534244 - time (sec): 317.93 - samples/sec: 4958.88 - lr: 0.025000 +2023-04-07 00:14:17,039 epoch 146 - iter 2232/3720 - loss 0.02528017 - time (sec): 380.59 - samples/sec: 4968.09 - lr: 0.025000 +2023-04-07 00:15:19,654 epoch 146 - iter 2604/3720 - loss 0.02524634 - time (sec): 443.21 - samples/sec: 4976.96 - lr: 0.025000 +2023-04-07 00:16:23,204 epoch 146 - iter 2976/3720 - loss 0.02522499 - time (sec): 506.76 - samples/sec: 4970.64 - lr: 0.025000 +2023-04-07 00:17:28,245 epoch 146 - iter 3348/3720 - loss 0.02534385 - time (sec): 571.80 - samples/sec: 4961.30 - lr: 0.025000 +2023-04-07 00:18:32,331 epoch 146 - iter 3720/3720 - loss 0.02535678 - time (sec): 635.88 - samples/sec: 4956.43 - lr: 0.025000 +2023-04-07 00:18:32,331 ---------------------------------------------------------------------------------------------------- +2023-04-07 00:18:32,331 EPOCH 146 done: loss 0.0254 - lr 0.025000 +2023-04-07 00:18:32,332 BAD EPOCHS (no improvement): 0 +2023-04-07 00:18:32,365 ---------------------------------------------------------------------------------------------------- +2023-04-07 00:19:37,026 epoch 147 - iter 372/3720 - loss 0.02507179 - time (sec): 64.66 - samples/sec: 4889.70 - lr: 0.025000 +2023-04-07 00:20:41,357 epoch 147 - iter 744/3720 - loss 0.02501378 - time (sec): 128.99 - samples/sec: 4900.85 - lr: 0.025000 +2023-04-07 00:21:45,141 epoch 147 - iter 1116/3720 - loss 0.02522842 - time (sec): 192.78 - samples/sec: 4910.37 - lr: 0.025000 +2023-04-07 00:22:49,600 epoch 147 - iter 1488/3720 - loss 0.02517993 - time (sec): 257.23 - samples/sec: 4916.48 - lr: 0.025000 +2023-04-07 00:23:53,037 epoch 147 - iter 1860/3720 - loss 0.02536139 - time (sec): 320.67 - samples/sec: 4925.55 - lr: 0.025000 +2023-04-07 00:24:57,619 epoch 147 - iter 2232/3720 - loss 0.02547593 - time (sec): 385.25 - samples/sec: 4920.70 - lr: 0.025000 +2023-04-07 00:26:01,113 epoch 147 - iter 2604/3720 - loss 0.02549843 - time (sec): 448.75 - samples/sec: 4925.88 - lr: 0.025000 +2023-04-07 00:27:04,506 epoch 147 - iter 2976/3720 - loss 0.02552815 - time (sec): 512.14 - samples/sec: 4930.06 - lr: 0.025000 +2023-04-07 00:28:08,452 epoch 147 - iter 3348/3720 - loss 0.02553373 - time (sec): 576.09 - samples/sec: 4927.51 - lr: 0.025000 +2023-04-07 00:29:11,291 epoch 147 - iter 3720/3720 - loss 0.02552517 - time (sec): 638.93 - samples/sec: 4932.83 - lr: 0.025000 +2023-04-07 00:29:11,291 ---------------------------------------------------------------------------------------------------- +2023-04-07 00:29:11,291 EPOCH 147 done: loss 0.0255 - lr 0.025000 +2023-04-07 00:29:11,291 BAD EPOCHS (no improvement): 1 +2023-04-07 00:29:11,295 ---------------------------------------------------------------------------------------------------- +2023-04-07 00:30:15,880 epoch 148 - iter 372/3720 - loss 0.02500274 - time (sec): 64.58 - samples/sec: 4882.34 - lr: 0.025000 +2023-04-07 00:31:20,464 epoch 148 - iter 744/3720 - loss 0.02497199 - time (sec): 129.17 - samples/sec: 4898.07 - lr: 0.025000 +2023-04-07 00:32:23,169 epoch 148 - iter 1116/3720 - loss 0.02508581 - time (sec): 191.87 - samples/sec: 4931.86 - lr: 0.025000 +2023-04-07 00:33:27,782 epoch 148 - iter 1488/3720 - loss 0.02529478 - time (sec): 256.49 - samples/sec: 4920.74 - lr: 0.025000 +2023-04-07 00:34:31,503 epoch 148 - iter 1860/3720 - loss 0.02533457 - time (sec): 320.21 - samples/sec: 4925.54 - lr: 0.025000 +2023-04-07 00:35:35,200 epoch 148 - iter 2232/3720 - loss 0.02534177 - time (sec): 383.90 - samples/sec: 4930.17 - lr: 0.025000 +2023-04-07 00:36:37,690 epoch 148 - iter 2604/3720 - loss 0.02534918 - time (sec): 446.40 - samples/sec: 4940.98 - lr: 0.025000 +2023-04-07 00:37:41,976 epoch 148 - iter 2976/3720 - loss 0.02543365 - time (sec): 510.68 - samples/sec: 4937.32 - lr: 0.025000 +2023-04-07 00:38:45,417 epoch 148 - iter 3348/3720 - loss 0.02546538 - time (sec): 574.12 - samples/sec: 4939.68 - lr: 0.025000 +2023-04-07 00:39:49,356 epoch 148 - iter 3720/3720 - loss 0.02551808 - time (sec): 638.06 - samples/sec: 4939.51 - lr: 0.025000 +2023-04-07 00:39:49,356 ---------------------------------------------------------------------------------------------------- +2023-04-07 00:39:49,356 EPOCH 148 done: loss 0.0255 - lr 0.025000 +2023-04-07 00:39:49,356 BAD EPOCHS (no improvement): 2 +2023-04-07 00:39:49,360 ---------------------------------------------------------------------------------------------------- +2023-04-07 00:40:53,940 epoch 149 - iter 372/3720 - loss 0.02527195 - time (sec): 64.58 - samples/sec: 4907.18 - lr: 0.025000 +2023-04-07 00:41:58,077 epoch 149 - iter 744/3720 - loss 0.02541228 - time (sec): 128.72 - samples/sec: 4931.90 - lr: 0.025000 +2023-04-07 00:43:01,475 epoch 149 - iter 1116/3720 - loss 0.02531123 - time (sec): 192.12 - samples/sec: 4926.60 - lr: 0.025000 +2023-04-07 00:44:05,865 epoch 149 - iter 1488/3720 - loss 0.02574382 - time (sec): 256.50 - samples/sec: 4921.44 - lr: 0.025000 +2023-04-07 00:45:08,754 epoch 149 - iter 1860/3720 - loss 0.02557559 - time (sec): 319.39 - samples/sec: 4937.89 - lr: 0.025000 +2023-04-07 00:46:12,748 epoch 149 - iter 2232/3720 - loss 0.02538772 - time (sec): 383.39 - samples/sec: 4934.65 - lr: 0.025000 +2023-04-07 00:47:17,990 epoch 149 - iter 2604/3720 - loss 0.02539580 - time (sec): 448.63 - samples/sec: 4924.78 - lr: 0.025000 +2023-04-07 00:48:21,744 epoch 149 - iter 2976/3720 - loss 0.02543328 - time (sec): 512.38 - samples/sec: 4928.43 - lr: 0.025000 +2023-04-07 00:49:24,803 epoch 149 - iter 3348/3720 - loss 0.02537053 - time (sec): 575.44 - samples/sec: 4934.66 - lr: 0.025000 +2023-04-07 00:50:28,000 epoch 149 - iter 3720/3720 - loss 0.02537367 - time (sec): 638.64 - samples/sec: 4935.04 - lr: 0.025000 +2023-04-07 00:50:28,000 ---------------------------------------------------------------------------------------------------- +2023-04-07 00:50:28,001 EPOCH 149 done: loss 0.0254 - lr 0.025000 +2023-04-07 00:50:28,001 BAD EPOCHS (no improvement): 3 +2023-04-07 00:50:28,004 ---------------------------------------------------------------------------------------------------- +2023-04-07 00:51:31,132 epoch 150 - iter 372/3720 - loss 0.02509917 - time (sec): 63.13 - samples/sec: 4999.77 - lr: 0.025000 +2023-04-07 00:52:33,491 epoch 150 - iter 744/3720 - loss 0.02528357 - time (sec): 125.49 - samples/sec: 5040.43 - lr: 0.025000 +2023-04-07 00:53:37,008 epoch 150 - iter 1116/3720 - loss 0.02521386 - time (sec): 189.00 - samples/sec: 5023.44 - lr: 0.025000 +2023-04-07 00:54:39,974 epoch 150 - iter 1488/3720 - loss 0.02525906 - time (sec): 251.97 - samples/sec: 5026.77 - lr: 0.025000 +2023-04-07 00:55:42,900 epoch 150 - iter 1860/3720 - loss 0.02537075 - time (sec): 314.90 - samples/sec: 5022.86 - lr: 0.025000 +2023-04-07 00:56:44,701 epoch 150 - iter 2232/3720 - loss 0.02534848 - time (sec): 376.70 - samples/sec: 5032.75 - lr: 0.025000 +2023-04-07 00:57:48,820 epoch 150 - iter 2604/3720 - loss 0.02528790 - time (sec): 440.82 - samples/sec: 5021.57 - lr: 0.025000 +2023-04-07 00:58:52,332 epoch 150 - iter 2976/3720 - loss 0.02534070 - time (sec): 504.33 - samples/sec: 5010.36 - lr: 0.025000 +2023-04-07 00:59:55,540 epoch 150 - iter 3348/3720 - loss 0.02529852 - time (sec): 567.54 - samples/sec: 5002.01 - lr: 0.025000 +2023-04-07 01:00:59,069 epoch 150 - iter 3720/3720 - loss 0.02530371 - time (sec): 631.06 - samples/sec: 4994.28 - lr: 0.025000 +2023-04-07 01:00:59,070 ---------------------------------------------------------------------------------------------------- +2023-04-07 01:00:59,070 EPOCH 150 done: loss 0.0253 - lr 0.025000 +2023-04-07 01:00:59,070 BAD EPOCHS (no improvement): 0 +2023-04-07 01:01:06,016 ---------------------------------------------------------------------------------------------------- +2023-04-07 01:01:06,017 Testing using last state of model ... +2023-04-07 01:02:10,849 Evaluating as a multi-label problem: False +2023-04-07 01:02:11,002 0.9066 0.9053 0.9059 0.8494 +2023-04-07 01:02:11,002 +Results: +- F-score (micro) 0.9059 +- F-score (macro) 0.8941 +- Accuracy 0.8494 + +By class: + precision recall f1-score support + + LOC 0.8913 0.9020 0.8967 11495 + PER 0.9592 0.9659 0.9625 7444 + MISC 0.8615 0.8310 0.8460 3946 + ORG 0.8869 0.8559 0.8712 2429 + + micro avg 0.9066 0.9053 0.9059 25314 + macro avg 0.8998 0.8887 0.8941 25314 +weighted avg 0.9062 0.9053 0.9057 25314 + +2023-04-07 01:02:11,002 ----------------------------------------------------------------------------------------------------