diff --git "a/wandb/run-20220317_145036-3tnpukko/files/output.log" "b/wandb/run-20220317_145036-3tnpukko/files/output.log" new file mode 100644--- /dev/null +++ "b/wandb/run-20220317_145036-3tnpukko/files/output.log" @@ -0,0 +1,3371 @@ + + + 0%| | 0/892 [00:00> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 14:50:42,594 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 14:50:44,466 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 12.227, 'learning_rate': 0.0, 'epoch': 0.0} +[WARNING|modeling_utils.py:388] 2022-03-17 14:50:46,309 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%| | 1/892 [00:08<2:00:48, 8.14s/it][WARNING|modeling_utils.py:388] 2022-03-17 14:50:48,188 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 14:50:49,971 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 14:50:51,745 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 12.7771, 'learning_rate': 0.0, 'epoch': 0.0} +[WARNING|modeling_utils.py:388] 2022-03-17 14:50:53,527 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + + 0%|▏ | 2/892 [00:15<1:52:40, 7.60s/it][WARNING|modeling_utils.py:388] 2022-03-17 14:50:55,335 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 14:50:57,124 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 14:50:58,910 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 12.7177, 'learning_rate': 0.0, 'epoch': 0.0} +[WARNING|modeling_utils.py:388] 2022-03-17 14:51:00,679 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 3/892 [00:22<1:49:28, 7.39s/it][WARNING|modeling_utils.py:388] 2022-03-17 14:51:02,435 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 14:51:04,775 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 14:51:06,521 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 12.635, 'learning_rate': 0.0, 'epoch': 0.0} +[WARNING|modeling_utils.py:388] 2022-03-17 14:51:08,243 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + + 0%|▎ | 4/892 [00:30<1:50:23, 7.46s/it][WARNING|modeling_utils.py:388] 2022-03-17 14:51:10,062 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 14:51:11,792 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 14:51:13,496 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 12.2989, 'learning_rate': 0.0, 'epoch': 0.01} +[WARNING|modeling_utils.py:388] 2022-03-17 14:51:15,223 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 5/892 [00:37<1:47:42, 7.29s/it][WARNING|modeling_utils.py:388] 2022-03-17 14:51:17,047 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 14:51:18,824 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 14:51:20,579 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 12.6181, 'learning_rate': 6e-07, 'epoch': 0.01} +[WARNING|modeling_utils.py:388] 2022-03-17 14:51:22,308 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + + 1%|▌ | 6/892 [00:44<1:47:11, 7.26s/it][WARNING|modeling_utils.py:388] 2022-03-17 14:51:24,205 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 14:51:25,920 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 14:51:27,654 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 11.9585, 'learning_rate': 1.2e-06, 'epoch': 0.01} +[WARNING|modeling_utils.py:388] 2022-03-17 14:51:29,356 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 7/892 [00:51<1:45:38, 7.16s/it][WARNING|modeling_utils.py:388] 2022-03-17 14:51:31,138 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 14:51:32,836 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 14:51:34,550 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 11.24, 'learning_rate': 1.8e-06, 'epoch': 0.01} +[WARNING|modeling_utils.py:388] 2022-03-17 14:51:36,264 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + + 1%|▋ | 8/892 [00:58<1:44:20, 7.08s/it][WARNING|modeling_utils.py:388] 2022-03-17 14:51:38,049 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 14:51:39,715 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 14:51:41,409 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 14:51:43,061 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▊ | 9/892 [01:04<1:42:54, 6.99s/it] + + 1%|▊ | 9/892 [01:04<1:42:54, 6.99s/it][WARNING|modeling_utils.py:388] 2022-03-17 14:51:44,834 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 14:51:46,505 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 14:51:48,236 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 14:51:49,914 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 11.647, 'learning_rate': 2.9999999999999997e-06, 'epoch': 0.01} + 1%|▉ | 10/892 [01:11<1:42:09, 6.95s/it][WARNING|modeling_utils.py:388] 2022-03-17 14:51:51,709 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 14:51:53,356 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 14:51:55,041 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 11.2743, 'learning_rate': 3.6e-06, 'epoch': 0.01} +[WARNING|modeling_utils.py:388] 2022-03-17 14:51:56,709 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + + 1%|▉ | 11/892 [01:18<1:41:21, 6.90s/it][WARNING|modeling_utils.py:388] 2022-03-17 14:51:58,483 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 14:52:00,136 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 14:52:01,800 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 14:52:03,448 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█ | 12/892 [01:25<1:40:30, 6.85s/it] + + 1%|█ | 12/892 [01:25<1:40:30, 6.85s/it][WARNING|modeling_utils.py:388] 2022-03-17 14:52:05,167 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 14:52:06,819 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 14:52:08,466 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 14:52:10,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█▏ | 13/892 [01:31<1:39:37, 6.80s/it] + + 1%|█▏ | 13/892 [01:31<1:39:37, 6.80s/it][WARNING|modeling_utils.py:388] 2022-03-17 14:52:11,872 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 14:52:13,542 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 14:52:15,190 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 9.482, 'learning_rate': 5.399999999999999e-06, 'epoch': 0.02} +[WARNING|modeling_utils.py:388] 2022-03-17 14:52:16,829 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 14/892 [01:38<1:39:04, 6.77s/it][WARNING|modeling_utils.py:388] 2022-03-17 14:52:18,547 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 14:52:20,190 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 14:52:21,816 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 14:52:23,425 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 15/892 [01:45<1:38:11, 6.72s/it] + + 2%|█▎ | 15/892 [01:45<1:38:11, 6.72s/it][WARNING|modeling_utils.py:388] 2022-03-17 14:52:25,108 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 14:52:26,731 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 14:52:28,336 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 14:52:29,932 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▍ | 16/892 [01:51<1:37:08, 6.65s/it] + + 2%|█▍ | 16/892 [01:51<1:37:08, 6.65s/it][WARNING|modeling_utils.py:388] 2022-03-17 14:52:31,636 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 14:52:33,209 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 14:52:34,823 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 14:52:36,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 17/892 [01:58<1:36:16, 6.60s/it] + + 2%|█▌ | 17/892 [01:58<1:36:16, 6.60s/it][WARNING|modeling_utils.py:388] 2022-03-17 14:52:38,089 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 14:52:39,658 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 14:52:41,264 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 14:52:42,856 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 18/892 [02:04<1:35:29, 6.56s/it] + + 2%|█▌ | 18/892 [02:04<1:35:29, 6.56s/it][WARNING|modeling_utils.py:388] 2022-03-17 14:52:44,570 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 14:52:46,157 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 14:52:47,743 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 14:52:49,348 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 7.6623, 'learning_rate': 8.4e-06, 'epoch': 0.02} + 2%|█▋ | 19/892 [02:11<1:35:06, 6.54s/it][WARNING|modeling_utils.py:388] 2022-03-17 14:52:51,016 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 14:52:52,565 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 14:52:54,145 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 7.4867, 'learning_rate': 8.999999999999999e-06, 'epoch': 0.02} +[WARNING|modeling_utils.py:388] 2022-03-17 14:52:55,727 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 20/892 [02:17<1:34:18, 6.49s/it][WARNING|modeling_utils.py:388] 2022-03-17 14:52:57,373 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 14:52:58,962 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 14:53:00,552 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 14:53:02,081 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▉ | 21/892 [02:23<1:33:36, 6.45s/it] + 2%|█▉ | 21/892 [02:23<1:33:36, 6.45s/it][WARNING|modeling_utils.py:388] 2022-03-17 14:53:03,757 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 14:53:05,291 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 14:53:06,877 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 14:53:08,385 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▉ | 22/892 [02:30<1:32:52, 6.40s/it][WARNING|modeling_utils.py:388] 2022-03-17 14:53:09,972 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 7.1014, 'learning_rate': 1.02e-05, 'epoch': 0.02} +[WARNING|modeling_utils.py:388] 2022-03-17 14:53:11,489 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 14:53:13,044 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 14:53:14,554 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 23/892 [02:36<1:31:47, 6.34s/it] + 3%|██ | 23/892 [02:36<1:31:47, 6.34s/it][WARNING|modeling_utils.py:388] 2022-03-17 14:53:16,217 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 14:53:17,756 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 14:53:19,296 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 14:53:20,882 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 24/892 [02:42<1:31:35, 6.33s/it] + 3%|██▏ | 24/892 [02:42<1:31:35, 6.33s/it][WARNING|modeling_utils.py:388] 2022-03-17 14:53:22,451 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 14:53:23,975 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 14:53:25,491 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 14:53:27,976 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 25/892 [02:49<1:34:51, 6.57s/it] + 3%|██▏ | 25/892 [02:49<1:34:51, 6.57s/it][WARNING|modeling_utils.py:388] 2022-03-17 14:53:29,624 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 14:53:31,146 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 14:53:29,624 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 14:53:31,146 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 14:53:29,624 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 14:53:34,135 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 14:53:29,624 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 14:53:34,135 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 14:53:29,624 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 26/892 [02:55<1:32:56, 6.44s/it][WARNING|modeling_utils.py:388] 2022-03-17 14:53:35,705 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 14:53:38,692 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 14:53:35,705 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 14:53:38,692 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 14:53:35,705 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 27/892 [03:02<1:31:09, 6.32s/it]g-point operations will not be computed-17 14:53:35,705 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 27/892 [03:02<1:31:09, 6.32s/it][WARNING|modeling_utils.py:388] 2022-03-17 14:53:41,715 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 14:53:44,691 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 14:53:41,715 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 14:53:44,691 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 14:53:41,715 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 28/892 [03:08<1:29:29, 6.22s/it]g-point operations will not be computed-17 14:53:41,715 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 28/892 [03:08<1:29:29, 6.22s/it][WARNING|modeling_utils.py:388] 2022-03-17 14:53:47,710 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 14:53:50,589 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 14:53:47,710 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 14:53:50,589 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 14:53:47,710 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 29/892 [03:13<1:28:05, 6.12s/it]g-point operations will not be computed-17 14:53:47,710 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 29/892 [03:13<1:28:05, 6.12s/it][WARNING|modeling_utils.py:388] 2022-03-17 14:53:53,582 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 14:53:56,474 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 14:53:53,582 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 14:53:56,474 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 14:53:53,582 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▋ | 30/892 [03:19<1:26:47, 6.04s/it]g-point operations will not be computed-17 14:53:53,582 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▋ | 30/892 [03:19<1:26:47, 6.04s/it][WARNING|modeling_utils.py:388] 2022-03-17 14:53:59,458 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 14:54:02,360 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 14:53:59,458 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 14:54:02,360 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 14:53:59,458 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▊ | 31/892 [03:25<1:26:03, 6.00s/it]g-point operations will not be computed-17 14:53:59,458 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▊ | 31/892 [03:25<1:26:03, 6.00s/it][WARNING|modeling_utils.py:388] 2022-03-17 14:54:05,289 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 14:54:08,086 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 14:54:05,289 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 14:54:08,086 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 14:54:05,289 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 32/892 [03:31<1:24:36, 5.90s/it][WARNING|modeling_utils.py:388] 2022-03-17 14:54:11,016 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 32/892 [03:31<1:24:36, 5.90s/it][WARNING|modeling_utils.py:388] 2022-03-17 14:54:11,016 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 33/892 [03:37<1:23:36, 5.84s/it]g-point operations will not be computed-17 14:54:11,016 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 33/892 [03:37<1:23:36, 5.84s/it]g-point operations will not be computed-17 14:54:11,016 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 33/892 [03:37<1:23:36, 5.84s/it][WARNING|modeling_utils.py:388] 2022-03-17 14:54:16,596 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 14:54:19,269 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 14:54:16,596 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 14:54:19,269 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 14:54:16,596 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███ | 34/892 [03:42<1:21:38, 5.71s/it]g-point operations will not be computed-17 14:54:16,596 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███ | 34/892 [03:42<1:21:38, 5.71s/it][WARNING|modeling_utils.py:388] 2022-03-17 14:54:21,986 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 14:54:24,564 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 14:54:21,986 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 14:54:24,564 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 14:54:21,986 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 35/892 [03:47<1:19:44, 5.58s/it][WARNING|modeling_utils.py:388] 2022-03-17 14:54:27,279 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 35/892 [03:47<1:19:44, 5.58s/it][WARNING|modeling_utils.py:388] 2022-03-17 14:54:27,279 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 36/892 [03:53<1:18:40, 5.51s/it]g-point operations will not be computed-17 14:54:27,279 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 36/892 [03:53<1:18:40, 5.51s/it]g-point operations will not be computed-17 14:54:27,279 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 36/892 [03:53<1:18:40, 5.51s/it][WARNING|modeling_utils.py:388] 2022-03-17 14:54:32,633 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 14:54:35,203 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 14:54:32,633 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 14:54:35,203 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 14:54:32,633 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▎ | 37/892 [03:58<1:17:21, 5.43s/it][WARNING|modeling_utils.py:388] 2022-03-17 14:54:37,797 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▎ | 37/892 [03:58<1:17:21, 5.43s/it][WARNING|modeling_utils.py:388] 2022-03-17 14:54:37,797 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▍ | 38/892 [04:03<1:15:38, 5.31s/it]g-point operations will not be computed-17 14:54:37,797 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▍ | 38/892 [04:03<1:15:38, 5.31s/it]g-point operations will not be computed-17 14:54:37,797 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▍ | 38/892 [04:03<1:15:38, 5.31s/it][WARNING|modeling_utils.py:388] 2022-03-17 14:54:42,793 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 14:54:45,240 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 14:54:42,793 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 14:54:45,240 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 14:54:42,793 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▍ | 39/892 [04:08<1:13:52, 5.20s/it][WARNING|modeling_utils.py:388] 2022-03-17 14:54:47,703 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▍ | 39/892 [04:08<1:13:52, 5.20s/it][WARNING|modeling_utils.py:388] 2022-03-17 14:54:47,703 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▍ | 39/892 [04:08<1:13:52, 5.20s/it][WARNING|modeling_utils.py:388] 2022-03-17 14:54:47,703 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▌ | 40/892 [04:13<1:11:58, 5.07s/it]g-point operations will not be computed-17 14:54:47,703 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▌ | 40/892 [04:13<1:11:58, 5.07s/it][WARNING|modeling_utils.py:388] 2022-03-17 14:54:52,405 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 41/892 [04:17<1:09:22, 4.89s/it]g-point operations will not be computed-17 14:54:52,405 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 41/892 [04:17<1:09:22, 4.89s/it]g-point operations will not be computed-17 14:54:52,405 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 41/892 [04:17<1:09:22, 4.89s/it][WARNING|modeling_utils.py:388] 2022-03-17 14:54:56,832 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 42/892 [04:21<1:06:46, 4.71s/it]g-point operations will not be computed-17 14:54:56,832 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 42/892 [04:21<1:06:46, 4.71s/it]g-point operations will not be computed-17 14:54:56,832 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 42/892 [04:21<1:06:46, 4.71s/it][WARNING|modeling_utils.py:388] 2022-03-17 14:55:01,077 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 43/892 [04:25<1:03:45, 4.51s/it]g-point operations will not be computed-17 14:55:01,077 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 43/892 [04:25<1:03:45, 4.51s/it]g-point operations will not be computed-17 14:55:01,077 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 43/892 [04:25<1:03:45, 4.51s/it][WARNING|modeling_utils.py:388] 2022-03-17 14:55:05,009 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 43/892 [04:25<1:03:45, 4.51s/it][WARNING|modeling_utils.py:388] 2022-03-17 14:55:05,009 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|████ | 44/892 [04:29<59:58, 4.24s/it]g-point operations will not be computed-17 14:55:05,009 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 14:55:10,129 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 14:55:08,564 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 14:55:10,129 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 14:55:08,564 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|████▏ | 45/892 [04:32<55:36, 3.94s/it][WARNING|modeling_utils.py:388] 2022-03-17 14:55:11,643 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|████▏ | 45/892 [04:32<55:36, 3.94s/it][WARNING|modeling_utils.py:388] 2022-03-17 14:55:11,643 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|████▏ | 46/892 [04:35<50:46, 3.60s/it][WARNING|modeling_utils.py:388] 2022-03-17 14:55:14,393 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|████▎ | 47/892 [04:38<46:10, 3.28s/it]g-point operations will not be computed-17 14:55:14,393 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|████▎ | 47/892 [04:38<46:10, 3.28s/it]g-point operations will not be computed-17 14:55:14,393 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|████▍ | 48/892 [04:40<41:22, 2.94s/it]g-point operations will not be computed-17 14:55:16,838 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|████▍ | 48/892 [04:40<41:22, 2.94s/it]g-point operations will not be computed-17 14:55:16,838 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|████▌ | 49/892 [04:42<37:11, 2.65s/it]g-point operations will not be computed-17 14:55:18,907 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|████▌ | 49/892 [04:42<37:11, 2.65s/it]g-point operations will not be computed-17 14:55:18,907 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 14:55:21,704 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 14:55:20,846 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 14:55:21,704 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 14:55:20,846 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 50/892 [04:44<37:15, 2.66s/it]g-point operations will not be computed-17 14:55:20,846 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 50/892 [04:44<37:15, 2.66s/it][WARNING|modeling_utils.py:388] 2022-03-17 14:55:24,988 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 14:55:28,780 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 14:55:24,988 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 51/892 [04:52<57:54, 4.13s/it]g-point operations will not be computed-17 14:55:24,988 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████��� | 51/892 [04:52<57:54, 4.13s/it]g-point operations will not be computed-17 14:55:24,988 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 51/892 [04:52<57:54, 4.13s/it][WARNING|modeling_utils.py:388] 2022-03-17 14:55:32,425 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 51/892 [04:52<57:54, 4.13s/it][WARNING|modeling_utils.py:388] 2022-03-17 14:55:32,425 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 14:55:35,956 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 14:55:32,425 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 14:55:35,956 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 14:55:32,425 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 52/892 [04:59<1:10:37, 5.04s/it]g-point operations will not be computed-17 14:55:32,425 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 52/892 [04:59<1:10:37, 5.04s/it][WARNING|modeling_utils.py:388] 2022-03-17 14:55:39,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 52/892 [04:59<1:10:37, 5.04s/it][WARNING|modeling_utils.py:388] 2022-03-17 14:55:39,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▊ | 53/892 [05:06<1:19:37, 5.69s/it]g-point operations will not be computed-17 14:55:39,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▊ | 53/892 [05:06<1:19:37, 5.69s/it]g-point operations will not be computed-17 14:55:39,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▊ | 53/892 [05:06<1:19:37, 5.69s/it][WARNING|modeling_utils.py:388] 2022-03-17 14:55:46,799 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▊ | 53/892 [05:06<1:19:37, 5.69s/it][WARNING|modeling_utils.py:388] 2022-03-17 14:55:46,799 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 14:55:50,228 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 14:55:46,799 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 14:55:50,228 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 14:55:46,799 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▊ | 54/892 [05:13<1:24:54, 6.08s/it][WARNING|modeling_utils.py:388] 2022-03-17 14:55:53,698 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▊ | 54/892 [05:13<1:24:54, 6.08s/it][WARNING|modeling_utils.py:388] 2022-03-17 14:55:53,698 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 14:55:57,153 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 14:55:53,698 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▉ | 55/892 [05:20<1:28:13, 6.32s/it]g-point operations will not be computed-17 14:55:53,698 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▉ | 55/892 [05:20<1:28:13, 6.32s/it]g-point operations will not be computed-17 14:55:53,698 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▉ | 55/892 [05:20<1:28:13, 6.32s/it][WARNING|modeling_utils.py:388] 2022-03-17 14:56:00,631 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▉ | 55/892 [05:20<1:28:13, 6.32s/it][WARNING|modeling_utils.py:388] 2022-03-17 14:56:00,631 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|█████ | 56/892 [05:27<1:30:43, 6.51s/it]g-point operations will not be computed-17 14:56:00,631 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|█████ | 56/892 [05:27<1:30:43, 6.51s/it]g-point operations will not be computed-17 14:56:00,631 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|█████ | 56/892 [05:27<1:30:43, 6.51s/it][WARNING|modeling_utils.py:388] 2022-03-17 14:56:07,608 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|█████ | 56/892 [05:27<1:30:43, 6.51s/it][WARNING|modeling_utils.py:388] 2022-03-17 14:56:07,608 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 14:56:10,979 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 14:56:07,608 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|█████ | 57/892 [05:34<1:32:31, 6.65s/it]g-point operations will not be computed-17 14:56:07,608 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|█████ | 57/892 [05:34<1:32:31, 6.65s/it]g-point operations will not be computed-17 14:56:07,608 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|█████ | 57/892 [05:34<1:32:31, 6.65s/it][WARNING|modeling_utils.py:388] 2022-03-17 14:56:14,506 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 14:56:17,932 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 14:56:14,506 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 58/892 [05:41<1:33:24, 6.72s/it]g-point operations will not be computed-17 14:56:14,506 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 58/892 [05:41<1:33:24, 6.72s/it]g-point operations will not be computed-17 14:56:14,506 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 58/892 [05:41<1:33:24, 6.72s/it][WARNING|modeling_utils.py:388] 2022-03-17 14:56:21,372 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 58/892 [05:41<1:33:24, 6.72s/it][WARNING|modeling_utils.py:388] 2022-03-17 14:56:21,372 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 59/892 [05:48<1:33:43, 6.75s/it]g-point operations will not be computed-17 14:56:21,372 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 59/892 [05:48<1:33:43, 6.75s/it][WARNING|modeling_utils.py:388] 2022-03-17 14:56:28,193 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 59/892 [05:48<1:33:43, 6.75s/it][WARNING|modeling_utils.py:388] 2022-03-17 14:56:28,193 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.2495, 'learning_rate': 3.1799999999999994e-05, 'epoch': 0.07} +[WARNING|modeling_utils.py:388] 2022-03-17 14:56:31,528 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 14:56:28,193 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▍ | 60/892 [05:55<1:33:30, 6.74s/it]g-point operations will not be computed-17 14:56:28,193 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▍ | 60/892 [05:55<1:33:30, 6.74s/it]g-point operations will not be computed-17 14:56:28,193 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▍ | 60/892 [05:55<1:33:30, 6.74s/it][WARNING|modeling_utils.py:388] 2022-03-17 14:56:34,926 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 14:56:38,250 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 14:56:34,926 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 14:56:38,250 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 14:56:34,926 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▍ | 61/892 [06:01<1:33:24, 6.74s/it]g-point operations will not be computed-17 14:56:34,926 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▍ | 61/892 [06:01<1:33:24, 6.74s/it][WARNING|modeling_utils.py:388] 2022-03-17 14:56:41,645 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▍ | 61/892 [06:01<1:33:24, 6.74s/it][WARNING|modeling_utils.py:388] 2022-03-17 14:56:41,645 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▌ | 62/892 [06:08<1:33:02, 6.73s/it]g-point operations will not be computed-17 14:56:41,645 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▌ | 62/892 [06:08<1:33:02, 6.73s/it]g-point operations will not be computed-17 14:56:41,645 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▌ | 62/892 [06:08<1:33:02, 6.73s/it][WARNING|modeling_utils.py:388] 2022-03-17 14:56:48,318 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▌ | 62/892 [06:08<1:33:02, 6.73s/it][WARNING|modeling_utils.py:388] 2022-03-17 14:56:48,318 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 14:56:51,594 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 14:56:48,318 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 14:56:51,594 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 14:56:48,318 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▋ | 63/892 [06:15<1:32:23, 6.69s/it][WARNING|modeling_utils.py:388] 2022-03-17 14:56:54,891 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▋ | 63/892 [06:15<1:32:23, 6.69s/it][WARNING|modeling_utils.py:388] 2022-03-17 14:56:54,891 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 14:56:58,146 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 14:56:54,891 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 14:56:58,146 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 14:56:54,891 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▋ | 64/892 [06:21<1:31:43, 6.65s/it][WARNING|modeling_utils.py:388] 2022-03-17 14:57:01,448 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▋ | 64/892 [06:21<1:31:43, 6.65s/it][WARNING|modeling_utils.py:388] 2022-03-17 14:57:01,448 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 14:57:04,644 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 14:57:01,448 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 14:57:04,644 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 14:57:01,448 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▊ | 65/892 [06:28<1:31:04, 6.61s/it]g-point operations will not be computed-17 14:57:01,448 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▊ | 65/892 [06:28<1:31:04, 6.61s/it][WARNING|modeling_utils.py:388] 2022-03-17 14:57:07,936 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 14:57:11,124 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 14:57:07,936 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▉ | 66/892 [06:34<1:30:18, 6.56s/it]g-point operations will not be computed-17 14:57:07,936 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▉ | 66/892 [06:34<1:30:18, 6.56s/it]g-point operations will not be computed-17 14:57:07,936 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▉ | 66/892 [06:34<1:30:18, 6.56s/it][WARNING|modeling_utils.py:388] 2022-03-17 14:57:14,362 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▉ | 66/892 [06:34<1:30:18, 6.56s/it][WARNING|modeling_utils.py:388] 2022-03-17 14:57:14,362 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 67/892 [06:40<1:29:33, 6.51s/it]g-point operations will not be computed-17 14:57:14,362 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 67/892 [06:40<1:29:33, 6.51s/it]g-point operations will not be computed-17 14:57:14,362 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 67/892 [06:40<1:29:33, 6.51s/it][WARNING|modeling_utils.py:388] 2022-03-17 14:57:20,801 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 67/892 [06:40<1:29:33, 6.51s/it][WARNING|modeling_utils.py:388] 2022-03-17 14:57:20,801 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 68/892 [06:47<1:28:58, 6.48s/it]g-point operations will not be computed-17 14:57:20,801 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 68/892 [06:47<1:28:58, 6.48s/it]g-point operations will not be computed-17 14:57:20,801 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 68/892 [06:47<1:28:58, 6.48s/it][WARNING|modeling_utils.py:388] 2022-03-17 14:57:27,170 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 68/892 [06:47<1:28:58, 6.48s/it][WARNING|modeling_utils.py:388] 2022-03-17 14:57:27,170 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████▏ | 69/892 [06:53<1:28:31, 6.45s/it]g-point operations will not be computed-17 14:57:27,170 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████▏ | 69/892 [06:53<1:28:31, 6.45s/it]g-point operations will not be computed-17 14:57:27,170 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████▏ | 69/892 [06:53<1:28:31, 6.45s/it][WARNING|modeling_utils.py:388] 2022-03-17 14:57:33,579 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████▏ | 69/892 [06:53<1:28:31, 6.45s/it][WARNING|modeling_utils.py:388] 2022-03-17 14:57:33,579 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████▎ | 70/892 [07:00<1:27:50, 6.41s/it]g-point operations will not be computed-17 14:57:33,579 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████▎ | 70/892 [07:00<1:27:50, 6.41s/it]g-point operations will not be computed-17 14:57:33,579 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████▎ | 70/892 [07:00<1:27:50, 6.41s/it][WARNING|modeling_utils.py:388] 2022-03-17 14:57:39,870 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████▎ | 70/892 [07:00<1:27:50, 6.41s/it][WARNING|modeling_utils.py:388] 2022-03-17 14:57:39,870 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 14:57:42,981 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 14:57:39,870 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 14:57:42,981 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 14:57:39,870 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████▎ | 71/892 [07:06<1:27:15, 6.38s/it][WARNING|modeling_utils.py:388] 2022-03-17 14:57:46,169 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████▎ | 71/892 [07:06<1:27:15, 6.38s/it][WARNING|modeling_utils.py:388] 2022-03-17 14:57:46,169 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 14:57:49,271 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 14:57:46,169 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 14:57:49,271 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 14:57:46,169 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████▍ | 72/892 [07:12<1:26:50, 6.35s/it]g-point operations will not be computed-17 14:57:46,169 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████▍ | 72/892 [07:12<1:26:50, 6.35s/it][WARNING|modeling_utils.py:388] 2022-03-17 14:57:52,432 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 14:57:55,464 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 14:57:52,432 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 14:57:55,464 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 14:57:52,432 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████▌ | 73/892 [07:18<1:25:57, 6.30s/it]g-point operations will not be computed-17 14:57:52,432 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████▌ | 73/892 [07:18<1:25:57, 6.30s/it][WARNING|modeling_utils.py:388] 2022-03-17 14:57:58,605 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 14:58:01,600 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 14:57:58,605 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 14:58:01,600 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 14:57:58,605 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████▋ | 74/892 [07:24<1:25:09, 6.25s/it]g-point operations will not be computed-17 14:57:58,605 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████▋ | 74/892 [07:24<1:25:09, 6.25s/it][WARNING|modeling_utils.py:388] 2022-03-17 14:58:04,678 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 14:58:07,646 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 14:58:04,678 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████▋ | 75/892 [07:32<1:28:34, 6.51s/it]g-point operations will not be computed-17 14:58:04,678 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████▋ | 75/892 [07:32<1:28:34, 6.51s/it]g-point operations will not be computed-17 14:58:04,678 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████▋ | 75/892 [07:32<1:28:34, 6.51s/it][WARNING|modeling_utils.py:388] 2022-03-17 14:58:11,856 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 14:58:14,828 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 14:58:11,856 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▊ | 76/892 [07:38<1:26:43, 6.38s/it]g-point operations will not be computed-17 14:58:11,856 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▊ | 76/892 [07:38<1:26:43, 6.38s/it]g-point operations will not be computed-17 14:58:11,856 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▊ | 76/892 [07:38<1:26:43, 6.38s/it][WARNING|modeling_utils.py:388] 2022-03-17 14:58:17,852 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▊ | 76/892 [07:38<1:26:43, 6.38s/it][WARNING|modeling_utils.py:388] 2022-03-17 14:58:17,852 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▉ | 77/892 [07:44<1:25:13, 6.27s/it]g-point operations will not be computed-17 14:58:17,852 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▉ | 77/892 [07:44<1:25:13, 6.27s/it]g-point operations will not be computed-17 14:58:17,852 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▉ | 77/892 [07:44<1:25:13, 6.27s/it][WARNING|modeling_utils.py:388] 2022-03-17 14:58:23,896 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 14:58:26,858 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 14:58:23,896 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▉ | 78/892 [07:50<1:23:53, 6.18s/it]g-point operations will not be computed-17 14:58:23,896 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▉ | 78/892 [07:50<1:23:53, 6.18s/it]g-point operations will not be computed-17 14:58:23,896 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▉ | 78/892 [07:50<1:23:53, 6.18s/it][WARNING|modeling_utils.py:388] 2022-03-17 14:58:29,842 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 14:58:32,733 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 14:58:29,842 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 14:58:32,733 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 14:58:29,842 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|███████ | 79/892 [07:56<1:22:36, 6.10s/it]g-point operations will not be computed-17 14:58:29,842 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|███████ | 79/892 [07:56<1:22:36, 6.10s/it][WARNING|modeling_utils.py:388] 2022-03-17 14:58:35,759 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 14:58:38,695 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 14:58:35,759 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 14:58:38,695 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 14:58:35,759 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|███████▏ | 80/892 [08:01<1:21:49, 6.05s/it]g-point operations will not be computed-17 14:58:35,759 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|███████▏ | 80/892 [08:01<1:21:49, 6.05s/it][WARNING|modeling_utils.py:388] 2022-03-17 14:58:41,651 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 14:58:44,505 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 14:58:41,651 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 14:58:44,505 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 14:58:41,651 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|███████▎ | 81/892 [08:07<1:20:33, 5.96s/it][WARNING|modeling_utils.py:388] 2022-03-17 14:58:47,363 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|███████▎ | 81/892 [08:07<1:20:33, 5.96s/it][WARNING|modeling_utils.py:388] 2022-03-17 14:58:47,363 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|███████▎ | 82/892 [08:13<1:19:37, 5.90s/it]g-point operations will not be computed-17 14:58:47,363 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|███████▎ | 82/892 [08:13<1:19:37, 5.90s/it]g-point operations will not be computed-17 14:58:47,363 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|███████▎ | 82/892 [08:13<1:19:37, 5.90s/it][WARNING|modeling_utils.py:388] 2022-03-17 14:58:53,137 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|███████▎ | 82/892 [08:13<1:19:37, 5.90s/it][WARNING|modeling_utils.py:388] 2022-03-17 14:58:53,137 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|███████▍ | 83/892 [08:19<1:18:43, 5.84s/it]g-point operations will not be computed-17 14:58:53,137 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|███████▍ | 83/892 [08:19<1:18:43, 5.84s/it]g-point operations will not be computed-17 14:58:53,137 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|███████▍ | 83/892 [08:19<1:18:43, 5.84s/it][WARNING|modeling_utils.py:388] 2022-03-17 14:58:58,779 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 14:59:01,517 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 14:58:58,779 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|███████▌ | 84/892 [08:24<1:17:27, 5.75s/it]g-point operations will not be computed-17 14:58:58,779 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|███████▌ | 84/892 [08:24<1:17:27, 5.75s/it]g-point operations will not be computed-17 14:58:58,779 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|███████▌ | 84/892 [08:24<1:17:27, 5.75s/it][WARNING|modeling_utils.py:388] 2022-03-17 14:59:04,337 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 14:59:07,016 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 14:59:04,337 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 14:59:07,016 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 14:59:04,337 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▌ | 85/892 [08:30<1:16:07, 5.66s/it][WARNING|modeling_utils.py:388] 2022-03-17 14:59:09,721 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 14:59:12,319 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 14:59:09,721 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▋ | 86/892 [08:35<1:14:32, 5.55s/it]g-point operations will not be computed-17 14:59:09,721 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▋ | 86/892 [08:35<1:14:32, 5.55s/it]g-point operations will not be computed-17 14:59:09,721 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▋ | 86/892 [08:35<1:14:32, 5.55s/it][WARNING|modeling_utils.py:388] 2022-03-17 14:59:15,000 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 14:59:17,541 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 14:59:15,000 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 14:59:17,541 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 14:59:15,000 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▊ | 87/892 [08:40<1:12:58, 5.44s/it][WARNING|modeling_utils.py:388] 2022-03-17 14:59:20,164 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 14:59:22,626 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 14:59:20,164 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▉ | 88/892 [08:45<1:11:18, 5.32s/it]g-point operations will not be computed-17 14:59:20,164 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▉ | 88/892 [08:45<1:11:18, 5.32s/it]g-point operations will not be computed-17 14:59:20,164 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▉ | 88/892 [08:45<1:11:18, 5.32s/it][WARNING|modeling_utils.py:388] 2022-03-17 14:59:25,172 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 14:59:27,569 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 14:59:25,172 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 14:59:27,569 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 14:59:25,172 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▉ | 89/892 [08:50<1:09:28, 5.19s/it][WARNING|modeling_utils.py:388] 2022-03-17 14:59:30,030 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 14:59:32,323 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 14:59:30,030 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 14:59:32,323 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 14:59:30,030 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|████████ | 90/892 [08:55<1:07:26, 5.05s/it][WARNING|modeling_utils.py:388] 2022-03-17 14:59:34,629 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|████████ | 90/892 [08:55<1:07:26, 5.05s/it][WARNING|modeling_utils.py:388] 2022-03-17 14:59:34,629 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|████████▏ | 91/892 [08:59<1:05:10, 4.88s/it]g-point operations will not be computed-17 14:59:34,629 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|████████▏ | 91/892 [08:59<1:05:10, 4.88s/it]g-point operations will not be computed-17 14:59:34,629 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|████████▏ | 91/892 [08:59<1:05:10, 4.88s/it][WARNING|modeling_utils.py:388] 2022-03-17 14:59:39,068 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|████████▎ | 92/892 [09:04<1:02:19, 4.67s/it]g-point operations will not be computed-17 14:59:39,068 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|████████▎ | 92/892 [09:04<1:02:19, 4.67s/it]g-point operations will not be computed-17 14:59:39,068 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|████████▎ | 92/892 [09:04<1:02:19, 4.67s/it][WARNING|modeling_utils.py:388] 2022-03-17 14:59:43,188 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|████████▌ | 93/892 [09:07<59:07, 4.44s/it]g-point operations will not be computed-17 14:59:43,188 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|████████▌ | 93/892 [09:07<59:07, 4.44s/it]g-point operations will not be computed-17 14:59:43,188 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 14:59:48,756 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 14:59:47,019 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▋ | 94/892 [09:11<55:37, 4.18s/it][WARNING|modeling_utils.py:388] 2022-03-17 14:59:50,548 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▋ | 94/892 [09:11<55:37, 4.18s/it][WARNING|modeling_utils.py:388] 2022-03-17 14:59:50,548 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▋ | 95/892 [09:14<52:08, 3.93s/it]g-point operations will not be computed-17 14:59:50,548 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▋ | 95/892 [09:14<52:08, 3.93s/it]g-point operations will not be computed-17 14:59:50,548 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▋ | 95/892 [09:14<52:08, 3.93s/it][WARNING|modeling_utils.py:388] 2022-03-17 14:59:53,804 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▊ | 96/892 [09:17<48:24, 3.65s/it][WARNING|modeling_utils.py:388] 2022-03-17 14:59:56,684 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▊ | 96/892 [09:17<48:24, 3.65s/it][WARNING|modeling_utils.py:388] 2022-03-17 14:59:56,684 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▉ | 97/892 [09:20<44:17, 3.34s/it]g-point operations will not be computed-17 14:59:56,684 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▉ | 97/892 [09:20<44:17, 3.34s/it]g-point operations will not be computed-17 14:59:56,684 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|█████████ | 98/892 [09:22<39:59, 3.02s/it]g-point operations will not be computed-17 14:59:59,237 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|█████████ | 98/892 [09:22<39:59, 3.02s/it]g-point operations will not be computed-17 14:59:59,237 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|█████████ | 99/892 [09:24<36:04, 2.73s/it]g-point operations will not be computed-17 15:00:01,470 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|█████████ | 99/892 [09:24<36:04, 2.73s/it]g-point operations will not be computed-17 15:00:01,470 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:00:04,222 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:00:03,419 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:00:04,222 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:00:03,419 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|█████████ | 100/892 [09:27<35:10, 2.66s/it]g-point operations will not be computed-17 15:00:03,419 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|█████████ | 100/892 [09:27<35:10, 2.66s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:00:07,450 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:00:11,244 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:00:07,450 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|█████████▏ | 101/892 [09:34<54:51, 4.16s/it]g-point operations will not be computed-17 15:00:07,450 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|█████████▏ | 101/892 [09:34<54:51, 4.16s/it]g-point operations will not be computed-17 15:00:07,450 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|█████████▏ | 101/892 [09:34<54:51, 4.16s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:00:14,913 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|█████████▏ | 101/892 [09:34<54:51, 4.16s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:00:14,913 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:00:18,497 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:00:14,913 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|█████████ | 102/892 [09:42<1:06:55, 5.08s/it]g-point operations will not be computed-17 15:00:14,913 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|█████████ | 102/892 [09:42<1:06:55, 5.08s/it]g-point operations will not be computed-17 15:00:14,913 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|█████████ | 102/892 [09:42<1:06:55, 5.08s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:00:22,146 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:00:25,600 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:00:22,146 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:00:25,600 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:00:22,146 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|█████████ | 103/892 [09:49<1:14:30, 5.67s/it]g-point operations will not be computed-17 15:00:22,146 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|█████████ | 103/892 [09:49<1:14:30, 5.67s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:00:29,123 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|█████████ | 103/892 [09:49<1:14:30, 5.67s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:00:29,123 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:00:32,614 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:00:29,123 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:00:32,614 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:00:29,123 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|█████████▏ | 104/892 [09:56<1:19:40, 6.07s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:00:36,161 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|█████████▏ | 104/892 [09:56<1:19:40, 6.07s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:00:36,161 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|█████████▏ | 104/892 [09:56<1:19:40, 6.07s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:00:36,161 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|█████████▏ | 104/892 [09:56<1:19:40, 6.07s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:00:36,161 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|█████████▎ | 105/892 [10:03<1:23:23, 6.36s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:00:36,161 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|█████████▎ | 105/892 [10:03<1:23:23, 6.36s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:00:36,161 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|█████████▎ | 105/892 [10:03<1:23:23, 6.36s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:00:36,161 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|█████████▎ | 105/892 [10:03<1:23:23, 6.36s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:00:36,161 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|█████████▍ | 106/892 [10:10<1:25:26, 6.52s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:00:50,061 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|█████████▍ | 106/892 [10:10<1:25:26, 6.52s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:00:50,061 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.1412, 'learning_rate': 5.9999999999999995e-05, 'epoch': 0.12} + 12%|█████████▍ | 106/892 [10:10<1:25:26, 6.52s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:00:50,061 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|█████████▍ | 107/892 [10:16<1:26:27, 6.61s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:00:50,061 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|█████████▍ | 107/892 [10:16<1:26:27, 6.61s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:00:50,061 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.0822, 'learning_rate': 6.0599999999999996e-05, 'epoch': 0.12} +[WARNING|modeling_utils.py:388] 2022-03-17 15:01:00,226 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:00:50,061 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:01:00,226 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:00:50,061 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|█████████▌ | 108/892 [10:23<1:27:18, 6.68s/it]g-point operations will not be computed-17 15:00:50,061 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|█████████▌ | 108/892 [10:23<1:27:18, 6.68s/it]g-point operations will not be computed-17 15:00:50,061 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|█████████▌ | 108/892 [10:23<1:27:18, 6.68s/it]g-point operations will not be computed-17 15:00:50,061 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:01:08,695 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:00:50,061 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:01:08,695 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:00:50,061 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.7549, 'learning_rate': 6.18e-05, 'epoch': 0.12} +[WARNING|modeling_utils.py:388] 2022-03-17 15:01:08,695 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:00:50,061 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:01:08,695 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:00:50,061 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:01:08,695 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:00:50,061 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|█████████▋ | 110/892 [10:37<1:27:42, 6.73s/it]g-point operations will not be computed-17 15:00:50,061 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|█████████▋ | 110/892 [10:37<1:27:42, 6.73s/it]g-point operations will not be computed-17 15:00:50,061 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:01:20,472 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:00:50,061 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:01:20,472 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:00:50,061 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|█████████▊ | 111/892 [10:43<1:27:13, 6.70s/it]g-point operations will not be computed-17 15:00:50,061 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|█████████▊ | 111/892 [10:43<1:27:13, 6.70s/it]g-point operations will not be computed-17 15:00:50,061 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|█████████▊ | 111/892 [10:43<1:27:13, 6.70s/it]g-point operations will not be computed-17 15:00:50,061 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|█████████▊ | 111/892 [10:43<1:27:13, 6.70s/it]g-point operations will not be computed-17 15:00:50,061 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:01:28,640 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:00:50,061 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:01:28,640 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:00:50,061 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:01:28,640 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:00:50,061 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:01:35,186 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:00:50,061 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:01:35,186 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:00:50,061 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.8381, 'learning_rate': 6.419999999999999e-05, 'epoch': 0.13} +[WARNING|modeling_utils.py:388] 2022-03-17 15:01:35,186 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:00:50,061 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:01:35,186 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:00:50,061 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:01:35,186 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:00:50,061 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|██████████ | 114/892 [11:03<1:25:22, 6.58s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:01:43,362 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|██████████ | 114/892 [11:03<1:25:22, 6.58s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:01:43,362 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|██████████ | 114/892 [11:03<1:25:22, 6.58s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:01:43,362 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|██████████ | 114/892 [11:03<1:25:22, 6.58s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:01:43,362 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|██████████▏ | 115/892 [11:10<1:24:46, 6.55s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:01:43,362 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:01:51,426 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:01:43,362 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:01:51,426 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:01:43,362 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:01:51,426 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:01:43,362 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|██████████▎ | 116/892 [11:16<1:24:15, 6.52s/it]g-point operations will not be computed-17 15:01:43,362 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:01:57,803 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:01:43,362 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:01:57,803 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:01:43,362 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:01:57,803 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:01:43,362 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|██████████▎ | 117/892 [11:22<1:23:33, 6.47s/it]g-point operations will not be computed-17 15:01:43,362 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|██████████▎ | 117/892 [11:22<1:23:33, 6.47s/it]g-point operations will not be computed-17 15:01:43,362 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:02:05,756 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:01:43,362 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|██████████▍ | 118/892 [11:29<1:22:56, 6.43s/it]g-point operations will not be computed-17 15:01:43,362 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|██████████▍ | 118/892 [11:29<1:22:56, 6.43s/it]g-point operations will not be computed-17 15:01:43,362 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.8077, 'learning_rate': 6.72e-05, 'epoch': 0.13} + 13%|██████████▍ | 118/892 [11:29<1:22:56, 6.43s/it]g-point operations will not be computed-17 15:01:43,362 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:02:13,641 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:01:43,362 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:02:13,641 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:01:43,362 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.9312, 'learning_rate': 6.78e-05, 'epoch': 0.13} +[WARNING|modeling_utils.py:388] 2022-03-17 15:02:13,641 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:01:43,362 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:02:19,948 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:01:43,362 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:02:19,948 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:01:43,362 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.9596, 'learning_rate': 6.84e-05, 'epoch': 0.13} +[WARNING|modeling_utils.py:388] 2022-03-17 15:02:19,948 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:01:43,362 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:02:26,218 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:01:43,362 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:02:26,218 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:01:43,362 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.7884, 'learning_rate': 6.9e-05, 'epoch': 0.14} +[WARNING|modeling_utils.py:388] 2022-03-17 15:02:26,218 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:01:43,362 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:02:32,433 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:01:43,362 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:02:32,433 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:01:43,362 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.0901, 'learning_rate': 6.96e-05, 'epoch': 0.14} +[WARNING|modeling_utils.py:388] 2022-03-17 15:02:32,433 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:01:43,362 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:02:38,586 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:01:43,362 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:02:38,586 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:01:43,362 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.6784, 'learning_rate': 7.02e-05, 'epoch': 0.14} +[WARNING|modeling_utils.py:388] 2022-03-17 15:02:38,586 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:01:43,362 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:02:44,689 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:01:43,362 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:02:44,689 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:01:43,362 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.9247, 'learning_rate': 7.079999999999999e-05, 'epoch': 0.14} +[WARNING|modeling_utils.py:388] 2022-03-17 15:02:44,689 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:01:43,362 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:02:44,689 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:01:43,362 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:02:44,689 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:01:43,362 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|███████████ | 125/892 [12:13<1:22:21, 6.44s/it]g-point operations will not be computed-17 15:01:43,362 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:02:54,830 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:01:43,362 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:02:54,830 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:01:43,362 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:02:54,830 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:01:43,362 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|███████████▏ | 126/892 [12:19<1:21:07, 6.35s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:02:59,381 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|███████████▏ | 126/892 [12:19<1:21:07, 6.35s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:02:59,381 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|███████████▏ | 126/892 [12:19<1:21:07, 6.35s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:02:59,381 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|███████████▏ | 126/892 [12:19<1:21:07, 6.35s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:02:59,381 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|███████████▏ | 127/892 [12:25<1:19:42, 6.25s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:03:05,352 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|███████████▏ | 127/892 [12:25<1:19:42, 6.25s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:03:05,352 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:03:09,660 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:03:05,352 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:03:09,660 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:03:05,352 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.8704, 'learning_rate': 7.319999999999999e-05, 'epoch': 0.14} +[WARNING|modeling_utils.py:388] 2022-03-17 15:03:09,660 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:03:05,352 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:03:15,474 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:03:05,352 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:03:15,474 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:03:05,352 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.7229, 'learning_rate': 7.379999999999999e-05, 'epoch': 0.14} +[WARNING|modeling_utils.py:388] 2022-03-17 15:03:19,806 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:03:05,352 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 15%|███████████▌ | 130/892 [12:43<1:15:33, 5.95s/it]g-point operations will not be computed-17 15:03:05,352 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 15%|███████████▌ | 130/892 [12:43<1:15:33, 5.95s/it]g-point operations will not be computed-17 15:03:05,352 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:03:24,160 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:03:05,352 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:03:24,160 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:03:05,352 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 15%|███████████▌ | 131/892 [12:48<1:14:45, 5.89s/it]g-point operations will not be computed-17 15:03:05,352 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 15%|███████████▌ | 131/892 [12:48<1:14:45, 5.89s/it]g-point operations will not be computed-17 15:03:05,352 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:03:29,848 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:03:05,352 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:03:29,848 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:03:05,352 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 15%|███████████▋ | 132/892 [12:54<1:13:41, 5.82s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:03:34,077 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 15%|███████████▋ | 132/892 [12:54<1:13:41, 5.82s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:03:34,077 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.8715, 'learning_rate': 7.56e-05, 'epoch': 0.15} +[WARNING|modeling_utils.py:388] 2022-03-17 15:03:38,181 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:03:34,077 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:03:38,181 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:03:34,077 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.8147, 'learning_rate': 7.62e-05, 'epoch': 0.15} +[WARNING|modeling_utils.py:388] 2022-03-17 15:03:42,280 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:03:34,077 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 15%|███████████▊ | 134/892 [13:05<1:11:15, 5.64s/it]g-point operations will not be computed-17 15:03:34,077 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 15%|███████████▊ | 134/892 [13:05<1:11:15, 5.64s/it]g-point operations will not be computed-17 15:03:34,077 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:03:46,335 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:03:34,077 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:03:46,335 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:03:34,077 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 15%|███████████▉ | 135/892 [13:10<1:09:57, 5.54s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:03:50,307 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 15%|███████████▉ | 135/892 [13:10<1:09:57, 5.54s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:03:50,307 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.6857, 'learning_rate': 7.74e-05, 'epoch': 0.15} +[WARNING|modeling_utils.py:388] 2022-03-17 15:03:54,177 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:03:50,307 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:03:54,177 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:03:50,307 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.7652, 'learning_rate': 7.8e-05, 'epoch': 0.15} +[WARNING|modeling_utils.py:388] 2022-03-17 15:03:58,131 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:03:50,307 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:03:58,131 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:03:50,307 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 15%|████████████▏ | 137/892 [13:21<1:07:45, 5.38s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:04:00,699 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 15%|████████████▏ | 137/892 [13:21<1:07:45, 5.38s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:04:00,699 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 15%|████████████▏ | 137/892 [13:21<1:07:45, 5.38s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:04:00,699 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:04:04,381 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:04:00,699 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:04:06,809 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:04:00,699 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:04:09,129 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:04:00,699 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:04:09,129 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:04:00,699 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:04:09,129 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:04:00,699 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:04:12,615 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:04:00,699 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:04:12,615 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:04:00,699 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 16%|████████████▍ | 140/892 [13:35<1:01:55, 4.94s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:04:14,836 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:04:16,904 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:04:14,836 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 16%|████████████▊ | 141/892 [13:39<58:57, 4.71s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:04:18,898 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 16%|████████████▊ | 141/892 [13:39<58:57, 4.71s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:04:18,898 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:04:20,760 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:04:18,898 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 16%|████████████▉ | 142/892 [13:43<55:34, 4.45s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:04:22,683 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 16%|████████████▉ | 142/892 [13:43<55:34, 4.45s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:04:22,683 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:04:24,412 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:04:22,683 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:04:24,412 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:04:22,683 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 16%|████████████▉ | 143/892 [13:47<52:13, 4.18s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:04:26,183 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 16%|████████████▉ | 143/892 [13:47<52:13, 4.18s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:04:26,183 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 16%|█████████████ | 144/892 [13:50<48:42, 3.91s/it]g-point operations will not be computed-17 15:04:26,183 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:04:30,875 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:04:29,378 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:04:30,875 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:04:29,378 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 16%|█████████████▏ | 145/892 [13:53<45:24, 3.65s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:04:32,357 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 16%|█████████████▏ | 145/892 [13:53<45:24, 3.65s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:04:32,357 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 16%|█████████████▎ | 146/892 [13:56<42:00, 3.38s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:04:35,031 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + g-point operations will not be computed-17 15:04:35,031 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + g-point operations will not be computed-17 15:04:35,031 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:04:38,473 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:04:37,414 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:04:38,473 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:04:37,414 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:04:40,482 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:04:39,544 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:04:40,482 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:04:39,544 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:04:42,317 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:04:41,511 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:04:42,317 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:04:41,511 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 17%|█████████████▌ | 150/892 [14:05<31:57, 2.58s/it]g-point operations will not be computed-17 15:04:41,511 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 17%|█████████████▌ | 150/892 [14:05<31:57, 2.58s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:04:45,530 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:04:49,191 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:04:45,530 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:04:49,191 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:04:45,530 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 17%|█████████████▋ | 151/892 [14:12<49:50, 4.04s/it]g-point operations will not be computed-17 15:04:45,530 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 17%|█████████████▋ | 151/892 [14:12<49:50, 4.04s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:04:52,808 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 17%|█████████████▋ | 151/892 [14:12<49:50, 4.04s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:04:52,808 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:04:56,326 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:04:52,808 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:04:56,326 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:04:52,808 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 17%|█████████████▍ | 152/892 [14:19<1:01:01, 4.95s/it]g-point operations will not be computed-17 15:04:52,808 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 17%|█████████████▍ | 152/892 [14:19<1:01:01, 4.95s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:04:59,857 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:05:03,321 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:04:59,857 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:05:03,321 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:04:59,857 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 17%|█████████████▌ | 153/892 [14:26<1:08:28, 5.56s/it]g-point operations will not be computed-17 15:04:59,857 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 17%|█████████████▌ | 153/892 [14:26<1:08:28, 5.56s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:05:06,890 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 17%|█████████████▌ | 153/892 [14:26<1:08:28, 5.56s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:05:06,890 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 17%|█████████████▌ | 153/892 [14:26<1:08:28, 5.56s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:05:06,890 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 17%|█████████████▌ | 153/892 [14:26<1:08:28, 5.56s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:05:06,890 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 17%|█████████████▋ | 154/892 [14:33<1:13:44, 5.99s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:05:06,890 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:05:15,542 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:05:06,890 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:05:15,542 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:05:06,890 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:05:15,542 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:05:06,890 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 17%|█████████████▋ | 155/892 [14:40<1:16:59, 6.27s/it]g-point operations will not be computed-17 15:05:06,890 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 17%|█████████████▋ | 155/892 [14:40<1:16:59, 6.27s/it]g-point operations will not be computed-17 15:05:06,890 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:05:24,092 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:05:06,890 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 17%|█████████████▊ | 156/892 [14:47<1:18:53, 6.43s/it]g-point operations will not be computed-17 15:05:06,890 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 17%|█████████████▊ | 156/892 [14:47<1:18:53, 6.43s/it]g-point operations will not be computed-17 15:05:06,890 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.8424, 'learning_rate': 8.999999999999999e-05, 'epoch': 0.17} + 17%|█████████████▊ | 156/892 [14:47<1:18:53, 6.43s/it]g-point operations will not be computed-17 15:05:06,890 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 17%|█████████████▊ | 156/892 [14:47<1:18:53, 6.43s/it]g-point operations will not be computed-17 15:05:06,890 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 17%|█████████████▊ | 156/892 [14:47<1:18:53, 6.43s/it]g-point operations will not be computed-17 15:05:06,890 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 18%|█████████████▉ | 157/892 [14:55<1:22:14, 6.71s/it]g-point operations will not be computed-17 15:05:06,890 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 18%|█████████████▉ | 157/892 [14:55<1:22:14, 6.71s/it]g-point operations will not be computed-17 15:05:06,890 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 18%|█████████████▉ | 157/892 [14:55<1:22:14, 6.71s/it]g-point operations will not be computed-17 15:05:06,890 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:05:40,008 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:05:06,890 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:05:40,008 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:05:06,890 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.0679, 'learning_rate': 9.12e-05, 'epoch': 0.18} +[WARNING|modeling_utils.py:388] 2022-03-17 15:05:40,008 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:05:06,890 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:05:40,008 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:05:06,890 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:05:40,008 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:05:06,890 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 18%|██████████████ | 159/892 [15:08<1:22:34, 6.76s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:05:48,487 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 18%|██████████████ | 159/892 [15:08<1:22:34, 6.76s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:05:48,487 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 18%|██████████████ | 159/892 [15:08<1:22:34, 6.76s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:05:48,487 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 18%|██████████████ | 159/892 [15:08<1:22:34, 6.76s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:05:48,487 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 18%|██████████████▏ | 160/892 [15:15<1:22:22, 6.75s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:05:48,487 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 18%|██████████████▏ | 160/892 [15:15<1:22:22, 6.75s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:05:48,487 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:05:58,505 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:05:48,487 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:05:58,505 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:05:48,487 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 18%|██████████████▎ | 161/892 [15:22<1:21:51, 6.72s/it]g-point operations will not be computed-17 15:05:48,487 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 18%|██████████████▎ | 161/892 [15:22<1:21:51, 6.72s/it]g-point operations will not be computed-17 15:05:48,487 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 18%|██████████████▎ | 161/892 [15:22<1:21:51, 6.72s/it]g-point operations will not be computed-17 15:05:48,487 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 18%|██████████████▎ | 161/892 [15:22<1:21:51, 6.72s/it]g-point operations will not be computed-17 15:05:48,487 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 18%|██████████████▎ | 161/892 [15:22<1:21:51, 6.72s/it]g-point operations will not be computed-17 15:05:48,487 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 18%|██████████████▎ | 162/892 [15:28<1:22:26, 6.78s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:06:08,762 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 18%|██████████████▎ | 162/892 [15:28<1:22:26, 6.78s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:06:08,762 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 18%|██████████████▎ | 162/892 [15:28<1:22:26, 6.78s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:06:08,762 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 18%|██████████████▎ | 162/892 [15:28<1:22:26, 6.78s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:06:08,762 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 18%|██████████████▍ | 163/892 [15:35<1:21:34, 6.71s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:06:08,762 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:06:16,948 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:06:08,762 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:06:16,948 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:06:08,762 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:06:16,948 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:06:08,762 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 18%|██████████████▌ | 164/892 [15:42<1:21:01, 6.68s/it]g-point operations will not be computed-17 15:06:08,762 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 18%|██████████████▌ | 164/892 [15:42<1:21:01, 6.68s/it]g-point operations will not be computed-17 15:06:08,762 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:06:25,091 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:06:08,762 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 18%|██████████████▌ | 165/892 [15:48<1:20:02, 6.61s/it]g-point operations will not be computed-17 15:06:08,762 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 18%|██████████████▌ | 165/892 [15:48<1:20:02, 6.61s/it]g-point operations will not be computed-17 15:06:08,762 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.8338, 'learning_rate': 9.539999999999999e-05, 'epoch': 0.18} +[WARNING|modeling_utils.py:388] 2022-03-17 15:06:31,512 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:06:08,762 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 19%|██████████████▋ | 166/892 [15:54<1:19:22, 6.56s/it]g-point operations will not be computed-17 15:06:08,762 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 19%|██████████████▋ | 166/892 [15:54<1:19:22, 6.56s/it]g-point operations will not be computed-17 15:06:08,762 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.8404, 'learning_rate': 9.599999999999999e-05, 'epoch': 0.19} + 19%|██████████████▋ | 166/892 [15:54<1:19:22, 6.56s/it]g-point operations will not be computed-17 15:06:08,762 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:06:39,467 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:06:08,762 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:06:39,467 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:06:08,762 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.8793, 'learning_rate': 9.659999999999999e-05, 'epoch': 0.19} +[WARNING|modeling_utils.py:388] 2022-03-17 15:06:39,467 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:06:08,762 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:06:45,853 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:06:08,762 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:06:45,853 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:06:08,762 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.7065, 'learning_rate': 9.719999999999999e-05, 'epoch': 0.19} +[WARNING|modeling_utils.py:388] 2022-03-17 15:06:45,853 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:06:08,762 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:06:45,853 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:06:08,762 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:06:45,853 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:06:08,762 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 19%|██████████████▉ | 169/892 [16:14<1:17:25, 6.42s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:06:53,829 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 19%|██████████████▉ | 169/892 [16:14<1:17:25, 6.42s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:06:53,829 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 19%|██████████████▉ | 169/892 [16:14<1:17:25, 6.42s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:06:53,829 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 19%|██████████████▉ | 169/892 [16:14<1:17:25, 6.42s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:06:53,829 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 19%|███████████████ | 170/892 [16:20<1:17:03, 6.40s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:06:53,829 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:07:01,682 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:06:53,829 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:07:01,682 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:06:53,829 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:07:01,682 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:06:53,829 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 19%|███████████████▏ | 171/892 [16:26<1:16:17, 6.35s/it]g-point operations will not be computed-17 15:06:53,829 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:07:07,921 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:06:53,829 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:07:07,921 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:06:53,829 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:07:07,921 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:06:53,829 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 19%|███████████████▏ | 172/892 [16:32<1:15:50, 6.32s/it]g-point operations will not be computed-17 15:06:53,829 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:07:14,132 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:06:53,829 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:07:14,132 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:06:53,829 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:07:14,132 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:06:53,829 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 19%|███████████████▎ | 173/892 [16:39<1:15:03, 6.26s/it]g-point operations will not be computed-17 15:06:53,829 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:07:20,233 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:06:53,829 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:07:20,233 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:06:53,829 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:07:20,233 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:06:53,829 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 20%|███████████████▍ | 174/892 [16:45<1:14:29, 6.23s/it]g-point operations will not be computed-17 15:06:53,829 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:07:26,326 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:06:53,829 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:07:26,326 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:06:53,829 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 20%|███████████████▍ | 175/892 [16:52<1:17:20, 6.47s/it]g-point operations will not be computed-17 15:06:53,829 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 20%|███████████████▍ | 175/892 [16:52<1:17:20, 6.47s/it]g-point operations will not be computed-17 15:06:53,829 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.7985, 'learning_rate': 0.0001014, 'epoch': 0.2} + 20%|███████████████▍ | 175/892 [16:52<1:17:20, 6.47s/it]g-point operations will not be computed-17 15:06:53,829 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:07:36,362 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:06:53,829 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:07:36,362 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:06:53,829 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.7022, 'learning_rate': 0.000102, 'epoch': 0.2} +[WARNING|modeling_utils.py:388] 2022-03-17 15:07:36,362 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:06:53,829 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:07:42,208 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:06:53,829 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:07:42,208 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:06:53,829 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:07:45,187 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:06:53,829 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:07:45,187 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:06:53,829 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:07:45,187 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:06:53,829 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 20%|███████████████▊ | 178/892 [17:09<1:12:39, 6.11s/it]g-point operations will not be computed-17 15:06:53,829 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:07:51,084 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:06:53,829 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:07:51,084 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:06:53,829 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:07:51,084 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:06:53,829 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 20%|███████████████▊ | 179/892 [17:15<1:11:41, 6.03s/it]g-point operations will not be computed-17 15:06:53,829 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:07:56,928 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:06:53,829 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:07:56,928 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:06:53,829 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:07:56,928 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:06:53,829 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 20%|███████████████▉ | 180/892 [17:21<1:10:47, 5.97s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:08:01,265 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 20%|███████████████▉ | 180/892 [17:21<1:10:47, 5.97s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:08:01,265 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:08:05,457 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:08:01,265 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:08:05,457 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:08:01,265 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.8464, 'learning_rate': 0.00010499999999999999, 'epoch': 0.2} +[WARNING|modeling_utils.py:388] 2022-03-17 15:08:09,661 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:08:01,265 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 20%|████████████████ | 182/892 [17:32<1:08:37, 5.80s/it]g-point operations will not be computed-17 15:08:01,265 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 20%|████████████████ | 182/892 [17:32<1:08:37, 5.80s/it]g-point operations will not be computed-17 15:08:01,265 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:08:13,913 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:08:01,265 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:08:13,913 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:08:01,265 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 21%|████████████████▏ | 183/892 [17:38<1:07:40, 5.73s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:08:18,070 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 21%|████████████████▏ | 183/892 [17:38<1:07:40, 5.73s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:08:18,070 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.8652, 'learning_rate': 0.00010619999999999998, 'epoch': 0.21} + 21%|████████████████▏ | 183/892 [17:38<1:07:40, 5.73s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:08:18,070 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 21%|████████████████▏ | 183/892 [17:38<1:07:40, 5.73s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:08:18,070 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 21%|████████████████▎ | 184/892 [17:43<1:06:35, 5.64s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:08:23,484 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 21%|████████████████▎ | 184/892 [17:43<1:06:35, 5.64s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:08:23,484 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:08:27,436 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:08:23,484 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:08:27,436 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:08:23,484 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.764, 'learning_rate': 0.00010739999999999998, 'epoch': 0.21} +[WARNING|modeling_utils.py:388] 2022-03-17 15:08:31,409 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:08:23,484 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:08:31,409 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:08:23,484 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 21%|████████████████▍ | 186/892 [17:54<1:04:19, 5.47s/it]g-point operations will not be computed-17 15:08:23,484 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:08:35,298 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:08:23,484 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:08:37,803 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:08:23,484 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:08:37,803 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:08:23,484 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.8689, 'learning_rate': 0.00010859999999999998, 'epoch': 0.21} +[WARNING|modeling_utils.py:388] 2022-03-17 15:08:41,706 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:08:23,484 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:08:41,706 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:08:23,484 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 21%|████████████████▋ | 188/892 [18:04<1:01:59, 5.28s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:08:44,211 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 21%|████████████████▋ | 188/892 [18:04<1:01:59, 5.28s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:08:44,211 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:08:47,752 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:08:44,211 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:08:47,752 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:08:44,211 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:08:50,192 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:08:44,211 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:08:52,496 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:08:44,211 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:08:52,496 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:08:44,211 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.7211, 'learning_rate': 0.00011039999999999999, 'epoch': 0.21} +[WARNING|modeling_utils.py:388] 2022-03-17 15:08:55,961 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:08:44,211 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:08:55,961 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:08:44,211 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 21%|█████████████████▎ | 191/892 [18:18<57:03, 4.88s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:08:58,191 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:09:00,261 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:08:58,191 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:09:00,261 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:08:58,191 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 22%|█████████████████▍ | 192/892 [18:23<54:40, 4.69s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:09:02,333 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:09:04,249 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:09:02,333 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:09:04,249 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:09:02,333 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 22%|█████████████████▌ | 193/892 [18:27<51:55, 4.46s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:09:06,189 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 22%|█████████████████▌ | 194/892 [18:30<48:43, 4.19s/it]g-point operations will not be computed-17 15:09:06,189 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 22%|█████████████████▌ | 194/892 [18:30<48:43, 4.19s/it]g-point operations will not be computed-17 15:09:06,189 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 22%|█████████████████▌ | 194/892 [18:30<48:43, 4.19s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:09:09,643 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 22%|█████████████████▋ | 195/892 [18:33<45:27, 3.91s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:09:12,860 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 22%|█████████████████▋ | 195/892 [18:33<45:27, 3.91s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:09:12,860 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 22%|█████████████████▊ | 196/892 [18:36<41:51, 3.61s/it]g-point operations will not be computed-17 15:09:12,860 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 22%|█████████████████▊ | 196/892 [18:36<41:51, 3.61s/it]g-point operations will not be computed-17 15:09:12,860 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:09:16,883 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:09:15,676 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:09:16,883 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:09:15,676 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:09:19,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:09:18,074 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:09:19,125 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:09:18,074 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:09:21,053 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:09:20,163 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:09:21,053 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:09:20,163 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:09:22,817 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:09:22,000 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 22%|██████████████████▏ | 200/892 [18:45<29:42, 2.58s/it]g-point operations will not be computed-17 15:09:22,000 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 22%|██████████████████▏ | 200/892 [18:45<29:42, 2.58s/it]g-point operations will not be computed-17 15:09:22,000 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 22%|██████████████████▏ | 200/892 [18:45<29:42, 2.58s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:09:25,904 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 22%|██████████████████▏ | 200/892 [18:45<29:42, 2.58s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:09:25,904 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 23%|██████████████████▎ | 201/892 [18:53<46:20, 4.02s/it]g-point operations will not be computed-17 15:09:25,904 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 23%|██████████████████▎ | 201/892 [18:53<46:20, 4.02s/it]g-point operations will not be computed-17 15:09:25,904 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 23%|██████████████████▎ | 201/892 [18:53<46:20, 4.02s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:09:33,187 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 23%|██████████████████▎ | 201/892 [18:53<46:20, 4.02s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:09:33,187 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:09:36,720 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:09:33,187 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 23%|██████████████████▎ | 202/892 [19:00<57:04, 4.96s/it]g-point operations will not be computed-17 15:09:33,187 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 23%|██████████████████▎ | 202/892 [19:00<57:04, 4.96s/it]g-point operations will not be computed-17 15:09:33,187 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 23%|██████████████████▎ | 202/892 [19:00<57:04, 4.96s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:09:40,340 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 23%|██████████████████▎ | 202/892 [19:00<57:04, 4.96s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:09:40,340 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + g-point operations will not be computed-17 15:09:40,340 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + g-point operations will not be computed-17 15:09:40,340 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 23%|█████████████████▉ | 203/892 [19:07<1:04:26, 5.61s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:09:47,468 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 23%|█████████████████▉ | 203/892 [19:07<1:04:26, 5.61s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:09:47,468 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 23%|█████████████████▉ | 203/892 [19:07<1:04:26, 5.61s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:09:47,468 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 23%|██████████████████ | 204/892 [19:14<1:08:59, 6.02s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:09:47,468 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 23%|██████████████████ | 204/892 [19:14<1:08:59, 6.02s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:09:47,468 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:09:56,031 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:09:47,468 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:09:56,031 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:09:47,468 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 23%|██████████████████▏ | 205/892 [19:21<1:11:40, 6.26s/it]g-point operations will not be computed-17 15:09:47,468 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 23%|██████████████████▏ | 205/892 [19:21<1:11:40, 6.26s/it]g-point operations will not be computed-17 15:09:47,468 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.8868, 'learning_rate': 0.0001194, 'epoch': 0.23} + 23%|██████████████████▏ | 205/892 [19:21<1:11:40, 6.26s/it]g-point operations will not be computed-17 15:09:47,468 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 23%|██████████████████▏ | 205/892 [19:21<1:11:40, 6.26s/it]g-point operations will not be computed-17 15:09:47,468 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 23%|██████████████████▏ | 205/892 [19:21<1:11:40, 6.26s/it]g-point operations will not be computed-17 15:09:47,468 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 23%|██████████████████▏ | 206/892 [19:28<1:13:55, 6.47s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:10:08,106 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 23%|██████████████████▏ | 206/892 [19:28<1:13:55, 6.47s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:10:08,106 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 23%|██████████████████▏ | 206/892 [19:28<1:13:55, 6.47s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:10:08,106 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 23%|██████████████████▏ | 206/892 [19:28<1:13:55, 6.47s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:10:08,106 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 23%|██████████████████▎ | 207/892 [19:34<1:14:48, 6.55s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:10:08,106 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:10:16,557 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:10:08,106 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:10:16,557 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:10:08,106 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:10:16,557 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:10:08,106 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 23%|██████████████████▍ | 208/892 [19:41<1:15:40, 6.64s/it]g-point operations will not be computed-17 15:10:08,106 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 23%|██████████████████▍ | 208/892 [19:41<1:15:40, 6.64s/it]g-point operations will not be computed-17 15:10:08,106 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 23%|██████████████████▍ | 208/892 [19:41<1:15:40, 6.64s/it]g-point operations will not be computed-17 15:10:08,106 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:10:26,727 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:10:08,106 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:10:26,727 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:10:08,106 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.8493, 'learning_rate': 0.00012179999999999999, 'epoch': 0.23} +[WARNING|modeling_utils.py:388] 2022-03-17 15:10:26,727 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:10:08,106 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:10:26,727 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:10:08,106 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:10:26,727 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:10:08,106 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 24%|██████████████████▌ | 210/892 [19:55<1:16:18, 6.71s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:10:35,269 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 24%|██████████████████▌ | 210/892 [19:55<1:16:18, 6.71s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:10:35,269 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 24%|██████████████████▌ | 210/892 [19:55<1:16:18, 6.71s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:10:35,269 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 24%|██████████████████▌ | 210/892 [19:55<1:16:18, 6.71s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:10:35,269 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 24%|██████████████████▋ | 211/892 [20:02<1:15:57, 6.69s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:10:35,269 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 24%|██████████████████▋ | 211/892 [20:02<1:15:57, 6.69s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:10:35,269 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 24%|██████████████████▋ | 211/892 [20:02<1:15:57, 6.69s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:10:35,269 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:10:46,776 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:10:35,269 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:10:46,776 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:10:35,269 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.8332, 'learning_rate': 0.0001236, 'epoch': 0.24} +[WARNING|modeling_utils.py:388] 2022-03-17 15:10:46,776 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:10:35,269 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:10:53,337 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:10:35,269 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:10:53,337 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:10:35,269 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.7906, 'learning_rate': 0.00012419999999999998, 'epoch': 0.24} +[WARNING|modeling_utils.py:388] 2022-03-17 15:10:53,337 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:10:35,269 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:10:53,337 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:10:35,269 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:10:53,337 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:10:35,269 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 24%|██████████████████▉ | 214/892 [20:21<1:14:33, 6.60s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:11:01,530 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 24%|██████████████████▉ | 214/892 [20:21<1:14:33, 6.60s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:11:01,530 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 24%|██████████████████▉ | 214/892 [20:21<1:14:33, 6.60s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:11:01,530 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 24%|██████████████████▉ | 214/892 [20:21<1:14:33, 6.60s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:11:01,530 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 24%|███████████████████ | 215/892 [20:28<1:13:55, 6.55s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:11:07,932 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 24%|███████████████████ | 215/892 [20:28<1:13:55, 6.55s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:11:07,932 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 24%|███████████████████ | 215/892 [20:28<1:13:55, 6.55s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:11:07,932 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 24%|███████████████████▏ | 216/892 [20:34<1:13:26, 6.52s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:11:07,932 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 24%|███████████████████▏ | 216/892 [20:34<1:13:26, 6.52s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:11:07,932 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:11:15,965 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:11:07,932 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:11:15,965 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:11:07,932 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 24%|███████████████████▏ | 217/892 [20:40<1:12:56, 6.48s/it]g-point operations will not be computed-17 15:11:07,932 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 24%|███████████████████▏ | 217/892 [20:40<1:12:56, 6.48s/it]g-point operations will not be computed-17 15:11:07,932 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:11:22,340 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:11:07,932 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:11:22,340 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:11:07,932 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 24%|███████████████████▎ | 218/892 [20:47<1:12:21, 6.44s/it]g-point operations will not be computed-17 15:11:07,932 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 24%|███████████████████▎ | 218/892 [20:47<1:12:21, 6.44s/it]g-point operations will not be computed-17 15:11:07,932 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:11:28,639 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:11:07,932 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:11:31,749 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:11:07,932 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:11:31,749 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:11:07,932 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.7483, 'learning_rate': 0.0001278, 'epoch': 0.25} +[WARNING|modeling_utils.py:388] 2022-03-17 15:11:36,545 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:11:07,932 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:11:36,545 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:11:07,932 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 25%|███████████████████▍ | 220/892 [21:00<1:13:55, 6.60s/it]g-point operations will not be computed-17 15:11:07,932 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 25%|███████████████████▍ | 220/892 [21:00<1:13:55, 6.60s/it]g-point operations will not be computed-17 15:11:07,932 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:11:44,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:11:07,932 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 25%|███████████████████▌ | 221/892 [21:07<1:15:41, 6.77s/it]g-point operations will not be computed-17 15:11:07,932 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 25%|███████████████████▌ | 221/892 [21:07<1:15:41, 6.77s/it]g-point operations will not be computed-17 15:11:07,932 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.7291, 'learning_rate': 0.000129, 'epoch': 0.25} +[WARNING|modeling_utils.py:388] 2022-03-17 15:11:50,758 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:11:07,932 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 25%|███████████████████▋ | 222/892 [21:14<1:14:05, 6.63s/it]g-point operations will not be computed-17 15:11:07,932 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 25%|███████████████████▋ | 222/892 [21:14<1:14:05, 6.63s/it]g-point operations will not be computed-17 15:11:07,932 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.9811, 'learning_rate': 0.00012959999999999998, 'epoch': 0.25} +[WARNING|modeling_utils.py:388] 2022-03-17 15:11:56,993 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:11:07,932 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 25%|███████████████████▊ | 223/892 [21:20<1:12:30, 6.50s/it]g-point operations will not be computed-17 15:11:07,932 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 25%|███████████████████▊ | 223/892 [21:20<1:12:30, 6.50s/it]g-point operations will not be computed-17 15:11:07,932 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:12:01,570 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:11:07,932 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:12:01,570 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:11:07,932 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 25%|███████████████████▊ | 224/892 [21:26<1:10:58, 6.37s/it]g-point operations will not be computed-17 15:11:07,932 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 25%|███████████████████▊ | 224/892 [21:26<1:10:58, 6.37s/it]g-point operations will not be computed-17 15:11:07,932 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.9872, 'learning_rate': 0.00013079999999999998, 'epoch': 0.25} +[WARNING|modeling_utils.py:388] 2022-03-17 15:12:09,105 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:11:07,932 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:12:09,105 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:11:07,932 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 25%|███████████████████▉ | 225/892 [21:33<1:12:50, 6.55s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:12:13,198 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 25%|███████████████████▉ | 225/892 [21:33<1:12:50, 6.55s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:12:13,198 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:12:17,665 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:12:13,198 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:12:17,665 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:12:13,198 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.1846, 'learning_rate': 0.00013199999999999998, 'epoch': 0.25} +[WARNING|modeling_utils.py:388] 2022-03-17 15:12:17,665 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:12:13,198 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:12:23,609 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:12:13,198 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:12:23,609 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:12:13,198 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.7989, 'learning_rate': 0.0001326, 'epoch': 0.25} +[WARNING|modeling_utils.py:388] 2022-03-17 15:12:23,609 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:12:13,198 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:12:23,609 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:12:13,198 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:12:29,559 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:12:13,198 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.8591, 'learning_rate': 0.00013319999999999999, 'epoch': 0.26} +[WARNING|modeling_utils.py:388] 2022-03-17 15:12:33,960 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:12:13,198 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 26%|████████████████████▎ | 229/892 [21:57<1:07:07, 6.07s/it]g-point operations will not be computed-17 15:12:13,198 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 26%|████████████████████▎ | 229/892 [21:57<1:07:07, 6.07s/it]g-point operations will not be computed-17 15:12:13,198 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.8231, 'learning_rate': 0.0001338, 'epoch': 0.26} +[WARNING|modeling_utils.py:388] 2022-03-17 15:12:39,849 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:12:13,198 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 26%|████████████████████▎ | 230/892 [22:03<1:06:26, 6.02s/it]g-point operations will not be computed-17 15:12:13,198 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 26%|████████████████████▎ | 230/892 [22:03<1:06:26, 6.02s/it]g-point operations will not be computed-17 15:12:13,198 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.8881, 'learning_rate': 0.0001344, 'epoch': 0.26} +[WARNING|modeling_utils.py:388] 2022-03-17 15:12:45,622 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:12:13,198 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 26%|████████████████████▍ | 231/892 [22:08<1:05:25, 5.94s/it]g-point operations will not be computed-17 15:12:13,198 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 26%|████████████████████▍ | 231/892 [22:08<1:05:25, 5.94s/it]g-point operations will not be computed-17 15:12:13,198 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:12:49,910 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:12:13,198 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:12:49,910 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:12:13,198 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 26%|████████████████████▌ | 232/892 [22:14<1:04:26, 5.86s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:12:54,156 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 26%|████████████████████▌ | 232/892 [22:14<1:04:26, 5.86s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:12:54,156 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.9219, 'learning_rate': 0.0001356, 'epoch': 0.26} +[WARNING|modeling_utils.py:388] 2022-03-17 15:12:58,273 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:12:54,156 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:12:58,273 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:12:54,156 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.7862, 'learning_rate': 0.0001362, 'epoch': 0.26} +[WARNING|modeling_utils.py:388] 2022-03-17 15:13:02,342 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:12:54,156 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 26%|████████████████████▋ | 234/892 [22:25<1:02:08, 5.67s/it]g-point operations will not be computed-17 15:12:54,156 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 26%|████████████████████▋ | 234/892 [22:25<1:02:08, 5.67s/it]g-point operations will not be computed-17 15:12:54,156 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:13:06,422 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:12:54,156 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:13:06,422 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:12:54,156 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 26%|████████████████████▊ | 235/892 [22:30<1:00:56, 5.57s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:13:10,415 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 26%|████████████████████▊ | 235/892 [22:30<1:00:56, 5.57s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:13:10,415 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.9955, 'learning_rate': 0.0001374, 'epoch': 0.26} +[WARNING|modeling_utils.py:388] 2022-03-17 15:13:14,300 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:13:10,415 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:13:14,300 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:13:10,415 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.8297, 'learning_rate': 0.000138, 'epoch': 0.26} +[WARNING|modeling_utils.py:388] 2022-03-17 15:13:18,188 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:13:10,415 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 27%|█████████████████████▌ | 237/892 [22:41<58:45, 5.38s/it]g-point operations will not be computed-17 15:13:10,415 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 27%|█████████████████████▌ | 237/892 [22:41<58:45, 5.38s/it]g-point operations will not be computed-17 15:13:10,415 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:13:22,031 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:13:10,415 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:13:24,491 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:13:10,415 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:13:24,491 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:13:10,415 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.0285, 'learning_rate': 0.0001392, 'epoch': 0.27} +[WARNING|modeling_utils.py:388] 2022-03-17 15:13:28,159 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:13:10,415 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 27%|█████████████████████▋ | 239/892 [22:51<56:03, 5.15s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:13:30,629 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 27%|█████████████████████▋ | 239/892 [22:51<56:03, 5.15s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:13:30,629 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.7294, 'learning_rate': 0.00013979999999999998, 'epoch': 0.27} +[WARNING|modeling_utils.py:388] 2022-03-17 15:13:34,067 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:13:30,629 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:13:34,067 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:13:30,629 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:13:36,377 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:13:30,629 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:13:38,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:13:30,629 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:13:38,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:13:30,629 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:13:40,664 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:13:30,629 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:13:42,617 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:13:30,629 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:13:42,617 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:13:30,629 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:13:44,570 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:13:30,629 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:13:46,354 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:13:30,629 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:13:46,354 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:13:30,629 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:13:48,137 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:13:30,629 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:13:49,790 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:13:30,629 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:13:49,790 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:13:30,629 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:13:51,510 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:13:30,629 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:13:51,510 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:13:30,629 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:13:54,533 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:13:30,629 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:13:55,861 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:13:30,629 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:13:55,861 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:13:30,629 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:13:58,370 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:13:30,629 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:13:58,370 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:13:30,629 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:14:00,569 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:13:30,629 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:14:00,569 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:13:30,629 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:14:02,494 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:13:30,629 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:14:02,494 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:13:30,629 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:14:03,415 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:13:30,629 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:14:03,415 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:13:30,629 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:14:05,050 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:13:30,629 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:14:08,853 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:13:30,629 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:14:08,853 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:13:30,629 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:14:12,454 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:13:30,629 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:14:12,454 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:13:30,629 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.0484, 'learning_rate': 0.000147, 'epoch': 0.28} +[WARNING|modeling_utils.py:388] 2022-03-17 15:14:16,039 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:13:30,629 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:14:19,502 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:13:30,629 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:14:19,502 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:13:30,629 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.6329, 'learning_rate': 0.00014759999999999998, 'epoch': 0.28} +[WARNING|modeling_utils.py:388] 2022-03-17 15:14:23,043 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:13:30,629 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:14:23,043 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:13:30,629 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:14:26,483 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:13:30,629 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:14:26,483 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:13:30,629 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.3109, 'learning_rate': 0.0001482, 'epoch': 0.28} +[WARNING|modeling_utils.py:388] 2022-03-17 15:14:26,483 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:13:30,629 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:14:33,419 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:13:30,629 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:14:33,419 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:13:30,629 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.2561, 'learning_rate': 0.00014879999999999998, 'epoch': 0.28} +[WARNING|modeling_utils.py:388] 2022-03-17 15:14:33,419 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:13:30,629 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:14:33,419 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:13:30,629 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 29%|██████████████████████▌ | 255/892 [24:02<1:06:27, 6.26s/it]g-point operations will not be computed-17 15:13:30,629 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 29%|██████████████████████▌ | 255/892 [24:02<1:06:27, 6.26s/it]g-point operations will not be computed-17 15:13:30,629 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:14:43,849 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:13:30,629 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:14:43,849 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:13:30,629 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 29%|██████████████████████▋ | 256/892 [24:09<1:08:19, 6.45s/it]g-point operations will not be computed-17 15:13:30,629 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 29%|██████████████████████▋ | 256/892 [24:09<1:08:19, 6.45s/it]g-point operations will not be computed-17 15:13:30,629 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.9713, 'learning_rate': 0.00015, 'epoch': 0.29} +[WARNING|modeling_utils.py:388] 2022-03-17 15:14:52,331 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:13:30,629 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 29%|██████████████████████▊ | 257/892 [24:15<1:09:16, 6.55s/it]g-point operations will not be computed-17 15:13:30,629 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 29%|██████████████████████▊ | 257/892 [24:15<1:09:16, 6.55s/it]g-point operations will not be computed-17 15:13:30,629 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.9373, 'learning_rate': 0.00015059999999999997, 'epoch': 0.29} + 29%|██████████████████████▊ | 257/892 [24:15<1:09:16, 6.55s/it]g-point operations will not be computed-17 15:13:30,629 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 29%|██████████████████████▊ | 257/892 [24:15<1:09:16, 6.55s/it]g-point operations will not be computed-17 15:13:30,629 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 29%|██████████████████████▊ | 258/892 [24:22<1:10:01, 6.63s/it]g-point operations will not be computed-17 15:13:30,629 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 29%|██████████████████████▊ | 258/892 [24:22<1:10:01, 6.63s/it]g-point operations will not be computed-17 15:13:30,629 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:15:04,242 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:13:30,629 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:15:04,242 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:13:30,629 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 29%|██████████████████████▉ | 259/892 [24:29<1:10:23, 6.67s/it]g-point operations will not be computed-17 15:13:30,629 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 29%|██████████████████████▉ | 259/892 [24:29<1:10:23, 6.67s/it]g-point operations will not be computed-17 15:13:30,629 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.8621, 'learning_rate': 0.00015179999999999998, 'epoch': 0.29} +[WARNING|modeling_utils.py:388] 2022-03-17 15:15:12,630 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:13:30,629 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:15:12,630 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:13:30,629 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 29%|███████████████████████ | 260/892 [24:36<1:10:17, 6.67s/it]g-point operations will not be computed-17 15:13:30,629 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 29%|███████████████████████ | 260/892 [24:36<1:10:17, 6.67s/it]g-point operations will not be computed-17 15:13:30,629 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 29%|███████████████████████ | 260/892 [24:36<1:10:17, 6.67s/it]g-point operations will not be computed-17 15:13:30,629 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:15:20,887 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:13:30,629 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:15:20,887 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:13:30,629 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.937, 'learning_rate': 0.00015299999999999998, 'epoch': 0.29} +[WARNING|modeling_utils.py:388] 2022-03-17 15:15:20,887 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:13:30,629 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:15:27,438 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:13:30,629 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:15:27,438 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:13:30,629 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.6815, 'learning_rate': 0.0001536, 'epoch': 0.29} +[WARNING|modeling_utils.py:388] 2022-03-17 15:15:27,438 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:13:30,629 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:15:27,438 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:13:30,629 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:15:27,438 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:13:30,629 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 29%|███████████████████████▎ | 263/892 [24:55<1:09:16, 6.61s/it]g-point operations will not be computed-17 15:13:30,629 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:15:37,350 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:13:30,629 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:15:37,350 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:13:30,629 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:15:37,350 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:13:30,629 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 30%|███████████████████████▍ | 264/892 [25:02<1:09:05, 6.60s/it]g-point operations will not be computed-17 15:13:30,629 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:15:43,875 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:13:30,629 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:15:43,875 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:13:30,629 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:15:43,875 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:13:30,629 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 30%|███████████████████████▍ | 265/892 [25:08<1:08:29, 6.55s/it]g-point operations will not be computed-17 15:13:30,629 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 30%|███████████████████████▍ | 265/892 [25:08<1:08:29, 6.55s/it]g-point operations will not be computed-17 15:13:30,629 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:15:51,925 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:13:30,629 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 30%|███████████████████████▌ | 266/892 [25:15<1:08:09, 6.53s/it]g-point operations will not be computed-17 15:13:30,629 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 30%|███████████████████████▌ | 266/892 [25:15<1:08:09, 6.53s/it]g-point operations will not be computed-17 15:13:30,629 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.9109, 'learning_rate': 0.000156, 'epoch': 0.3} +[WARNING|modeling_utils.py:388] 2022-03-17 15:15:58,354 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:13:30,629 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 30%|███████████████████████▋ | 267/892 [25:21<1:07:40, 6.50s/it]g-point operations will not be computed-17 15:13:30,629 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 30%|███████████████████████▋ | 267/892 [25:21<1:07:40, 6.50s/it]g-point operations will not be computed-17 15:13:30,629 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.7336, 'learning_rate': 0.00015659999999999998, 'epoch': 0.3} + 30%|███████████████████████▋ | 267/892 [25:21<1:07:40, 6.50s/it]g-point operations will not be computed-17 15:13:30,629 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:16:06,379 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:13:30,629 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:16:06,379 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:13:30,629 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.9493, 'learning_rate': 0.0001572, 'epoch': 0.3} +[WARNING|modeling_utils.py:388] 2022-03-17 15:16:06,379 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:13:30,629 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:16:06,379 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:13:30,629 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:16:06,379 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:13:30,629 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 30%|███████████████████████▊ | 269/892 [25:34<1:07:02, 6.46s/it]g-point operations will not be computed-17 15:13:30,629 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:16:16,037 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:13:30,629 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:16:16,037 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:13:30,629 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:16:16,037 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:13:30,629 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 30%|███████████████████████▉ | 270/892 [25:41<1:06:43, 6.44s/it]g-point operations will not be computed-17 15:13:30,629 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:16:22,368 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:13:30,629 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:16:22,368 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:13:30,629 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:16:22,368 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:13:30,629 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 30%|████████████████████████ | 271/892 [25:47<1:06:05, 6.39s/it]g-point operations will not be computed-17 15:13:30,629 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:16:28,605 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:13:30,629 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:16:28,605 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:13:30,629 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:16:28,605 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:13:30,629 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 30%|████████████████████████ | 272/892 [25:53<1:05:30, 6.34s/it]g-point operations will not be computed-17 15:13:30,629 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:16:34,816 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:13:30,629 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:16:34,816 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:13:30,629 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:16:34,816 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:13:30,629 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 31%|████████████████████████▏ | 273/892 [25:59<1:04:49, 6.28s/it]g-point operations will not be computed-17 15:13:30,629 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:16:40,981 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:13:30,629 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:16:40,981 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:13:30,629 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:16:40,981 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:13:30,629 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 31%|████████████████████████▎ | 274/892 [26:05<1:04:31, 6.26s/it]g-point operations will not be computed-17 15:13:30,629 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:16:47,141 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:13:30,629 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:16:47,141 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:13:30,629 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 31%|████████████████████████▎ | 275/892 [26:12<1:06:46, 6.49s/it]g-point operations will not be computed-17 15:13:30,629 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 31%|████████████████████████▎ | 275/892 [26:12<1:06:46, 6.49s/it]g-point operations will not be computed-17 15:13:30,629 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.8323, 'learning_rate': 0.0001614, 'epoch': 0.31} + 31%|████████████████████████▎ | 275/892 [26:12<1:06:46, 6.49s/it]g-point operations will not be computed-17 15:13:30,629 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:16:57,165 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:13:30,629 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:16:57,165 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:13:30,629 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.8204, 'learning_rate': 0.000162, 'epoch': 0.31} +[WARNING|modeling_utils.py:388] 2022-03-17 15:16:57,165 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:13:30,629 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:17:03,105 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:13:30,629 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:17:03,105 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:13:30,629 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.8373, 'learning_rate': 0.0001626, 'epoch': 0.31} +[WARNING|modeling_utils.py:388] 2022-03-17 15:17:07,587 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:13:30,629 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 31%|████████████████████████▌ | 278/892 [26:30<1:02:58, 6.15s/it]g-point operations will not be computed-17 15:13:30,629 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 31%|████████████████████████▌ | 278/892 [26:30<1:02:58, 6.15s/it]g-point operations will not be computed-17 15:13:30,629 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.7286, 'learning_rate': 0.0001632, 'epoch': 0.31} +[WARNING|modeling_utils.py:388] 2022-03-17 15:17:13,539 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:13:30,629 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 31%|████████████████████████▋ | 279/892 [26:36<1:02:18, 6.10s/it]g-point operations will not be computed-17 15:13:30,629 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 31%|████████████████████████▋ | 279/892 [26:36<1:02:18, 6.10s/it]g-point operations will not be computed-17 15:13:30,629 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.7064, 'learning_rate': 0.0001638, 'epoch': 0.31} +[WARNING|modeling_utils.py:388] 2022-03-17 15:17:19,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:13:30,629 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 31%|████████████████████████▊ | 280/892 [26:42<1:01:25, 6.02s/it]g-point operations will not be computed-17 15:13:30,629 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 31%|████████████████████████▊ | 280/892 [26:42<1:01:25, 6.02s/it]g-point operations will not be computed-17 15:13:30,629 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:17:23,805 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:13:30,629 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:17:23,805 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:13:30,629 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:17:23,805 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:13:30,629 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 32%|████████████████████████▉ | 281/892 [26:48<1:00:40, 5.96s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:17:28,162 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 32%|████████████████████████▉ | 281/892 [26:48<1:00:40, 5.96s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:17:28,162 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:17:32,304 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:17:28,162 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:17:32,304 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:17:28,162 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.8, 'learning_rate': 0.0001656, 'epoch': 0.32} +[WARNING|modeling_utils.py:388] 2022-03-17 15:17:32,304 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:17:28,162 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:17:37,832 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:17:28,162 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:17:37,832 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:17:28,162 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.5438, 'learning_rate': 0.0001662, 'epoch': 0.32} +[WARNING|modeling_utils.py:388] 2022-03-17 15:17:41,892 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:17:28,162 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 32%|█████████████████████████▊ | 284/892 [27:05<57:13, 5.65s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:17:44,599 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 32%|█████████████████████████▊ | 284/892 [27:05<57:13, 5.65s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:17:44,599 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.8274, 'learning_rate': 0.0001668, 'epoch': 0.32} +[WARNING|modeling_utils.py:388] 2022-03-17 15:17:48,525 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:17:44,599 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:17:48,525 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:17:44,599 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.8702, 'learning_rate': 0.0001674, 'epoch': 0.32} +[WARNING|modeling_utils.py:388] 2022-03-17 15:17:52,479 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:17:44,599 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 32%|█████████████████████████▉ | 286/892 [27:15<55:00, 5.45s/it]g-point operations will not be computed-17 15:17:44,599 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 32%|█████████████████████████▉ | 286/892 [27:15<55:00, 5.45s/it]g-point operations will not be computed-17 15:17:44,599 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:17:56,331 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:17:44,599 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:17:58,807 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:17:44,599 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:17:58,807 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:17:44,599 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.8917, 'learning_rate': 0.0001686, 'epoch': 0.32} +[WARNING|modeling_utils.py:388] 2022-03-17 15:18:02,585 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:17:44,599 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 32%|██████████████████████████▏ | 288/892 [27:25<52:28, 5.21s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:18:04,993 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 32%|██████████████████████████▏ | 288/892 [27:25<52:28, 5.21s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:18:04,993 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.9552, 'learning_rate': 0.00016919999999999997, 'epoch': 0.32} +[WARNING|modeling_utils.py:388] 2022-03-17 15:18:08,474 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:18:04,993 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:18:08,474 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:18:04,993 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:18:10,797 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:18:04,993 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:18:12,991 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:18:04,993 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:18:12,991 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:18:04,993 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.8569, 'learning_rate': 0.00017039999999999997, 'epoch': 0.33} +[WARNING|modeling_utils.py:388] 2022-03-17 15:18:16,232 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:18:04,993 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:18:16,232 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:18:04,993 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 33%|██████████████████████████▍ | 291/892 [27:39<47:11, 4.71s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:18:18,350 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 33%|██████████████████████████▌ | 292/892 [27:43<44:59, 4.50s/it]g-point operations will not be computed-17 15:18:18,350 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 33%|██████████████████████████▌ | 292/892 [27:43<44:59, 4.50s/it]g-point operations will not be computed-17 15:18:18,350 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 33%|██████████████████████████▌ | 292/892 [27:43<44:59, 4.50s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:18:22,266 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 33%|██████████████████████████▌ | 292/892 [27:43<44:59, 4.50s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:18:22,266 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 33%|██████████████████████████▌ | 293/892 [27:46<42:36, 4.27s/it]g-point operations will not be computed-17 15:18:22,266 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 33%|██████████████████████████▌ | 293/892 [27:46<42:36, 4.27s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:18:25,952 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 33%|██████████████████████████▌ | 293/892 [27:46<42:36, 4.27s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:18:25,952 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 33%|██████████████████████████▋ | 294/892 [27:50<40:00, 4.01s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:18:29,281 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 33%|██████████████████████████▋ | 294/892 [27:50<40:00, 4.01s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:18:29,281 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:18:30,815 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:18:29,281 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 33%|██████████████████████████▊ | 295/892 [27:53<37:18, 3.75s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:18:32,321 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 33%|██████████████████████████▊ | 295/892 [27:53<37:18, 3.75s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:18:32,321 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 33%|██████████████████████████▉ | 296/892 [27:56<34:10, 3.44s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:18:34,955 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 33%|██████████████████████████▉ | 296/892 [27:56<34:10, 3.44s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:18:34,955 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 33%|██████████████████████████▉ | 297/892 [27:58<31:01, 3.13s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:18:37,279 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 33%|███████████████████████████ | 298/892 [28:00<28:01, 2.83s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:18:39,340 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 33%|███████████████████████████ | 298/892 [28:00<28:01, 2.83s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:18:39,340 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.6715, 'learning_rate': 0.00017519999999999998, 'epoch': 0.33} + 34%|███████████████████████████▏ | 299/892 [28:02<25:04, 2.54s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:18:41,137 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 34%|███████████████████████████▏ | 300/892 [28:05<24:57, 2.53s/it]g-point operations will not be computed-17 15:18:41,137 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 34%|███████████████████████████▏ | 300/892 [28:05<24:57, 2.53s/it]g-point operations will not be computed-17 15:18:41,137 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 34%|███████████████████████████▏ | 300/892 [28:05<24:57, 2.53s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:18:45,119 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 34%|███████████████████████████▏ | 300/892 [28:05<24:57, 2.53s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:18:45,119 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:18:48,799 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:18:45,119 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 34%|███████████████████████████▎ | 301/892 [28:12<39:27, 4.01s/it]g-point operations will not be computed-17 15:18:45,119 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 34%|███████████████████████████▎ | 301/892 [28:12<39:27, 4.01s/it]g-point operations will not be computed-17 15:18:45,119 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 34%|███████████████████████████▎ | 301/892 [28:12<39:27, 4.01s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:18:52,465 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 34%|███████████████████████████▎ | 301/892 [28:12<39:27, 4.01s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:18:52,465 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 34%|███████████████████████████▍ | 302/892 [28:19<48:30, 4.93s/it]g-point operations will not be computed-17 15:18:52,465 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 34%|███████████████████████████▍ | 302/892 [28:19<48:30, 4.93s/it]g-point operations will not be computed-17 15:18:52,465 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 34%|███████████████████████████▍ | 302/892 [28:19<48:30, 4.93s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:18:59,555 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 34%|███████████████████████████▍ | 302/892 [28:19<48:30, 4.93s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:18:59,555 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:19:03,057 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:18:59,555 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:19:03,057 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:18:59,555 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 34%|███████████████████████████▌ | 303/892 [28:26<54:47, 5.58s/it]g-point operations will not be computed-17 15:18:59,555 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 34%|███████████████████████████▌ | 303/892 [28:26<54:47, 5.58s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:19:06,655 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:19:10,127 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:19:06,655 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:19:10,127 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:19:06,655 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 34%|███████████████████████████▌ | 304/892 [28:33<58:59, 6.02s/it]g-point operations will not be computed-17 15:19:06,655 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 34%|███████████████████████████▌ | 304/892 [28:33<58:59, 6.02s/it]g-point operations will not be computed-17 15:19:06,655 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 34%|███████████████████████████▌ | 304/892 [28:33<58:59, 6.02s/it]g-point operations will not be computed-17 15:19:06,655 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 34%|███████████████████████████▌ | 304/892 [28:33<58:59, 6.02s/it]g-point operations will not be computed-17 15:19:06,655 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 34%|███████████████████████████▌ | 304/892 [28:33<58:59, 6.02s/it]g-point operations will not be computed-17 15:19:06,655 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 34%|███████████████████████████ | 305/892 [28:40<1:01:22, 6.27s/it]g-point operations will not be computed-17 15:19:06,655 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:19:22,162 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:19:06,655 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:19:22,162 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:19:06,655 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:19:22,162 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:19:06,655 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 34%|███████████████████████████ | 306/892 [28:47<1:02:50, 6.43s/it]g-point operations will not be computed-17 15:19:06,655 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 34%|███████████████████████████ | 306/892 [28:47<1:02:50, 6.43s/it]g-point operations will not be computed-17 15:19:06,655 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:19:30,586 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:19:06,655 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 34%|███████████████████████████▏ | 307/892 [28:54<1:03:40, 6.53s/it]g-point operations will not be computed-17 15:19:06,655 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 34%|███████████████████████████▏ | 307/892 [28:54<1:03:40, 6.53s/it]g-point operations will not be computed-17 15:19:06,655 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.0468, 'learning_rate': 0.00018059999999999997, 'epoch': 0.34} + 34%|███████████████████████████▏ | 307/892 [28:54<1:03:40, 6.53s/it]g-point operations will not be computed-17 15:19:06,655 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 34%|███████████████████████████▏ | 307/892 [28:54<1:03:40, 6.53s/it]g-point operations will not be computed-17 15:19:06,655 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 34%|███████████████████████████▏ | 307/892 [28:54<1:03:40, 6.53s/it]g-point operations will not be computed-17 15:19:06,655 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 35%|███████████████████████████▎ | 308/892 [29:00<1:04:17, 6.60s/it]g-point operations will not be computed-17 15:19:06,655 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:19:42,446 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:19:06,655 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:19:42,446 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:19:06,655 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:19:42,446 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:19:06,655 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 35%|███████████████████████████▎ | 309/892 [29:07<1:04:21, 6.62s/it]g-point operations will not be computed-17 15:19:06,655 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 35%|███████████████████████████▎ | 309/892 [29:07<1:04:21, 6.62s/it]g-point operations will not be computed-17 15:19:06,655 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:19:50,788 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:19:06,655 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 35%|███████████████████████████▍ | 310/892 [29:14<1:04:35, 6.66s/it]g-point operations will not be computed-17 15:19:06,655 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 35%|███████████████████████████▍ | 310/892 [29:14<1:04:35, 6.66s/it]g-point operations will not be computed-17 15:19:06,655 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.9634, 'learning_rate': 0.0001824, 'epoch': 0.35} + 35%|███████████████████████████▍ | 310/892 [29:14<1:04:35, 6.66s/it]g-point operations will not be computed-17 15:19:06,655 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:19:59,034 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:19:06,655 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:19:59,034 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:19:06,655 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.0115, 'learning_rate': 0.00018299999999999998, 'epoch': 0.35} +[WARNING|modeling_utils.py:388] 2022-03-17 15:19:59,034 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:19:06,655 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:19:59,034 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:19:06,655 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:19:59,034 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:19:06,655 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 35%|███████████████████████████▋ | 312/892 [29:27<1:04:01, 6.62s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:20:07,339 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 35%|███████████████████████████▋ | 312/892 [29:27<1:04:01, 6.62s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:20:07,339 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 35%|███████████████████████████▋ | 312/892 [29:27<1:04:01, 6.62s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:20:07,339 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 35%|███████████████████████████▋ | 312/892 [29:27<1:04:01, 6.62s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:20:07,339 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 35%|███████████████████████████▋ | 313/892 [29:33<1:03:27, 6.58s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:20:07,339 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:20:15,414 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:20:07,339 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:20:15,414 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:20:07,339 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:20:15,414 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:20:07,339 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 35%|███████████████████████████▊ | 314/892 [29:40<1:03:12, 6.56s/it]g-point operations will not be computed-17 15:20:07,339 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:20:21,850 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:20:07,339 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:20:21,850 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:20:07,339 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:20:21,850 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:20:07,339 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 35%|███████████████████████████▉ | 315/892 [29:46<1:02:37, 6.51s/it]g-point operations will not be computed-17 15:20:07,339 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 35%|███████████████████████████▉ | 315/892 [29:46<1:02:37, 6.51s/it]g-point operations will not be computed-17 15:20:07,339 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:20:29,865 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:20:07,339 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 35%|███████████████████████████▉ | 316/892 [29:53<1:02:18, 6.49s/it]g-point operations will not be computed-17 15:20:07,339 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 35%|███████████████████████████▉ | 316/892 [29:53<1:02:18, 6.49s/it]g-point operations will not be computed-17 15:20:07,339 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.8409, 'learning_rate': 0.000186, 'epoch': 0.35} + 35%|███████████████████████████▉ | 316/892 [29:53<1:02:18, 6.49s/it]g-point operations will not be computed-17 15:20:07,339 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:20:37,850 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:20:07,339 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:20:37,850 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:20:07,339 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.7218, 'learning_rate': 0.00018659999999999998, 'epoch': 0.36} +[WARNING|modeling_utils.py:388] 2022-03-17 15:20:37,850 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:20:07,339 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:20:44,269 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:20:07,339 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:20:44,269 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:20:07,339 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.7217, 'learning_rate': 0.0001872, 'epoch': 0.36} +[WARNING|modeling_utils.py:388] 2022-03-17 15:20:44,269 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:20:07,339 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:20:50,625 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:20:07,339 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:20:50,625 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:20:07,339 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.7875, 'learning_rate': 0.00018779999999999998, 'epoch': 0.36} +[WARNING|modeling_utils.py:388] 2022-03-17 15:20:50,625 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:20:07,339 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:20:56,924 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:20:07,339 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:20:56,924 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:20:07,339 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.6982, 'learning_rate': 0.00018839999999999997, 'epoch': 0.36} +[WARNING|modeling_utils.py:388] 2022-03-17 15:20:56,924 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:20:07,339 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:21:03,170 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:20:07,339 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:21:03,170 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:20:07,339 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.7792, 'learning_rate': 0.00018899999999999999, 'epoch': 0.36} +[WARNING|modeling_utils.py:388] 2022-03-17 15:21:03,170 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:20:07,339 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:21:03,170 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:20:07,339 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:21:03,170 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:20:07,339 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 36%|█████████████████████████████▏ | 322/892 [30:31<59:53, 6.30s/it]g-point operations will not be computed-17 15:20:07,339 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:21:12,520 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:20:07,339 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:21:12,520 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:20:07,339 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 36%|█████████████████████████████▎ | 323/892 [30:37<59:23, 6.26s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:21:17,161 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 36%|█████████████████████████████▎ | 323/892 [30:37<59:23, 6.26s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:21:17,161 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.7345, 'learning_rate': 0.0001902, 'epoch': 0.36} + 36%|█████████████████████████████▎ | 323/892 [30:37<59:23, 6.26s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:21:17,161 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 36%|█████████████████████████████▎ | 323/892 [30:37<59:23, 6.26s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:21:17,161 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 36%|█████████████████████████████▍ | 324/892 [30:43<59:04, 6.24s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:21:23,339 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 36%|█████████████████████████████▍ | 324/892 [30:43<59:04, 6.24s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:21:23,339 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 36%|█████████████████████████████▍ | 324/892 [30:43<59:04, 6.24s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:21:23,339 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 36%|████████████████████████████▊ | 325/892 [30:50<1:01:19, 6.49s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:21:23,339 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 36%|████████████████████████████▊ | 325/892 [30:50<1:01:19, 6.49s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:21:23,339 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.8808, 'learning_rate': 0.0001914, 'epoch': 0.36} +[WARNING|modeling_utils.py:388] 2022-03-17 15:21:33,413 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:21:23,339 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 37%|████████████████████████████▊ | 326/892 [30:56<1:00:03, 6.37s/it]g-point operations will not be computed-17 15:21:23,339 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 37%|████████████████████████████▊ | 326/892 [30:56<1:00:03, 6.37s/it]g-point operations will not be computed-17 15:21:23,339 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.8451, 'learning_rate': 0.00019199999999999998, 'epoch': 0.37} +[WARNING|modeling_utils.py:388] 2022-03-17 15:21:39,425 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:21:23,339 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 37%|█████████████████████████████▋ | 327/892 [31:02<58:57, 6.26s/it]g-point operations will not be computed-17 15:21:23,339 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 37%|█████████████████████████████▋ | 327/892 [31:02<58:57, 6.26s/it]g-point operations will not be computed-17 15:21:23,339 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.6829, 'learning_rate': 0.0001926, 'epoch': 0.37} +[WARNING|modeling_utils.py:388] 2022-03-17 15:21:45,380 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:21:23,339 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 37%|█████████████████████████████▊ | 328/892 [31:08<57:58, 6.17s/it]g-point operations will not be computed-17 15:21:23,339 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 37%|█████████████████████████████▊ | 328/892 [31:08<57:58, 6.17s/it]g-point operations will not be computed-17 15:21:23,339 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:21:49,811 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:21:23,339 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:21:49,811 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:21:23,339 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 37%|█████████████████████████████▉ | 329/892 [31:14<56:59, 6.07s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:21:54,225 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 37%|█████████████████████████████▉ | 329/892 [31:14<56:59, 6.07s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:21:54,225 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.9283, 'learning_rate': 0.0001938, 'epoch': 0.37} + 37%|█████████████████████████████▉ | 329/892 [31:14<56:59, 6.07s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:21:54,225 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 37%|█████████████████████████████▉ | 330/892 [31:20<56:14, 6.00s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:21:54,225 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 37%|█████████████████████████████▉ | 330/892 [31:20<56:14, 6.00s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:21:54,225 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:22:01,458 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:21:54,225 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:22:01,458 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:21:54,225 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:22:01,458 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:21:54,225 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 37%|██████████████████████████████ | 331/892 [31:26<55:28, 5.93s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:22:05,824 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 37%|██████████████████████████████ | 331/892 [31:26<55:28, 5.93s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:22:05,824 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 37%|██████████████████████████████ | 331/892 [31:26<55:28, 5.93s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:22:05,824 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:22:10,024 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:22:05,824 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:22:10,024 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:22:05,824 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:22:14,256 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:22:05,824 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:22:14,256 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:22:05,824 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 37%|██████████████████████████████▏ | 333/892 [31:37<53:59, 5.80s/it]g-point operations will not be computed-17 15:22:05,824 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:22:18,452 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:22:05,824 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:22:18,452 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:22:05,824 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:22:18,452 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:22:05,824 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 37%|██████████████████████████████▎ | 334/892 [31:42<52:57, 5.70s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:22:22,505 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 37%|██████████████████████████████▎ | 334/892 [31:42<52:57, 5.70s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:22:22,505 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:22:26,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:22:22,505 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:22:26,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:22:22,505 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.9196, 'learning_rate': 0.0001974, 'epoch': 0.38} +[WARNING|modeling_utils.py:388] 2022-03-17 15:22:30,449 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:22:22,505 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:22:30,449 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:22:22,505 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 38%|██████████████████████████████▌ | 336/892 [31:53<50:58, 5.50s/it]g-point operations will not be computed-17 15:22:22,505 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:22:34,398 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:22:22,505 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:22:34,398 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:22:22,505 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:22:34,398 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:22:22,505 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 38%|██████████████████████████████▌ | 337/892 [31:58<49:57, 5.40s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:22:38,277 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:22:40,785 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:22:38,277 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:22:40,785 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:22:38,277 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 38%|██████████████████████████████▋ | 338/892 [32:03<49:00, 5.31s/it]g-point operations will not be computed-17 15:22:38,277 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:22:44,523 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:22:38,277 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:22:46,895 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:22:38,277 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:22:46,895 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:22:38,277 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:22:49,293 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:22:38,277 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:22:49,293 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:22:38,277 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:22:49,293 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:22:38,277 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 38%|██████████████████████████████▊ | 340/892 [32:13<46:17, 5.03s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:22:52,758 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:22:54,885 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:22:52,758 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:22:54,885 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:22:52,758 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 38%|██████████████████████████████▉ | 341/892 [32:17<44:23, 4.83s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:22:57,047 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:22:59,066 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:22:57,047 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:22:59,066 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:22:57,047 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 38%|███████████████████████████████ | 342/892 [32:21<42:17, 4.61s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:23:01,080 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:23:02,940 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:23:01,080 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:23:02,940 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:23:01,080 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 38%|███████████████████████████████▏ | 343/892 [32:25<39:56, 4.37s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:23:04,806 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:23:06,535 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:23:04,806 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:23:06,535 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:23:04,806 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 39%|███████████████████████████████▏ | 344/892 [32:29<37:34, 4.11s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:23:08,244 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 39%|███████████████████████████████▏ | 344/892 [32:29<37:34, 4.11s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:23:08,244 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 39%|███████████████████████████████▎ | 345/892 [32:32<35:07, 3.85s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:23:11,396 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + g-point operations will not be computed-17 15:23:11,396 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + g-point operations will not be computed-17 15:23:11,396 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:23:15,365 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:23:14,141 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:23:15,365 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:23:14,141 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 39%|███████████████████████████████▌ | 347/892 [32:37<29:24, 3.24s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:23:16,587 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 39%|███████████████████████████████▌ | 347/892 [32:37<29:24, 3.24s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:23:16,587 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 39%|███████████████████████████████▌ | 348/892 [32:40<26:33, 2.93s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:23:18,708 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 39%|███████████████████████████████▌ | 348/892 [32:40<26:33, 2.93s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:23:18,708 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:23:21,430 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:23:20,611 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:23:21,430 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:23:20,611 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 39%|███████████████████████████████▊ | 350/892 [32:44<23:37, 2.62s/it]g-point operations will not be computed-17 15:23:20,611 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 39%|███████████████████████████████▊ | 350/892 [32:44<23:37, 2.62s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:23:24,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 39%|███████████████████████████████▊ | 350/892 [32:44<23:37, 2.62s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:23:24,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:23:28,410 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:23:24,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:23:28,410 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:23:24,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 39%|███████████████████████████████▊ | 351/892 [32:52<36:55, 4.09s/it]g-point operations will not be computed-17 15:23:24,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 39%|███████████████████████████████▊ | 351/892 [32:52<36:55, 4.09s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:23:32,087 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:23:35,618 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:23:32,087 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:23:35,618 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:23:32,087 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 39%|███████████████████████████████▉ | 352/892 [32:59<45:04, 5.01s/it]g-point operations will not be computed-17 15:23:32,087 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 39%|███████████████████████████████▉ | 352/892 [32:59<45:04, 5.01s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:23:39,213 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 39%|███████████████████████████████▉ | 352/892 [32:59<45:04, 5.01s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:23:39,213 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:23:42,698 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:23:39,213 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:23:42,698 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:23:39,213 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 40%|████████████████████████████████ | 353/892 [33:06<50:40, 5.64s/it]g-point operations will not be computed-17 15:23:39,213 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:23:48,024 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:23:39,213 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:23:48,024 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:23:39,213 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:23:48,024 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:23:39,213 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 40%|████████████████████████████████▏ | 354/892 [33:13<54:19, 6.06s/it]g-point operations will not be computed-17 15:23:39,213 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 40%|████████████████████████████████▏ | 354/892 [33:13<54:19, 6.06s/it]g-point operations will not be computed-17 15:23:39,213 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 40%|██████████████��█████████████████▏ | 354/892 [33:13<54:19, 6.06s/it]g-point operations will not be computed-17 15:23:39,213 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 40%|████████████████████████████████▏ | 354/892 [33:13<54:19, 6.06s/it]g-point operations will not be computed-17 15:23:39,213 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 40%|████████████████████████████████▏ | 354/892 [33:13<54:19, 6.06s/it]g-point operations will not be computed-17 15:23:39,213 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 40%|████████████████████████████████▏ | 355/892 [33:20<56:38, 6.33s/it]g-point operations will not be computed-17 15:23:39,213 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:24:01,941 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:23:39,213 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:24:01,941 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:23:39,213 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:24:01,941 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:23:39,213 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 40%|████████████████████████████████▎ | 356/892 [33:27<58:02, 6.50s/it]g-point operations will not be computed-17 15:23:39,213 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 40%|████████████████████████████████▎ | 356/892 [33:27<58:02, 6.50s/it]g-point operations will not be computed-17 15:23:39,213 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:24:10,479 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:23:39,213 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 40%|████████████████████████████████▍ | 357/892 [33:34<58:43, 6.59s/it]g-point operations will not be computed-17 15:23:39,213 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 40%|████████████████████████████████▍ | 357/892 [33:34<58:43, 6.59s/it]g-point operations will not be computed-17 15:23:39,213 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.9887, 'learning_rate': 0.00021059999999999997, 'epoch': 0.4} + 40%|████████████████████████████████▍ | 357/892 [33:34<58:43, 6.59s/it]g-point operations will not be computed-17 15:23:39,213 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 40%|████████████████████████████████▍ | 357/892 [33:34<58:43, 6.59s/it]g-point operations will not be computed-17 15:23:39,213 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 40%|████████████████████████████████▍ | 357/892 [33:34<58:43, 6.59s/it]g-point operations will not be computed-17 15:23:39,213 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 40%|████████████████████████████████▌ | 358/892 [33:40<59:22, 6.67s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:24:20,784 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 40%|████████████████████████████████▌ | 358/892 [33:40<59:22, 6.67s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:24:20,784 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 40%|████████████████████████████████▌ | 358/892 [33:40<59:22, 6.67s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:24:20,784 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 40%|████████████████████████████████▌ | 358/892 [33:40<59:22, 6.67s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:24:20,784 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 40%|████████████████████████████████▌ | 359/892 [33:47<59:40, 6.72s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:24:20,784 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 40%|████████████████████████████████▌ | 359/892 [33:47<59:40, 6.72s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:24:20,784 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 40%|████████████████████████████████▌ | 359/892 [33:47<59:40, 6.72s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:24:20,784 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:24:32,586 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:24:20,784 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:24:32,586 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:24:20,784 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.9564, 'learning_rate': 0.00021239999999999996, 'epoch': 0.4} +[WARNING|modeling_utils.py:388] 2022-03-17 15:24:32,586 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:24:20,784 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:24:32,586 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:24:20,784 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:24:32,586 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:24:20,784 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 40%|████████████████████████████████▊ | 361/892 [34:01<59:15, 6.70s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:24:40,921 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 40%|████████████████████████████████▊ | 361/892 [34:01<59:15, 6.70s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:24:40,921 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 40%|████████████████████████████████▊ | 361/892 [34:01<59:15, 6.70s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:24:40,921 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 40%|████████████████████████████████▊ | 361/892 [34:01<59:15, 6.70s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:24:40,921 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 41%|████████████████████████████████▊ | 362/892 [34:07<58:55, 6.67s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:24:40,921 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:24:49,132 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:24:40,921 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:24:49,132 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:24:40,921 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 41%|████████████████████████████████▉ | 363/892 [34:14<58:33, 6.64s/it]g-point operations will not be computed-17 15:24:40,921 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 41%|████████████████████████████████▉ | 363/892 [34:14<58:33, 6.64s/it]g-point operations will not be computed-17 15:24:40,921 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.7538, 'learning_rate': 0.00021419999999999998, 'epoch': 0.41} +[WARNING|modeling_utils.py:388] 2022-03-17 15:24:57,343 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:24:40,921 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 41%|█████████████████████████████████ | 364/892 [34:20<58:14, 6.62s/it]g-point operations will not be computed-17 15:24:40,921 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 41%|█████████████████████████████████ | 364/892 [34:20<58:14, 6.62s/it]g-point operations will not be computed-17 15:24:40,921 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.9914, 'learning_rate': 0.00021479999999999996, 'epoch': 0.41} +[WARNING|modeling_utils.py:388] 2022-03-17 15:25:03,875 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:24:40,921 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 41%|█████████████████████████████████▏ | 365/892 [34:27<57:56, 6.60s/it]g-point operations will not be computed-17 15:24:40,921 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 41%|█████████████████████████████████▏ | 365/892 [34:27<57:56, 6.60s/it]g-point operations will not be computed-17 15:24:40,921 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.8159, 'learning_rate': 0.00021539999999999998, 'epoch': 0.41} + 41%|█████████████████████████████████▏ | 365/892 [34:27<57:56, 6.60s/it]g-point operations will not be computed-17 15:24:40,921 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:25:11,998 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:24:40,921 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:25:11,998 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:24:40,921 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.678, 'learning_rate': 0.00021599999999999996, 'epoch': 0.41} +[WARNING|modeling_utils.py:388] 2022-03-17 15:25:11,998 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:24:40,921 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:25:11,998 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:24:40,921 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:25:11,998 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:24:40,921 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 41%|█████████████████████████████████▎ | 367/892 [34:40<57:01, 6.52s/it]g-point operations will not be computed-17 15:24:40,921 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:25:21,655 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:24:40,921 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:25:21,655 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:24:40,921 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 41%|█████████████████████████████████▍ | 368/892 [34:46<56:37, 6.48s/it]g-point operations will not be computed-17 15:24:40,921 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 41%|█████████████████████████████████▍ | 368/892 [34:46<56:37, 6.48s/it]g-point operations will not be computed-17 15:24:40,921 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:25:28,067 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:24:40,921 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:25:28,067 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:24:40,921 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 41%|█████████████████████████████████▌ | 369/892 [34:53<56:23, 6.47s/it]g-point operations will not be computed-17 15:24:40,921 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 41%|█████████████████████████████████▌ | 369/892 [34:53<56:23, 6.47s/it]g-point operations will not be computed-17 15:24:40,921 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.8139, 'learning_rate': 0.00021779999999999998, 'epoch': 0.41} +[WARNING|modeling_utils.py:388] 2022-03-17 15:25:36,076 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:24:40,921 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 41%|█████████████████████████████████▌ | 370/892 [34:59<56:09, 6.45s/it]g-point operations will not be computed-17 15:24:40,921 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 41%|█████████████████████████████████▌ | 370/892 [34:59<56:09, 6.45s/it]g-point operations will not be computed-17 15:24:40,921 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.8691, 'learning_rate': 0.00021839999999999997, 'epoch': 0.41} + 41%|█████████████████████████████████▌ | 370/892 [34:59<56:09, 6.45s/it]g-point operations will not be computed-17 15:24:40,921 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:25:44,062 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:24:40,921 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:25:44,062 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:24:40,921 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.7698, 'learning_rate': 0.00021899999999999998, 'epoch': 0.42} +[WARNING|modeling_utils.py:388] 2022-03-17 15:25:44,062 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:24:40,921 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:25:50,331 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:24:40,921 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:25:50,331 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:24:40,921 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.0252, 'learning_rate': 0.00021959999999999997, 'epoch': 0.42} +[WARNING|modeling_utils.py:388] 2022-03-17 15:25:50,331 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:24:40,921 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:25:56,610 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:24:40,921 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:25:56,610 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:24:40,921 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.7653, 'learning_rate': 0.00022019999999999999, 'epoch': 0.42} +[WARNING|modeling_utils.py:388] 2022-03-17 15:25:56,610 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:24:40,921 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:26:02,727 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:24:40,921 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:26:02,727 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:24:40,921 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.9352, 'learning_rate': 0.00022079999999999997, 'epoch': 0.42} +[WARNING|modeling_utils.py:388] 2022-03-17 15:26:02,727 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:24:40,921 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:26:02,727 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:24:40,921 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 42%|██████████████████████████████████ | 375/892 [35:31<56:15, 6.53s/it]g-point operations will not be computed-17 15:24:40,921 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 42%|██████████████████████████████████ | 375/892 [35:31<56:15, 6.53s/it]g-point operations will not be computed-17 15:24:40,921 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:26:12,989 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:24:40,921 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:26:12,989 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:24:40,921 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 42%|██████████████████████████████████▏ | 376/892 [35:37<55:05, 6.41s/it]g-point operations will not be computed-17 15:24:40,921 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 42%|██████████████████████████████████▏ | 376/892 [35:37<55:05, 6.41s/it]g-point operations will not be computed-17 15:24:40,921 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:26:18,935 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:24:40,921 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:26:18,935 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:24:40,921 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 42%|██████████████████████████████████▏ | 377/892 [35:43<53:47, 6.27s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:26:23,432 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 42%|██████████████████████████████████▏ | 377/892 [35:43<53:47, 6.27s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:26:23,432 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.5804, 'learning_rate': 0.0002226, 'epoch': 0.42} + 42%|██████████████████████████████████▏ | 377/892 [35:43<53:47, 6.27s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:26:23,432 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 42%|██████████████████████████████████▎ | 378/892 [35:49<52:49, 6.17s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:26:29,360 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 42%|██████████████████████████████████▎ | 378/892 [35:49<52:49, 6.17s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:26:29,360 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.9133, 'learning_rate': 0.00022319999999999998, 'epoch': 0.42} +[WARNING|modeling_utils.py:388] 2022-03-17 15:26:33,702 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:26:29,360 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:26:33,702 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:26:29,360 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.8053, 'learning_rate': 0.0002238, 'epoch': 0.42} +[WARNING|modeling_utils.py:388] 2022-03-17 15:26:33,702 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:26:29,360 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:26:33,702 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:26:29,360 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:26:39,489 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:26:29,360 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:26:39,489 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:26:29,360 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:26:43,833 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:26:29,360 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:26:43,833 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:26:29,360 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 43%|██████████████████████████████████▌ | 381/892 [36:07<50:30, 5.93s/it]g-point operations will not be computed-17 15:26:29,360 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 43%|██████████████████████████████████▌ | 381/892 [36:07<50:30, 5.93s/it]g-point operations will not be computed-17 15:26:29,360 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:26:49,507 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:26:29,360 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:26:49,507 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:26:29,360 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 43%|██████████████████████████████████▋ | 382/892 [36:12<49:34, 5.83s/it]g-point operations will not be computed-17 15:26:29,360 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:26:53,730 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:26:29,360 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:26:53,730 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:26:29,360 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:26:53,730 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:26:29,360 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 43%|██████████████████████████████████▊ | 383/892 [36:18<48:50, 5.76s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:26:57,898 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 43%|██████████████████████████████████▊ | 383/892 [36:18<48:50, 5.76s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:26:57,898 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 43%|██████████████████████████████████▊ | 383/892 [36:18<48:50, 5.76s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:26:57,898 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:27:01,931 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:26:57,898 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:27:04,677 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:26:57,898 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:27:04,677 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:26:57,898 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:27:04,677 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:26:57,898 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 43%|██████████████████████████████████▉ | 385/892 [36:29<47:07, 5.58s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:27:08,674 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 43%|██████████████████████████████████▉ | 385/892 [36:29<47:07, 5.58s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:27:08,674 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:27:12,503 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:27:08,674 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:27:12,503 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:27:08,674 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.7029, 'learning_rate': 0.00022799999999999999, 'epoch': 0.43} +[WARNING|modeling_utils.py:388] 2022-03-17 15:27:16,392 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:27:08,674 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:27:16,392 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:27:08,674 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 43%|███████████████████████████████████▏ | 387/892 [36:39<45:09, 5.37s/it]g-point operations will not be computed-17 15:27:08,674 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:27:20,171 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:27:08,674 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:27:22,595 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:27:08,674 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:27:22,595 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:27:08,674 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.6297, 'learning_rate': 0.0002292, 'epoch': 0.43} +[WARNING|modeling_utils.py:388] 2022-03-17 15:27:26,244 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:27:08,674 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:27:26,244 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:27:08,674 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 44%|███████████████████████████████████▎ | 389/892 [36:49<42:56, 5.12s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:27:28,679 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:27:30,949 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:27:28,679 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:27:30,949 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:27:28,679 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 44%|███████████████████████████████████▍ | 390/892 [36:53<41:36, 4.97s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:27:33,251 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 44%|███████████████████████████████████▍ | 390/892 [36:53<41:36, 4.97s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:27:33,251 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 44%|████████████████████████████████���██▍ | 390/892 [36:53<41:36, 4.97s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:27:33,251 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:27:36,436 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:27:33,251 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:27:38,644 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:27:33,251 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:27:38,644 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:27:33,251 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:27:40,672 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:27:33,251 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:27:42,695 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:27:33,251 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:27:42,695 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:27:33,251 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:27:44,632 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:27:33,251 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:27:46,544 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:27:33,251 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:27:46,544 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:27:33,251 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:27:48,283 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:27:33,251 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:27:51,633 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:27:33,251 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:27:51,633 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:27:33,251 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:27:53,233 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:27:33,251 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:27:54,596 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:27:33,251 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:27:54,596 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:27:33,251 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:27:57,180 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:27:33,251 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:27:57,180 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:27:33,251 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:27:59,345 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:27:33,251 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:27:59,345 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:27:33,251 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:28:01,284 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:27:33,251 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:28:01,284 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:27:33,251 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:28:03,894 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:27:33,251 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:28:03,894 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:27:33,251 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.5138, 'learning_rate': 0.0002364, 'epoch': 0.45} +[WARNING|modeling_utils.py:388] 2022-03-17 15:28:07,725 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:27:33,251 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:28:07,725 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:27:33,251 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:28:11,382 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:27:33,251 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:28:11,382 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:27:33,251 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.6771, 'learning_rate': 0.000237, 'epoch': 0.45} +[WARNING|modeling_utils.py:388] 2022-03-17 15:28:15,022 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:27:33,251 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:28:15,022 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:27:33,251 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:28:15,022 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:27:33,251 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:28:18,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:27:33,251 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:28:22,150 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:27:33,251 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:28:22,150 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:27:33,251 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:28:25,642 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:27:33,251 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:28:25,642 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:27:33,251 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.1976, 'learning_rate': 0.0002382, 'epoch': 0.45} +[WARNING|modeling_utils.py:388] 2022-03-17 15:28:25,642 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:27:33,251 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:28:32,609 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:27:33,251 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:28:32,609 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:27:33,251 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.0373, 'learning_rate': 0.0002388, 'epoch': 0.45} +[WARNING|modeling_utils.py:388] 2022-03-17 15:28:32,609 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:27:33,251 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:28:32,609 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:27:33,251 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 45%|████████████████████████████████████▊ | 405/892 [38:01<51:14, 6.31s/it]g-point operations will not be computed-17 15:27:33,251 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 45%|████████████████████████████████████▊ | 405/892 [38:01<51:14, 6.31s/it]g-point operations will not be computed-17 15:27:33,251 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.1013, 'learning_rate': 0.0002394, 'epoch': 0.45} + 45%|████████████████████████████████████▊ | 405/892 [38:01<51:14, 6.31s/it]g-point operations will not be computed-17 15:27:33,251 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:28:46,474 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:27:33,251 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:28:46,474 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:27:33,251 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.9948, 'learning_rate': 0.00023999999999999998, 'epoch': 0.46} +[WARNING|modeling_utils.py:388] 2022-03-17 15:28:46,474 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:27:33,251 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:28:46,474 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:27:33,251 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:28:46,474 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:27:33,251 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 46%|████████████████████████████████████▉ | 407/892 [38:15<53:21, 6.60s/it]g-point operations will not be computed-17 15:27:33,251 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:28:56,796 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:27:33,251 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:28:56,796 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:27:33,251 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 46%|█████████████████████████████████████ | 408/892 [38:22<53:49, 6.67s/it]g-point operations will not be computed-17 15:27:33,251 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 46%|█████████████████████████████████████ | 408/892 [38:22<53:49, 6.67s/it]g-point operations will not be computed-17 15:27:33,251 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.7801, 'learning_rate': 0.00024119999999999998, 'epoch': 0.46} + 46%|█████████████████████████████████████ | 408/892 [38:22<53:49, 6.67s/it]g-point operations will not be computed-17 15:27:33,251 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:29:06,959 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:27:33,251 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:29:06,959 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:27:33,251 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.9982, 'learning_rate': 0.0002418, 'epoch': 0.46} +[WARNING|modeling_utils.py:388] 2022-03-17 15:29:06,959 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:27:33,251 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:29:06,959 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:27:33,251 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 46%|█████████████████████████████████████▏ | 410/892 [38:35<53:53, 6.71s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:29:15,415 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 46%|█████████████████████████████████████▏ | 410/892 [38:35<53:53, 6.71s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:29:15,415 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.8896, 'learning_rate': 0.00024239999999999998, 'epoch': 0.46} + 46%|█████████████████████████████████████▏ | 410/892 [38:35<53:53, 6.71s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:29:15,415 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 46%|█████████████████████████████████████▎ | 411/892 [38:42<53:56, 6.73s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:29:15,415 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 46%|█████████████████████████████████████▎ | 411/892 [38:42<53:56, 6.73s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:29:15,415 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.7741, 'learning_rate': 0.000243, 'epoch': 0.46} +[WARNING|modeling_utils.py:388] 2022-03-17 15:29:25,406 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:29:15,415 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 46%|█████████████████████████████████████▍ | 412/892 [38:48<53:26, 6.68s/it]g-point operations will not be computed-17 15:29:15,415 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 46%|█████████████████████████████████████▍ | 412/892 [38:48<53:26, 6.68s/it]g-point operations will not be computed-17 15:29:15,415 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.8769, 'learning_rate': 0.00024359999999999999, 'epoch': 0.46} + 46%|█████████████████████████████████████▍ | 412/892 [38:48<53:26, 6.68s/it]g-point operations will not be computed-17 15:29:15,415 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:29:33,542 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:29:15,415 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:29:33,542 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:29:15,415 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.8612, 'learning_rate': 0.00024419999999999997, 'epoch': 0.46} +[WARNING|modeling_utils.py:388] 2022-03-17 15:29:33,542 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:29:15,415 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:29:33,542 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:29:15,415 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 46%|█████████████████████████████████████▌ | 414/892 [39:01<52:38, 6.61s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:29:41,794 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 46%|█████████████████████████████████████▌ | 414/892 [39:01<52:38, 6.61s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:29:41,794 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.6607, 'learning_rate': 0.0002448, 'epoch': 0.46} + 46%|█████████████████████████████████████▌ | 414/892 [39:01<52:38, 6.61s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:29:41,794 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 47%|█████████████████████████████████████▋ | 415/892 [39:08<52:24, 6.59s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:29:41,794 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 47%|█████████████████████████████████████▋ | 415/892 [39:08<52:24, 6.59s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:29:41,794 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.6997, 'learning_rate': 0.00024539999999999995, 'epoch': 0.47} +[WARNING|modeling_utils.py:388] 2022-03-17 15:29:51,547 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:29:41,794 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 47%|█████████████████████████████████████▊ | 416/892 [39:14<52:03, 6.56s/it]g-point operations will not be computed-17 15:29:41,794 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 47%|█████████████████████████████████████▊ | 416/892 [39:14<52:03, 6.56s/it]g-point operations will not be computed-17 15:29:41,794 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.7932, 'learning_rate': 0.00024599999999999996, 'epoch': 0.47} + 47%|█████████████████████████████████████▊ | 416/892 [39:14<52:03, 6.56s/it]g-point operations will not be computed-17 15:29:41,794 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:29:59,607 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:29:41,794 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:29:59,607 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:29:41,794 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.6429, 'learning_rate': 0.0002466, 'epoch': 0.47} +[WARNING|modeling_utils.py:388] 2022-03-17 15:29:59,607 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:29:41,794 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:29:59,607 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:29:41,794 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:30:06,068 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:29:41,794 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:30:06,068 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:29:41,794 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:30:06,068 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:29:41,794 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:30:12,441 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:29:41,794 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:30:12,441 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:29:41,794 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.825, 'learning_rate': 0.00024779999999999995, 'epoch': 0.47} +[WARNING|modeling_utils.py:388] 2022-03-17 15:30:12,441 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:29:41,794 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:30:18,661 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:29:41,794 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:30:18,661 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:29:41,794 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.8656, 'learning_rate': 0.00024839999999999997, 'epoch': 0.47} +[WARNING|modeling_utils.py:388] 2022-03-17 15:30:18,661 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:29:41,794 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:30:18,661 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:29:41,794 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:30:18,661 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:29:41,794 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 47%|██████████████████████████████████████▏ | 421/892 [39:46<50:01, 6.37s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:30:26,594 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 47%|██████████████████████████████████████▏ | 421/892 [39:46<50:01, 6.37s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:30:26,594 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 47%|██████████████████████████████████████▏ | 421/892 [39:46<50:01, 6.37s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:30:26,594 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 47%|██████████████████████████████████████▏ | 421/892 [39:46<50:01, 6.37s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:30:26,594 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 47%|██████████████████████████████████████▎ | 422/892 [39:53<49:32, 6.32s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:30:32,769 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 47%|██████████████████████████████████████▎ | 422/892 [39:53<49:32, 6.32s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:30:32,769 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 47%|██████████████████████████████████████▎ | 422/892 [39:53<49:32, 6.32s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:30:32,769 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 47%|██████████████████████████████████████▎ | 422/892 [39:53<49:32, 6.32s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:30:32,769 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 47%|██████████████████████████████████████▍ | 423/892 [39:59<48:59, 6.27s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:30:38,922 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 47%|██████████████████████████████████████▍ | 423/892 [39:59<48:59, 6.27s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:30:38,922 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 47%|██████████████████████████████████████▍ | 423/892 [39:59<48:59, 6.27s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:30:38,922 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 47%|██████████████████████████████████████▍ | 423/892 [39:59<48:59, 6.27s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:30:38,922 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 48%|██████████████████████████████████████▌ | 424/892 [40:05<48:42, 6.25s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:30:45,106 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 48%|██████████████████████████████████████▌ | 424/892 [40:05<48:42, 6.25s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:30:45,106 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 48%|██████████████████████████████████████▌ | 424/892 [40:05<48:42, 6.25s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:30:45,106 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 48%|██████████████████████████████████████▌ | 424/892 [40:05<48:42, 6.25s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:30:45,106 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 48%|██████████████████████████████████████▌ | 425/892 [40:12<50:26, 6.48s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:30:45,106 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 48%|██████████████████████████████████████▌ | 425/892 [40:12<50:26, 6.48s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:30:45,106 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:30:55,158 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:30:45,106 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:30:55,158 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:30:45,106 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 48%|██████████████████████████████████████▋ | 426/892 [40:18<49:30, 6.37s/it]g-point operations will not be computed-17 15:30:45,106 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 48%|██████████████████████████████████████▋ | 426/892 [40:18<49:30, 6.37s/it]g-point operations will not be computed-17 15:30:45,106 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:31:01,237 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:30:45,106 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:31:01,237 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:30:45,106 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 48%|██████████████████████████████████████▊ | 427/892 [40:24<48:41, 6.28s/it]g-point operations will not be computed-17 15:30:45,106 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 48%|██████████████████████████████████████▊ | 427/892 [40:24<48:41, 6.28s/it]g-point operations will not be computed-17 15:30:45,106 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:31:07,276 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:30:45,106 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:31:07,276 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:30:45,106 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 48%|██████████████████████████████████████▊ | 428/892 [40:30<47:58, 6.20s/it]g-point operations will not be computed-17 15:30:45,106 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:31:11,786 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:30:45,106 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:31:11,786 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:30:45,106 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:31:11,786 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:30:45,106 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 48%|██████████████████████████████████████▉ | 429/892 [40:36<47:18, 6.13s/it]g-point operations will not be computed-17 15:30:45,106 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:31:17,671 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:30:45,106 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:31:17,671 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:30:45,106 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:31:17,671 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:30:45,106 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 48%|███████████████████████████████████████ | 430/892 [40:42<46:35, 6.05s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:31:22,116 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 48%|███████████████████████████████████████ | 430/892 [40:42<46:35, 6.05s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:31:22,116 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:31:26,471 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:31:22,116 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:31:26,471 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:31:22,116 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.9942, 'learning_rate': 0.00025499999999999996, 'epoch': 0.48} +[WARNING|modeling_utils.py:388] 2022-03-17 15:31:26,471 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:31:22,116 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:31:32,305 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:31:22,116 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:31:32,305 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:31:22,116 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.8094, 'learning_rate': 0.0002556, 'epoch': 0.48} +[WARNING|modeling_utils.py:388] 2022-03-17 15:31:36,641 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:31:22,116 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 49%|███████████████████████████████████████▎ | 433/892 [40:59<45:04, 5.89s/it]g-point operations will not be computed-17 15:31:22,116 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 49%|███████████████████████████████████████▎ | 433/892 [40:59<45:04, 5.89s/it]g-point operations will not be computed-17 15:31:22,116 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:31:40,956 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:31:22,116 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:31:40,956 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:31:22,116 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 49%|███████████████████████████████████████▍ | 434/892 [41:05<44:27, 5.82s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:31:45,136 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 49%|███��███████████████████████████████████▍ | 434/892 [41:05<44:27, 5.82s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:31:45,136 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.7551, 'learning_rate': 0.00025679999999999995, 'epoch': 0.49} +[WARNING|modeling_utils.py:388] 2022-03-17 15:31:49,139 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:31:45,136 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:31:49,139 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:31:45,136 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.6967, 'learning_rate': 0.00025739999999999997, 'epoch': 0.49} +[WARNING|modeling_utils.py:388] 2022-03-17 15:31:53,131 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:31:45,136 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 49%|███████████████████████████████████████▌ | 436/892 [41:16<42:21, 5.57s/it]g-point operations will not be computed-17 15:31:45,136 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 49%|███████████████████████████████████████▌ | 436/892 [41:16<42:21, 5.57s/it]g-point operations will not be computed-17 15:31:45,136 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:31:57,080 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:31:45,136 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:31:59,693 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:31:45,136 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:31:59,693 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:31:45,136 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.9264, 'learning_rate': 0.0002586, 'epoch': 0.49} +[WARNING|modeling_utils.py:388] 2022-03-17 15:31:59,693 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:31:45,136 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:32:04,792 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:31:45,136 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:32:04,792 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:31:45,136 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:32:07,327 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:31:45,136 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:32:07,327 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:31:45,136 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:32:07,327 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:31:45,136 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 49%|███████████████████████████████████████▊ | 439/892 [41:31<39:31, 5.23s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:32:11,002 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:32:13,282 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:32:11,002 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 49%|███████████████████████████████████████▉ | 440/892 [41:36<38:20, 5.09s/it]g-point operations will not be computed-17 15:32:11,002 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 49%|███████████████████████████████████████▉ | 440/892 [41:36<38:20, 5.09s/it]g-point operations will not be computed-17 15:32:11,002 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:32:16,805 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:32:11,002 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:32:19,006 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:32:11,002 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:32:19,006 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:32:11,002 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:32:21,217 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:32:11,002 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:32:23,284 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:32:11,002 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:32:23,284 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:32:11,002 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:32:25,310 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:32:11,002 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:32:27,190 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:32:11,002 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:32:27,190 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:32:11,002 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:32:29,122 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:32:11,002 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:32:30,890 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:32:11,002 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:32:30,890 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:32:11,002 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:32:32,671 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:32:11,002 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:32:32,671 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:32:11,002 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:32:35,855 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:32:11,002 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:32:37,238 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:32:11,002 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:32:37,238 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:32:11,002 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:32:39,852 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:32:11,002 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:32:39,852 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:32:11,002 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:32:42,113 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:32:11,002 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:32:42,113 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:32:11,002 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:32:44,051 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:32:11,002 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:32:44,051 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:32:11,002 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:32:44,980 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:32:11,002 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:32:44,980 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:32:11,002 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:32:46,497 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:32:11,002 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:32:46,497 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:32:11,002 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:32:50,315 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:32:11,002 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:32:53,921 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:32:11,002 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:32:53,921 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:32:11,002 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.8256, 'learning_rate': 0.000267, 'epoch': 0.51} +[WARNING|modeling_utils.py:388] 2022-03-17 15:32:57,565 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:32:11,002 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:32:57,565 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:32:11,002 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:33:01,071 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:32:11,002 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:33:01,071 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:32:11,002 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.6904, 'learning_rate': 0.0002676, 'epoch': 0.51} +[WARNING|modeling_utils.py:388] 2022-03-17 15:33:04,635 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:32:11,002 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:33:08,152 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:32:11,002 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:33:08,152 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:32:11,002 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.6517, 'learning_rate': 0.00026819999999999996, 'epoch': 0.51} +[WARNING|modeling_utils.py:388] 2022-03-17 15:33:08,152 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:32:11,002 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:33:08,152 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:32:11,002 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 51%|█████████████████████████████████████████▏ | 454/892 [42:36<43:55, 6.02s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:33:16,914 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 51%|█████████████████████████████████████████▏ | 454/892 [42:36<43:55, 6.02s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:33:16,914 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.0165, 'learning_rate': 0.0002688, 'epoch': 0.51} + 51%|█████████████████████████████████████████▏ | 454/892 [42:36<43:55, 6.02s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:33:16,914 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 51%|█████████████████████████████████████████▎ | 455/892 [42:43<45:44, 6.28s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:33:16,914 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 51%|█████████████████████████████████████████▎ | 455/892 [42:43<45:44, 6.28s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:33:16,914 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.1745, 'learning_rate': 0.0002694, 'epoch': 0.51} + 51%|█████████████████████████████████████████▎ | 455/892 [42:43<45:44, 6.28s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:33:16,914 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 51%|█████████████████████████████████████████▎ | 455/892 [42:43<45:44, 6.28s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:33:16,914 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:33:28,872 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:33:16,914 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:33:28,872 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:33:16,914 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:33:28,872 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:33:16,914 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:33:28,872 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:33:16,914 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:33:28,872 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:33:16,914 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 51%|█████████████████████████████████████████▍ | 457/892 [42:57<47:33, 6.56s/it]g-point operations will not be computed-17 15:33:16,914 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:33:39,136 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:33:16,914 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:33:39,136 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:33:16,914 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:33:39,136 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:33:16,914 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 51%|█████████████████████████████████████████▌ | 458/892 [43:05<51:00, 7.05s/it]g-point operations will not be computed-17 15:33:16,914 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:33:48,019 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:33:16,914 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:33:48,019 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:33:16,914 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:33:48,019 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:33:16,914 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 51%|█████████████████████████████████████████▋ | 459/892 [43:13<51:51, 7.19s/it]g-point operations will not be computed-17 15:33:16,914 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 51%|█████████████████████████████████████████▋ | 459/892 [43:13<51:51, 7.19s/it]g-point operations will not be computed-17 15:33:16,914 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 51%|█████████████████████████████████████████▋ | 459/892 [43:13<51:51, 7.19s/it]g-point operations will not be computed-17 15:33:16,914 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:33:58,051 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:33:16,914 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:33:58,051 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:33:16,914 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.0076, 'learning_rate': 0.0002724, 'epoch': 0.52} +[WARNING|modeling_utils.py:388] 2022-03-17 15:33:58,051 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:33:16,914 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:33:58,051 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:33:16,914 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:33:58,051 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:33:16,914 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 52%|█████████████████████████████████████████▊ | 461/892 [43:26<49:39, 6.91s/it]g-point operations will not be computed-17 15:33:16,914 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:34:08,028 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:33:16,914 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:34:08,028 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:33:16,914 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:34:08,028 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:33:16,914 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 52%|█████████████████████████████████████████▉ | 462/892 [43:33<48:57, 6.83s/it]g-point operations will not be computed-17 15:33:16,914 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 52%|█████████████████████████████████████████▉ | 462/892 [43:33<48:57, 6.83s/it]g-point operations will not be computed-17 15:33:16,914 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:34:16,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:33:16,914 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 52%|██████████████████████████████████████████ | 463/892 [43:39<48:15, 6.75s/it]g-point operations will not be computed-17 15:33:16,914 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 52%|██████████████████████████████████████████ | 463/892 [43:39<48:15, 6.75s/it]g-point operations will not be computed-17 15:33:16,914 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.7875, 'learning_rate': 0.0002742, 'epoch': 0.52} + 52%|██████████████████████████████████████████ | 463/892 [43:39<48:15, 6.75s/it]g-point operations will not be computed-17 15:33:16,914 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:34:24,426 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:33:16,914 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:34:24,426 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:33:16,914 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.6762, 'learning_rate': 0.0002748, 'epoch': 0.52} +[WARNING|modeling_utils.py:388] 2022-03-17 15:34:24,426 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:33:16,914 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:34:30,870 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:33:16,914 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:34:30,870 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:33:16,914 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.8027, 'learning_rate': 0.00027539999999999997, 'epoch': 0.52} +[WARNING|modeling_utils.py:388] 2022-03-17 15:34:30,870 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:33:16,914 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:34:30,870 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:33:16,914 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:34:30,870 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:33:16,914 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 52%|██████████████████████████████████████████▎ | 466/892 [43:59<46:36, 6.56s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:34:39,024 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 52%|██████████████████████████████████████████▎ | 466/892 [43:59<46:36, 6.56s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:34:39,024 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 52%|██████████████████████████████████████████▎ | 466/892 [43:59<46:36, 6.56s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:34:39,024 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 52%|██████████████████████████████████████████▎ | 466/892 [43:59<46:36, 6.56s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:34:39,024 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 52%|██████████████████████████████████████████▍ | 467/892 [44:05<46:16, 6.53s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:34:39,024 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:34:47,002 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:34:39,024 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:34:47,002 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:34:39,024 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:34:47,002 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:34:39,024 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 52%|██████████████████████████████████████████▍ | 468/892 [44:11<45:48, 6.48s/it]g-point operations will not be computed-17 15:34:39,024 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:34:53,379 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:34:39,024 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:34:53,379 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:34:39,024 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 53%|██████████████████████████████████████████▌ | 469/892 [44:18<45:32, 6.46s/it]g-point operations will not be computed-17 15:34:39,024 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 53%|██████████████████████████████████████████▌ | 469/892 [44:18<45:32, 6.46s/it]g-point operations will not be computed-17 15:34:39,024 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.784, 'learning_rate': 0.0002778, 'epoch': 0.53} +[WARNING|modeling_utils.py:388] 2022-03-17 15:35:01,288 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:34:39,024 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 53%|██████████████████████████████████████████▋ | 470/892 [44:24<45:08, 6.42s/it]g-point operations will not be computed-17 15:34:39,024 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 53%|██████████████████████████████████████████▋ | 470/892 [44:24<45:08, 6.42s/it]g-point operations will not be computed-17 15:34:39,024 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.6701, 'learning_rate': 0.0002784, 'epoch': 0.53} +[WARNING|modeling_utils.py:388] 2022-03-17 15:35:07,623 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:34:39,024 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 53%|██████████████████████████████████████████▊ | 471/892 [44:30<44:42, 6.37s/it]g-point operations will not be computed-17 15:34:39,024 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 53%|██████████████████████████████████████████▊ | 471/892 [44:30<44:42, 6.37s/it]g-point operations will not be computed-17 15:34:39,024 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.6513, 'learning_rate': 0.000279, 'epoch': 0.53} +[WARNING|modeling_utils.py:388] 2022-03-17 15:35:13,848 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:34:39,024 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 53%|██████████████████████████████████████████▊ | 472/892 [44:37<44:24, 6.34s/it]g-point operations will not be computed-17 15:34:39,024 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 53%|██████████████████████████████████████████▊ | 472/892 [44:37<44:24, 6.34s/it]g-point operations will not be computed-17 15:34:39,024 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.6554, 'learning_rate': 0.00027959999999999997, 'epoch': 0.53} +[WARNING|modeling_utils.py:388] 2022-03-17 15:35:20,049 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:34:39,024 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 53%|██████████████████████████████████████████▉ | 473/892 [44:43<43:59, 6.30s/it]g-point operations will not be computed-17 15:34:39,024 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 53%|██████████████████████████████████████████▉ | 473/892 [44:43<43:59, 6.30s/it]g-point operations will not be computed-17 15:34:39,024 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.6965, 'learning_rate': 0.0002802, 'epoch': 0.53} + 53%|██████████████████████████████████████████▉ | 473/892 [44:43<43:59, 6.30s/it]g-point operations will not be computed-17 15:34:39,024 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:35:27,682 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:34:39,024 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:35:27,682 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:34:39,024 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.6918, 'learning_rate': 0.0002808, 'epoch': 0.53} +[WARNING|modeling_utils.py:388] 2022-03-17 15:35:27,682 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:34:39,024 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:35:27,682 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:34:39,024 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:35:27,682 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:34:39,024 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 53%|███████████████████████████████████████████▏ | 475/892 [44:56<44:52, 6.46s/it]g-point operations will not be computed-17 15:34:39,024 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:35:37,757 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:34:39,024 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:35:40,705 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:34:39,024 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:35:40,705 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:34:39,024 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.7939, 'learning_rate': 0.00028199999999999997, 'epoch': 0.53} +[WARNING|modeling_utils.py:388] 2022-03-17 15:35:40,705 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:34:39,024 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:35:46,644 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:34:39,024 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:35:46,644 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:34:39,024 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.8769, 'learning_rate': 0.0002826, 'epoch': 0.53} +[WARNING|modeling_utils.py:388] 2022-03-17 15:35:51,074 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:34:39,024 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 54%|███████████████████████████████████████████▍ | 478/892 [45:14<42:11, 6.11s/it]g-point operations will not be computed-17 15:34:39,024 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 54%|███████████████████████████████████████████▍ | 478/892 [45:14<42:11, 6.11s/it]g-point operations will not be computed-17 15:34:39,024 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.6449, 'learning_rate': 0.00028319999999999994, 'epoch': 0.54} +[WARNING|modeling_utils.py:388] 2022-03-17 15:35:56,958 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:34:39,024 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 54%|███████████████████████████████████████████▍ | 479/892 [45:20<41:34, 6.04s/it]g-point operations will not be computed-17 15:34:39,024 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 54%|███████████████████████████████████████████▍ | 479/892 [45:20<41:34, 6.04s/it]g-point operations will not be computed-17 15:34:39,024 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:36:01,347 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:34:39,024 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:36:01,347 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:34:39,024 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:36:01,347 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:34:39,024 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 54%|███████████████████████████████████████████▌ | 480/892 [45:26<40:58, 5.97s/it]g-point operations will not be computed-17 15:34:39,024 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:36:07,087 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:34:39,024 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:36:07,087 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:34:39,024 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:36:07,087 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:34:39,024 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 54%|███████████████████████████████████████████▋ | 481/892 [45:31<40:15, 5.88s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:36:11,334 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 54%|███████████████████████████████████████████▋ | 481/892 [45:31<40:15, 5.88s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:36:11,334 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 54%|███████████████████████████████████████████▋ | 481/892 [45:31<40:15, 5.88s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:36:11,334 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 54%|███████████████████████████████████████████▋ | 481/892 [45:31<40:15, 5.88s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:36:11,334 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 54%|███████████████████████████████████████████▊ | 482/892 [45:37<39:47, 5.82s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:36:17,030 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 54%|███████████████████████████████████████████▊ | 482/892 [45:37<39:47, 5.82s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:36:17,030 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 54%|██████████████████████████████���████████████▊ | 482/892 [45:37<39:47, 5.82s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:36:17,030 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:36:21,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:36:17,030 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:36:21,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:36:17,030 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:36:25,168 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:36:17,030 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:36:25,168 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:36:17,030 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 54%|███████████████████████████████████████████▉ | 484/892 [45:48<38:22, 5.64s/it]g-point operations will not be computed-17 15:36:17,030 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:36:29,197 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:36:17,030 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:36:29,197 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:36:17,030 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:36:29,197 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:36:17,030 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 54%|████████████████████████████████████████████ | 485/892 [45:53<37:36, 5.54s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:36:33,188 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 54%|████████████████████████████████████████████ | 485/892 [45:53<37:36, 5.54s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:36:33,188 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 54%|████████████████████████████████████████████ | 485/892 [45:53<37:36, 5.54s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:36:33,188 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:36:37,085 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:36:33,188 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:36:39,733 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:36:33,188 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:36:39,733 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:36:33,188 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:36:39,733 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:36:33,188 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 55%|████████████████████████████████████████████▏ | 487/892 [46:04<36:23, 5.39s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:36:43,638 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 55%|████████████████████████████████████████████▏ | 487/892 [46:04<36:23, 5.39s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:36:43,638 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 55%|████████████████████████████████████████████▏ | 487/892 [46:04<36:23, 5.39s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:36:43,638 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:36:47,276 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:36:43,638 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:36:49,721 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:36:43,638 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:36:52,069 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:36:43,638 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:36:52,069 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:36:43,638 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.7287, 'learning_rate': 0.00028979999999999994, 'epoch': 0.55} +[WARNING|modeling_utils.py:388] 2022-03-17 15:36:55,563 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:36:43,638 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:36:55,563 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:36:43,638 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 55%|████████████████████████████████████████████▍ | 490/892 [46:18<33:14, 4.96s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:36:57,828 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:36:59,967 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:36:57,828 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:36:59,967 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:36:57,828 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 55%|████████████████████████████████████████████▌ | 491/892 [46:22<31:54, 4.77s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:37:02,063 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:37:04,020 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:37:02,063 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:37:04,020 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:37:02,063 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 55%|████████████████████████████████████████████▋ | 492/892 [46:26<30:15, 4.54s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:37:05,991 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:37:07,738 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:37:05,991 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:37:07,738 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:37:05,991 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 55%|████████████████████████████████████████████▊ | 493/892 [46:30<28:21, 4.26s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:37:09,509 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 55%|████████████████████████████████████████████▊ | 493/892 [46:30<28:21, 4.26s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:37:09,509 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 55%|████████████████████████████████████████████▊ | 494/892 [46:33<26:18, 3.97s/it]g-point operations will not be computed-17 15:37:09,509 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:37:14,144 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:37:12,688 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:37:14,144 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:37:12,688 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 55%|████████████████████████████████████████████▉ | 495/892 [46:36<24:15, 3.67s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:37:15,594 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 55%|████████████████████████████████████████████▉ | 495/892 [46:36<24:15, 3.67s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:37:15,594 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 56%|█████████████████████████████████████████████ | 496/892 [46:39<22:13, 3.37s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:37:18,192 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 56%|█████████████████████████████████████████████ | 496/892 [46:39<22:13, 3.37s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:37:18,192 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 56%|█████████████████████████████████████████████▏ | 497/892 [46:41<20:16, 3.08s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:37:20,516 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 56%|█████████████████████████████████████████████▏ | 497/892 [46:41<20:16, 3.08s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:37:20,516 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 56%|█████████████████████████████████████████████▏ | 498/892 [46:43<18:15, 2.78s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:37:22,549 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 56%|█████████████████████████████████████████████▏ | 498/892 [46:43<18:15, 2.78s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:37:22,549 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 56%|█████████████████████████████████████████████▎ | 499/892 [46:45<16:28, 2.51s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:37:24,405 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 56%|█████████████████████████████████████████████▍ | 500/892 [46:48<16:15, 2.49s/it]g-point operations will not be computed-17 15:37:24,405 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 56%|█████████████████████████████████████████████▍ | 500/892 [46:48<16:15, 2.49s/it]g-point operations will not be computed-17 15:37:24,405 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 56%|█████████████████████████████████████████████▍ | 500/892 [46:48<16:15, 2.49s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:37:28,341 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 56%|█████████████████████████████████████████████▍ | 500/892 [46:48<16:15, 2.49s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:37:28,341 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:37:31,924 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:37:28,341 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:37:31,924 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:37:28,341 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 56%|█████████████████████████████████████████████▍ | 501/892 [46:55<25:49, 3.96s/it]g-point operations will not be computed-17 15:37:28,341 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 56%|█████████████████████████████████████████████▍ | 501/892 [46:55<25:49, 3.96s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:37:35,603 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 56%|█████████████████████████████████████████████▍ | 501/892 [46:55<25:49, 3.96s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:37:35,603 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 56%|█████████████████████████████████████████████▌ | 502/892 [47:02<32:04, 4.94s/it]g-point operations will not be computed-17 15:37:35,603 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 56%|█████████████████████████████████████████████▌ | 502/892 [47:02<32:04, 4.94s/it]g-point operations will not be computed-17 15:37:35,603 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 56%|█████████████████████████████████████████████▌ | 502/892 [47:02<32:04, 4.94s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:37:42,759 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 56%|█████████████████████████████████████████████▌ | 502/892 [47:02<32:04, 4.94s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:37:42,759 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:37:46,211 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:37:42,759 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:37:46,211 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:37:42,759 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 56%|█████████████████████████████████████████████▋ | 503/892 [47:09<36:07, 5.57s/it]g-point operations will not be computed-17 15:37:42,759 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 56%|█████████████████████████████████████████████▋ | 503/892 [47:09<36:07, 5.57s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:37:49,805 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 56%|█████████████████████████████████████████████▋ | 503/892 [47:09<36:07, 5.57s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:37:49,805 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:37:54,980 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:37:49,805 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:37:54,980 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:37:49,805 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.1749, 'learning_rate': 0.0002988, 'epoch': 0.57} +[WARNING|modeling_utils.py:388] 2022-03-17 15:37:54,980 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:37:49,805 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:37:54,980 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:37:49,805 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:37:54,980 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:37:49,805 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 57%|█████████████████████████████████████████████▊ | 505/892 [47:23<40:21, 6.26s/it]g-point operations will not be computed-17 15:37:49,805 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:38:05,281 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:37:49,805 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:38:05,281 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:37:49,805 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:38:05,281 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:37:49,805 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 57%|█████████████████████████████████████████████▉ | 506/892 [47:30<41:20, 6.43s/it]g-point operations will not be computed-17 15:37:49,805 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 57%|█████████████████████████████████████████████▉ | 506/892 [47:30<41:20, 6.43s/it]g-point operations will not be computed-17 15:37:49,805 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 57%|█████████████████████████████████████████████▉ | 506/892 [47:30<41:20, 6.43s/it]g-point operations will not be computed-17 15:37:49,805 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:38:15,459 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:37:49,805 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:38:15,459 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:37:49,805 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.9699, 'learning_rate': 0.000299234693877551, 'epoch': 0.57} +[WARNING|modeling_utils.py:388] 2022-03-17 15:38:15,459 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:37:49,805 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:38:15,459 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:37:49,805 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:38:15,459 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:37:49,805 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 57%|██████████████████████████████████████████████▏ | 508/892 [47:44<42:20, 6.62s/it]g-point operations will not be computed-17 15:37:49,805 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:38:25,691 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:37:49,805 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:38:25,691 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:37:49,805 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 57%|██████████████████████████████████████████████▏ | 509/892 [47:50<42:25, 6.65s/it]g-point operations will not be computed-17 15:37:49,805 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 57%|██████████████████████████████████████████████▏ | 509/892 [47:50<42:25, 6.65s/it]g-point operations will not be computed-17 15:37:49,805 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.9586, 'learning_rate': 0.00029770408163265304, 'epoch': 0.57} + 57%|██████████████████████████████████████████████▏ | 509/892 [47:50<42:25, 6.65s/it]g-point operations will not be computed-17 15:37:49,805 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:38:35,728 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:37:49,805 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:38:35,728 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:37:49,805 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.8407, 'learning_rate': 0.0002969387755102041, 'epoch': 0.57} +[WARNING|modeling_utils.py:388] 2022-03-17 15:38:35,728 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:37:49,805 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:38:42,381 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:37:49,805 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:38:42,381 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:37:49,805 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.7549, 'learning_rate': 0.00029617346938775506, 'epoch': 0.57} +[WARNING|modeling_utils.py:388] 2022-03-17 15:38:42,381 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:37:49,805 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:38:42,381 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:37:49,805 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:38:42,381 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:37:49,805 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 57%|██████████████████████████████████████████████▍ | 512/892 [48:10<42:04, 6.64s/it]g-point operations will not be computed-17 15:37:49,805 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 57%|██████████████████████████████████████████████▍ | 512/892 [48:10<42:04, 6.64s/it]g-point operations will not be computed-17 15:37:49,805 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:38:53,982 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:37:49,805 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:38:53,982 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:37:49,805 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 58%|██████████████████████████████████████████████▌ | 513/892 [48:17<41:55, 6.64s/it]g-point operations will not be computed-17 15:37:49,805 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 58%|██████████████████████████████████████████████▌ | 513/892 [48:17<41:55, 6.64s/it]g-point operations will not be computed-17 15:37:49,805 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:39:00,551 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:37:49,805 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 58%|██████████████████████████████████████████████▋ | 514/892 [48:24<41:44, 6.63s/it]g-point operations will not be computed-17 15:37:49,805 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 58%|██████████████████████████████████████████████▋ | 514/892 [48:24<41:44, 6.63s/it]g-point operations will not be computed-17 15:37:49,805 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.7472, 'learning_rate': 0.0002938775510204081, 'epoch': 0.58} +[WARNING|modeling_utils.py:388] 2022-03-17 15:39:07,051 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:37:49,805 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 58%|██████████████████████████████████████████████▊ | 515/892 [48:30<41:23, 6.59s/it]g-point operations will not be computed-17 15:37:49,805 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 58%|██████████████████████████████████████████████▊ | 515/892 [48:30<41:23, 6.59s/it]g-point operations will not be computed-17 15:37:49,805 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.7657, 'learning_rate': 0.00029311224489795917, 'epoch': 0.58} + 58%|██████████████████████████████████████████████▊ | 515/892 [48:30<41:23, 6.59s/it]g-point operations will not be computed-17 15:37:49,805 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:39:15,154 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:37:49,805 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:39:15,154 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:37:49,805 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.5764, 'learning_rate': 0.0002923469387755102, 'epoch': 0.58} +[WARNING|modeling_utils.py:388] 2022-03-17 15:39:15,154 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:37:49,805 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:39:15,154 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:37:49,805 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:39:15,154 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:37:49,805 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 58%|██████████████████████████████████████████████▉ | 517/892 [48:43<40:46, 6.52s/it]g-point operations will not be computed-17 15:37:49,805 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:39:24,870 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:37:49,805 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:39:24,870 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:37:49,805 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 58%|███████████████████████████████████████████████ | 518/892 [48:49<40:30, 6.50s/it]g-point operations will not be computed-17 15:37:49,805 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 58%|███████████████████████████████████████████████ | 518/892 [48:49<40:30, 6.50s/it]g-point operations will not be computed-17 15:37:49,805 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:39:31,271 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:37:49,805 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:39:31,271 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:37:49,805 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 58%|███████████████████████████████████████████████▏ | 519/892 [48:56<40:12, 6.47s/it]g-point operations will not be computed-17 15:37:49,805 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 58%|███████████████████████████████████████████████▏ | 519/892 [48:56<40:12, 6.47s/it]g-point operations will not be computed-17 15:37:49,805 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:39:37,580 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:37:49,805 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:39:37,580 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:37:49,805 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 58%|███████████████████████████████████████████████▏ | 520/892 [49:02<39:43, 6.41s/it]g-point operations will not be computed-17 15:37:49,805 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 58%|███████████████████████████████████████████████▏ | 520/892 [49:02<39:43, 6.41s/it]g-point operations will not be computed-17 15:37:49,805 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:39:43,981 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:37:49,805 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:39:43,981 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:37:49,805 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 58%|███████████████████████████████████████████████▎ | 521/892 [49:08<39:31, 6.39s/it]g-point operations will not be computed-17 15:37:49,805 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 58%|███████████████████████████████████████████████▎ | 521/892 [49:08<39:31, 6.39s/it]g-point operations will not be computed-17 15:37:49,805 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.7104, 'learning_rate': 0.0002885204081632653, 'epoch': 0.58} +[WARNING|modeling_utils.py:388] 2022-03-17 15:39:51,807 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:37:49,805 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 59%|███████████████████████████████████████████████▍ | 522/892 [49:15<39:15, 6.37s/it]g-point operations will not be computed-17 15:37:49,805 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 59%|███████████████████████████████████████████████▍ | 522/892 [49:15<39:15, 6.37s/it]g-point operations will not be computed-17 15:37:49,805 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.661, 'learning_rate': 0.0002877551020408163, 'epoch': 0.59} +[WARNING|modeling_utils.py:388] 2022-03-17 15:39:58,015 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:37:49,805 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 59%|███████████████████████████████████████████████▍ | 523/892 [49:21<38:46, 6.31s/it]g-point operations will not be computed-17 15:37:49,805 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 59%|███████████████████████████████████████████████▍ | 523/892 [49:21<38:46, 6.31s/it]g-point operations will not be computed-17 15:37:49,805 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.5696, 'learning_rate': 0.0002869897959183673, 'epoch': 0.59} + 59%|███████████████████████████████████████████████▍ | 523/892 [49:21<38:46, 6.31s/it]g-point operations will not be computed-17 15:37:49,805 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:40:05,739 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:37:49,805 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:40:05,739 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:37:49,805 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.6741, 'learning_rate': 0.00028622448979591836, 'epoch': 0.59} +[WARNING|modeling_utils.py:388] 2022-03-17 15:40:10,292 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:37:49,805 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 59%|███████████████████████████████████████████████▋ | 525/892 [49:34<39:54, 6.53s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:40:14,503 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 59%|███████████████████████████████████████████████▋ | 525/892 [49:34<39:54, 6.53s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:40:14,503 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.7646, 'learning_rate': 0.0002854591836734694, 'epoch': 0.59} + 59%|███████████████████████████████████████████████▋ | 525/892 [49:34<39:54, 6.53s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:40:14,503 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 59%|███████████████████████████████████████████████▊ | 526/892 [49:40<39:04, 6.41s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:40:14,503 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 59%|███████████████████████████████████████████████▊ | 526/892 [49:40<39:04, 6.41s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:40:14,503 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:40:22,029 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:40:14,503 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:40:22,029 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:40:14,503 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 59%|███████████████████████████████████████████████▊ | 527/892 [49:46<38:17, 6.29s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:40:26,573 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 59%|███████████████████████████████████████████████▊ | 527/892 [49:46<38:17, 6.29s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:40:26,573 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.64, 'learning_rate': 0.00028392857142857137, 'epoch': 0.59} + 59%|███████████████████████████████████████████████▊ | 527/892 [49:46<38:17, 6.29s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:40:26,573 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 59%|███████████████████████████████████████████████▊ | 527/892 [49:46<38:17, 6.29s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:40:26,573 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 59%|███████████████████████████████████████████████▉ | 528/892 [49:52<37:40, 6.21s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:40:32,581 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 59%|███████████████████████████████████████████████▉ | 528/892 [49:52<37:40, 6.21s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:40:32,581 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 59%|███████████████████████████████████████████████▉ | 528/892 [49:52<37:40, 6.21s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:40:32,581 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:40:36,929 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:40:32,581 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:40:36,929 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:40:32,581 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:40:36,929 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:40:32,581 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:40:36,929 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:40:32,581 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:40:42,759 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:40:32,581 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:40:42,759 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:40:32,581 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:40:47,159 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:40:32,581 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:40:47,159 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:40:32,581 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 60%|████████████████████████████████████████████████▏ | 531/892 [50:10<35:54, 5.97s/it]g-point operations will not be computed-17 15:40:32,581 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 60%|████████████████████████████████████████████████▏ | 531/892 [50:10<35:54, 5.97s/it]g-point operations will not be computed-17 15:40:32,581 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:40:52,897 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:40:32,581 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:40:52,897 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:40:32,581 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 60%|████████████████████████████████████████████████▎ | 532/892 [50:16<35:23, 5.90s/it]g-point operations will not be computed-17 15:40:32,581 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:40:57,167 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:40:32,581 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:40:57,167 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:40:32,581 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:40:57,167 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:40:32,581 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 60%|████████████████████████████████████████████████▍ | 533/892 [50:21<34:44, 5.81s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:41:01,309 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 60%|████████████████████████████████████████████████▍ | 533/892 [50:21<34:44, 5.81s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:41:01,309 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 60%|████████████████████████████████████████████████▍ | 533/892 [50:21<34:44, 5.81s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:41:01,309 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:41:05,315 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:41:01,309 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:41:05,315 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:41:01,309 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:41:09,422 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:41:01,309 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:41:09,422 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:41:01,309 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 60%|████████████████████████████████████████████████▌ | 535/892 [50:32<33:23, 5.61s/it]g-point operations will not be computed-17 15:41:01,309 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:41:13,452 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:41:01,309 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:41:13,452 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:41:01,309 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:41:13,452 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:41:01,309 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 60%|████████████████████████████████████████████████▋ | 536/892 [50:37<32:44, 5.52s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:41:17,436 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 60%|████████████████████████████████████████████████▋ | 536/892 [50:37<32:44, 5.52s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:41:17,436 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 60%|████████████████████████████████████████████████▋ | 536/892 [50:37<32:44, 5.52s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:41:17,436 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:41:21,385 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:41:17,436 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:41:21,385 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:41:17,436 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:41:25,259 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:41:17,436 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 60%|████████████████████████████████████████████████▊ | 538/892 [50:48<31:36, 5.36s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:41:27,801 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 60%|████████████████████████████████████████████████▊ | 538/892 [50:48<31:36, 5.36s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:41:27,801 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.7634, 'learning_rate': 0.00027551020408163264, 'epoch': 0.6} + 60%|████████████████████████████████████████████████▊ | 538/892 [50:48<31:36, 5.36s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:41:27,801 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:41:31,319 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:41:27,801 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:41:33,647 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:41:27,801 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:41:33,647 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:41:27,801 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:41:35,808 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:41:27,801 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:41:37,962 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:41:27,801 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:41:37,962 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:41:27,801 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:41:39,926 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:41:27,801 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:41:41,917 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:41:27,801 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:41:41,917 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:41:27,801 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:41:43,803 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:41:27,801 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:41:45,657 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:41:27,801 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:41:45,657 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:41:27,801 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:41:47,315 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:41:27,801 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:41:48,959 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:41:27,801 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:41:48,959 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:41:27,801 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:41:51,945 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:41:27,801 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:41:51,945 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:41:27,801 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:41:53,277 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:41:27,801 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:41:53,277 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:41:27,801 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:41:55,852 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:41:27,801 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:41:57,086 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:41:27,801 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:41:57,086 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:41:27,801 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:41:59,340 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:41:27,801 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:41:59,340 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:41:27,801 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:42:01,375 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:41:27,801 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:42:01,375 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:41:27,801 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:42:03,159 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:41:27,801 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:42:03,159 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:41:27,801 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:42:04,724 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:41:27,801 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:42:04,724 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:41:27,801 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:42:08,491 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:41:27,801 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:42:08,491 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:41:27,801 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:42:12,135 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:41:27,801 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:42:12,135 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:41:27,801 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:42:15,755 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:41:27,801 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:42:15,755 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:41:27,801 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:42:15,755 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:41:27,801 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:42:19,233 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:41:27,801 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:42:22,827 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:41:27,801 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:42:22,827 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:41:27,801 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:42:22,827 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:41:27,801 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:42:26,357 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:41:27,801 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:42:26,357 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:41:27,801 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:42:29,885 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:41:27,801 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:42:29,885 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:41:27,801 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:42:29,885 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:41:27,801 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 62%|███████████████████████████████████████████████��██▎ | 554/892 [51:55<33:42, 5.98s/it]g-point operations will not be computed-17 15:41:27,801 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:42:36,790 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:41:27,801 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:42:36,790 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:41:27,801 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:42:36,790 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:41:27,801 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 62%|██████████████████████████████████████████████████▍ | 555/892 [52:02<35:05, 6.25s/it]g-point operations will not be computed-17 15:41:27,801 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 62%|██████████████████████████████████████████████████▍ | 555/892 [52:02<35:05, 6.25s/it]g-point operations will not be computed-17 15:41:27,801 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 62%|██████████████████████████████████████████████████▍ | 555/892 [52:02<35:05, 6.25s/it]g-point operations will not be computed-17 15:41:27,801 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:42:47,034 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:41:27,801 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:42:47,034 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:41:27,801 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.9042, 'learning_rate': 0.000261734693877551, 'epoch': 0.62} +[WARNING|modeling_utils.py:388] 2022-03-17 15:42:47,034 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:41:27,801 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:42:47,034 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:41:27,801 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:42:47,034 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:41:27,801 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 62%|██████████████████████████████████████████████████▌ | 557/892 [52:15<36:28, 6.53s/it]g-point operations will not be computed-17 15:41:27,801 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:42:57,246 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:41:27,801 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:42:57,246 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:41:27,801 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:42:57,246 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:41:27,801 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 63%|██████████████████████████████████████████████████▋ | 558/892 [52:22<36:51, 6.62s/it]g-point operations will not be computed-17 15:41:27,801 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 63%|██████████████████████████████████████████████████▋ | 558/892 [52:22<36:51, 6.62s/it]g-point operations will not be computed-17 15:41:27,801 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:43:05,713 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:41:27,801 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 63%|██████████████████████████████████████████████████▊ | 559/892 [52:29<37:00, 6.67s/it]g-point operations will not be computed-17 15:41:27,801 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 63%|██████████████████████████████████████████████████▊ | 559/892 [52:29<37:00, 6.67s/it]g-point operations will not be computed-17 15:41:27,801 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.7679, 'learning_rate': 0.00025943877551020403, 'epoch': 0.63} + 63%|██████████████████████████████████████████████████▊ | 559/892 [52:29<37:00, 6.67s/it]g-point operations will not be computed-17 15:41:27,801 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:43:14,100 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:41:27,801 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:43:14,100 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:41:27,801 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.6943, 'learning_rate': 0.00025867346938775507, 'epoch': 0.63} +[WARNING|modeling_utils.py:388] 2022-03-17 15:43:14,100 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:41:27,801 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:43:14,100 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:41:27,801 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:43:14,100 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:41:27,801 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 63%|██████████████████████████████████████████████████▉ | 561/892 [52:42<36:39, 6.64s/it]g-point operations will not be computed-17 15:41:27,801 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:43:23,980 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:41:27,801 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:43:23,980 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:41:27,801 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 63%|███████████████████████████████████████████████████ | 562/892 [52:49<36:27, 6.63s/it]g-point operations will not be computed-17 15:41:27,801 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 63%|███████████████████████████████████████████████████ | 562/892 [52:49<36:27, 6.63s/it]g-point operations will not be computed-17 15:41:27,801 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.6494, 'learning_rate': 0.0002571428571428571, 'epoch': 0.63} +[WARNING|modeling_utils.py:388] 2022-03-17 15:43:32,178 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:41:27,801 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 63%|███████████████████████████████████████████████████ | 563/892 [52:55<36:10, 6.60s/it]g-point operations will not be computed-17 15:41:27,801 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 63%|███████████████████████████████████████████████████ | 563/892 [52:55<36:10, 6.60s/it]g-point operations will not be computed-17 15:41:27,801 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.6779, 'learning_rate': 0.00025637755102040814, 'epoch': 0.63} + 63%|███████████████████████████████████████████████████ | 563/892 [52:55<36:10, 6.60s/it]g-point operations will not be computed-17 15:41:27,801 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:43:40,298 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:41:27,801 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:43:40,298 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:41:27,801 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.6811, 'learning_rate': 0.0002556122448979592, 'epoch': 0.63} +[WARNING|modeling_utils.py:388] 2022-03-17 15:43:40,298 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:41:27,801 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:43:46,773 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:41:27,801 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:43:46,773 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:41:27,801 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.7522, 'learning_rate': 0.0002548469387755102, 'epoch': 0.63} +[WARNING|modeling_utils.py:388] 2022-03-17 15:43:46,773 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:41:27,801 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:43:46,773 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:41:27,801 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:43:46,773 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:41:27,801 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 63%|███████████████████████████████████████████████████▍ | 566/892 [53:15<35:23, 6.51s/it]g-point operations will not be computed-17 15:41:27,801 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:43:56,445 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:41:27,801 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:43:56,445 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:41:27,801 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:43:56,445 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:41:27,801 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 64%|███████████████████████████████████████████████████▍ | 567/892 [53:21<35:06, 6.48s/it]g-point operations will not be computed-17 15:41:27,801 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:44:02,820 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:41:27,801 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:44:02,820 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:41:27,801 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 64%|███████████████████████████████████████████████████▌ | 568/892 [53:27<34:50, 6.45s/it]g-point operations will not be computed-17 15:41:27,801 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 64%|███████████████████████████████████████████████████▌ | 568/892 [53:27<34:50, 6.45s/it]g-point operations will not be computed-17 15:41:27,801 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:44:09,217 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:41:27,801 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:44:09,217 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:41:27,801 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 64%|███████████████████████████████████████████████████▋ | 569/892 [53:34<34:29, 6.41s/it]g-point operations will not be computed-17 15:41:27,801 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 64%|███████████████████████████████████████████████████▋ | 569/892 [53:34<34:29, 6.41s/it]g-point operations will not be computed-17 15:41:27,801 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.6458, 'learning_rate': 0.00025178571428571426, 'epoch': 0.64} + 64%|███████████████████████████████████████████████████▋ | 569/892 [53:34<34:29, 6.41s/it]g-point operations will not be computed-17 15:41:27,801 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:44:18,603 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:41:27,801 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:44:18,603 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:41:27,801 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.6042, 'learning_rate': 0.0002510204081632653, 'epoch': 0.64} +[WARNING|modeling_utils.py:388] 2022-03-17 15:44:18,603 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:41:27,801 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:44:24,872 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:41:27,801 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:44:24,872 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:41:27,801 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4918, 'learning_rate': 0.0002502551020408163, 'epoch': 0.64} +[WARNING|modeling_utils.py:388] 2022-03-17 15:44:24,872 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:41:27,801 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:44:31,119 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:41:27,801 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:44:31,119 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:41:27,801 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.6797, 'learning_rate': 0.00024948979591836733, 'epoch': 0.64} +[WARNING|modeling_utils.py:388] 2022-03-17 15:44:31,119 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:41:27,801 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:44:37,193 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:41:27,801 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:44:37,193 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:41:27,801 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.5863, 'learning_rate': 0.00024872448979591837, 'epoch': 0.64} +[WARNING|modeling_utils.py:388] 2022-03-17 15:44:41,802 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:41:27,801 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 64%|████████████████████████████████████████████████████ | 574/892 [54:05<32:56, 6.22s/it]g-point operations will not be computed-17 15:41:27,801 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 64%|████████████████████████████████████████████████████ | 574/892 [54:05<32:56, 6.22s/it]g-point operations will not be computed-17 15:41:27,801 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4528, 'learning_rate': 0.00024795918367346935, 'epoch': 0.64} +[WARNING|modeling_utils.py:388] 2022-03-17 15:44:47,946 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:41:27,801 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:44:47,946 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:41:27,801 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 64%|████████████████████████████████████████████████████▏ | 575/892 [54:12<34:19, 6.50s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:44:52,109 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 64%|████████████████████████████████████████████████████▏ | 575/892 [54:12<34:19, 6.50s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:44:52,109 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 64%|████████████████████████████████████████████████████▏ | 575/892 [54:12<34:19, 6.50s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:44:52,109 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 64%|████████████████████████████████████████████████████▏ | 575/892 [54:12<34:19, 6.50s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:44:52,109 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 65%|████████████████████████████████████████████████████▎ | 576/892 [54:18<33:29, 6.36s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:44:58,131 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 65%|████████████████████████████████████████████████████▎ | 576/892 [54:18<33:29, 6.36s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:44:58,131 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:45:02,557 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:44:58,131 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:45:02,557 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:44:58,131 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.6087, 'learning_rate': 0.0002456632653061224, 'epoch': 0.65} +[WARNING|modeling_utils.py:388] 2022-03-17 15:45:02,557 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:44:58,131 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:45:08,483 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:44:58,131 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:45:08,483 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:44:58,131 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.6959, 'learning_rate': 0.00024489795918367346, 'epoch': 0.65} +[WARNING|modeling_utils.py:388] 2022-03-17 15:45:08,483 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:44:58,131 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:45:14,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:44:58,131 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:45:14,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:44:58,131 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3075, 'learning_rate': 0.00024413265306122447, 'epoch': 0.65} +[WARNING|modeling_utils.py:388] 2022-03-17 15:45:14,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:44:58,131 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:45:20,230 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:44:58,131 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:45:20,230 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:44:58,131 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.7373, 'learning_rate': 0.00024336734693877548, 'epoch': 0.65} +[WARNING|modeling_utils.py:388] 2022-03-17 15:45:24,637 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:44:58,131 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 65%|████████████████████████████████████████████████████▊ | 581/892 [54:47<30:52, 5.96s/it]g-point operations will not be computed-17 15:44:58,131 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 65%|████████████████████████████████████████████████████▊ | 581/892 [54:47<30:52, 5.96s/it]g-point operations will not be computed-17 15:44:58,131 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.7056, 'learning_rate': 0.0002426020408163265, 'epoch': 0.65} +[WARNING|modeling_utils.py:388] 2022-03-17 15:45:30,396 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:44:58,131 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 65%|████████████████████████████████████████████████████▊ | 582/892 [54:53<30:24, 5.88s/it]g-point operations will not be computed-17 15:44:58,131 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 65%|████████████████████████████████████████████████████▊ | 582/892 [54:53<30:24, 5.88s/it]g-point operations will not be computed-17 15:44:58,131 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:45:34,693 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:44:58,131 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:45:34,693 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:44:58,131 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:45:34,693 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:44:58,131 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 65%|████████████████████████████████████████████████████▉ | 583/892 [54:59<29:57, 5.82s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:45:38,876 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 65%|████████████████████████████████████████████████████▉ | 583/892 [54:59<29:57, 5.82s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:45:38,876 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:45:42,907 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:45:38,876 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:45:42,907 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:45:38,876 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.5181, 'learning_rate': 0.00024030612244897956, 'epoch': 0.65} +[WARNING|modeling_utils.py:388] 2022-03-17 15:45:46,947 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:45:38,876 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 66%|█████████████████████████████████████████████████████ | 585/892 [55:10<28:40, 5.60s/it]g-point operations will not be computed-17 15:45:38,876 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 66%|█████████████████████████████████████████████████████ | 585/892 [55:10<28:40, 5.60s/it]g-point operations will not be computed-17 15:45:38,876 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:45:51,011 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:45:38,876 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:45:51,011 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:45:38,876 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:45:51,011 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:45:38,876 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 66%|█████████████████████████████████████████████████████▏ | 586/892 [55:15<28:11, 5.53s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:45:54,993 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 66%|█████████████████████████████████████████████████████▏ | 586/892 [55:15<28:11, 5.53s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:45:54,993 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:45:58,827 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:45:54,993 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:45:58,827 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:45:54,993 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:46:01,416 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:45:54,993 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:46:01,416 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:45:54,993 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:46:01,416 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:45:54,993 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 66%|█████████████████████████████████████████████████████▍ | 588/892 [55:25<26:58, 5.32s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:46:05,205 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:46:07,619 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:46:05,205 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 66%|█████████████████████████████████████████████████████▍ | 589/892 [55:30<26:16, 5.20s/it]g-point operations will not be computed-17 15:46:05,205 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 66%|█████████████████████████████████████████████████████▍ | 589/892 [55:30<26:16, 5.20s/it]g-point operations will not be computed-17 15:46:05,205 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:46:11,277 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:46:05,205 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:46:13,609 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:46:05,205 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:46:13,609 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:46:05,205 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:46:15,930 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:46:05,205 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:46:15,930 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:46:05,205 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 66%|█████████████████████████████████████████████████████▋ | 591/892 [55:40<24:41, 4.92s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:46:19,310 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 66%|█████████████████████████████████████████████████████▋ | 591/892 [55:40<24:41, 4.92s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:46:19,310 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:46:21,441 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:46:19,310 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 66%|█████████████████████████████████████████████████████▊ | 592/892 [55:44<23:41, 4.74s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:46:23,553 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 66%|█████████████████████████████████████████████████████▊ | 592/892 [55:44<23:41, 4.74s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:46:23,553 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:46:25,538 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:46:23,553 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 66%|█████████████████████████████████████████████████████▊ | 593/892 [55:48<22:31, 4.52s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:46:27,483 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 66%|█████████████████████████████████████████████████████▊ | 593/892 [55:48<22:31, 4.52s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:46:27,483 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:46:29,284 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:46:27,483 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:46:29,284 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:46:27,483 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 67%|█████████████████████████████████████████████████████▉ | 594/892 [55:52<21:11, 4.27s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:46:31,067 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 67%|██████████████████████████████████████████████████████ | 595/892 [55:55<19:44, 3.99s/it]g-point operations will not be computed-17 15:46:31,067 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 67%|██████████████████████████████████████████████████████ | 595/892 [55:55<19:44, 3.99s/it]g-point operations will not be computed-17 15:46:31,067 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:46:35,751 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:46:34,349 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:46:35,751 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:46:34,349 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 67%|██████████████████████████████████████████████████████ | 596/892 [55:58<18:06, 3.67s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:46:37,178 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 67%|██████████████████████████████████████████████████████▏ | 597/892 [56:00<16:29, 3.35s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:46:39,691 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 67%|██████████████████████████████████████████████████████▏ | 597/892 [56:00<16:29, 3.35s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:46:39,691 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 67%|██████████████████████████████████████████████████████▎ | 598/892 [56:03<14:49, 3.03s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:46:41,871 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 67%|██████████████████████████████████████████████████████▎ | 598/892 [56:03<14:49, 3.03s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:46:41,871 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 67%|██████████████████████████████████████████████████████▍ | 599/892 [56:05<13:10, 2.70s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:46:43,747 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 67%|██████████████████████████████████████████████████████▍ | 599/892 [56:05<13:10, 2.70s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:46:43,747 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 67%|██████████████████████████████████████████████████████▍ | 600/892 [56:07<12:56, 2.66s/it]g-point operations will not be computed-17 15:46:43,747 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 67%|██████████████████████████████████████████████████████▍ | 600/892 [56:07<12:56, 2.66s/it]g-point operations will not be computed-17 15:46:43,747 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 67%|██████████████████████████████████████████████████████▍ | 600/892 [56:07<12:56, 2.66s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:46:47,766 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 67%|██████████████████████████████████████████████████████▍ | 600/892 [56:07<12:56, 2.66s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:46:47,766 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:46:51,466 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:46:47,766 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 67%|██████████████████████████████████████████████████████▌ | 601/892 [56:15<19:54, 4.11s/it]g-point operations will not be computed-17 15:46:47,766 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 67%|██████████████████████████████████████████████████████▌ | 601/892 [56:15<19:54, 4.11s/it]g-point operations will not be computed-17 15:46:47,766 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 67%|██████████████████████████████████████████████████████▌ | 601/892 [56:15<19:54, 4.11s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:46:55,129 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 67%|██████████████████████████████████████████████████████▌ | 601/892 [56:15<19:54, 4.11s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:46:55,129 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:46:58,713 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:46:55,129 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:46:58,713 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:46:55,129 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 67%|██████████████████████████████████████████████████████▋ | 602/892 [56:22<24:17, 5.03s/it]g-point operations will not be computed-17 15:46:55,129 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 67%|██████████████████████████████████████████████████████▋ | 602/892 [56:22<24:17, 5.03s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:47:02,303 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:47:05,790 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:47:02,303 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 68%|██████████████████████████████████████████████████████▊ | 603/892 [56:29<27:10, 5.64s/it]g-point operations will not be computed-17 15:47:02,303 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 68%|██████████████████████████████████████████████████████▊ | 603/892 [56:29<27:10, 5.64s/it]g-point operations will not be computed-17 15:47:02,303 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.1314, 'learning_rate': 0.00022576530612244895, 'epoch': 0.68} + 68%|██████████████████████████████████████████████████████▊ | 603/892 [56:29<27:10, 5.64s/it]g-point operations will not be computed-17 15:47:02,303 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 68%|██████████████████████████████████████████████████████▊ | 603/892 [56:29<27:10, 5.64s/it]g-point operations will not be computed-17 15:47:02,303 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 68%|██████████████████████████████████████████████████████▊ | 603/892 [56:29<27:10, 5.64s/it]g-point operations will not be computed-17 15:47:02,303 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 68%|███████████████████████████��██████████████████████████▊ | 604/892 [56:36<28:59, 6.04s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:47:16,292 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 68%|██████████████████████████████████████████████████████▊ | 604/892 [56:36<28:59, 6.04s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:47:16,292 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 68%|██████████████████████████████████████████████████████▊ | 604/892 [56:36<28:59, 6.04s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:47:16,292 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 68%|██████████████████████████████████████████████████████▉ | 605/892 [56:43<30:07, 6.30s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:47:16,292 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 68%|██████████████████████████████████████████████████████▉ | 605/892 [56:43<30:07, 6.30s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:47:16,292 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.8637, 'learning_rate': 0.000224234693877551, 'epoch': 0.68} +[WARNING|modeling_utils.py:388] 2022-03-17 15:47:26,656 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:47:16,292 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 68%|███████████████████████████████████████████████████████ | 606/892 [56:50<30:57, 6.49s/it]g-point operations will not be computed-17 15:47:16,292 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 68%|███████████████████████████████████████████████████████ | 606/892 [56:50<30:57, 6.49s/it]g-point operations will not be computed-17 15:47:16,292 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.6627, 'learning_rate': 0.00022346938775510205, 'epoch': 0.68} + 68%|███████████████████████████████████████████████████████ | 606/892 [56:50<30:57, 6.49s/it]g-point operations will not be computed-17 15:47:16,292 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 68%|███████████████████████████████████████████████████████ | 606/892 [56:50<30:57, 6.49s/it]g-point operations will not be computed-17 15:47:16,292 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 68%|███████████████████████████████████████████████████████ | 606/892 [56:50<30:57, 6.49s/it]g-point operations will not be computed-17 15:47:16,292 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 68%|███████████████████████████████████████████████████████ | 607/892 [56:57<31:21, 6.60s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:47:36,963 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 68%|███████████████████████████████████████████████████████ | 607/892 [56:57<31:21, 6.60s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:47:36,963 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 68%|███████████████████████████████████████████████████████ | 607/892 [56:57<31:21, 6.60s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:47:36,963 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 68%|███████████████████████████████████████████████████████▏ | 608/892 [57:03<31:30, 6.66s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:47:36,963 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 68%|███████████████████████████████████████████████████████▏ | 608/892 [57:03<31:30, 6.66s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:47:36,963 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.7518, 'learning_rate': 0.00022193877551020407, 'epoch': 0.68} +[WARNING|modeling_utils.py:388] 2022-03-17 15:47:47,081 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:47:36,963 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 68%|███████████████████████████████████████████████████████▎ | 609/892 [57:10<31:34, 6.69s/it]g-point operations will not be computed-17 15:47:36,963 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 68%|███████████████████████████████████████████████████████▎ | 609/892 [57:10<31:34, 6.69s/it]g-point operations will not be computed-17 15:47:36,963 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.653, 'learning_rate': 0.00022117346938775508, 'epoch': 0.68} + 68%|███████████████████████████████████████████████████████▎ | 609/892 [57:10<31:34, 6.69s/it]g-point operations will not be computed-17 15:47:36,963 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 68%|███████████████████████████████████████████████████████▎ | 609/892 [57:10<31:34, 6.69s/it]g-point operations will not be computed-17 15:47:36,963 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 68%|███████████████████████████████████████████████████████▎ | 609/892 [57:10<31:34, 6.69s/it]g-point operations will not be computed-17 15:47:36,963 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 68%|███████████████████████████████████████████████████████▍ | 610/892 [57:17<31:23, 6.68s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:47:57,172 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 68%|███████████████████████████████████████████████████████▍ | 610/892 [57:17<31:23, 6.68s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:47:57,172 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 68%|███████████████████████████████████████████████████████▍ | 610/892 [57:17<31:23, 6.68s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:47:57,172 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 68%|███████████████████████████████████████████████████████▍ | 611/892 [57:23<31:18, 6.68s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:47:57,172 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 68%|████████████████████��██████████████████████████████████▍ | 611/892 [57:23<31:18, 6.68s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:47:57,172 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:48:05,497 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:47:57,172 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:48:05,497 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:47:57,172 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:48:05,497 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:47:57,172 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 69%|███████████████████████████████████████████████████████▌ | 612/892 [57:30<31:10, 6.68s/it]g-point operations will not be computed-17 15:47:57,172 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 69%|███████████████████████████████████████████████████████▌ | 612/892 [57:30<31:10, 6.68s/it]g-point operations will not be computed-17 15:47:57,172 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:48:13,794 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:47:57,172 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:48:13,794 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:47:57,172 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 69%|███████████████████████████████████████████████████████▋ | 613/892 [57:37<31:00, 6.67s/it]g-point operations will not be computed-17 15:47:57,172 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 69%|███████████████████████████████████████████████████████▋ | 613/892 [57:37<31:00, 6.67s/it]g-point operations will not be computed-17 15:47:57,172 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:48:20,293 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:47:57,172 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 69%|███████████████████████████████████████████████████████▊ | 614/892 [57:43<30:38, 6.61s/it]g-point operations will not be computed-17 15:47:57,172 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 69%|███████████████████████████████████████████████████████▊ | 614/892 [57:43<30:38, 6.61s/it]g-point operations will not be computed-17 15:47:57,172 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.6016, 'learning_rate': 0.0002173469387755102, 'epoch': 0.69} + 69%|███████████████████████████████████████████████████████▊ | 614/892 [57:43<30:38, 6.61s/it]g-point operations will not be computed-17 15:47:57,172 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 69%|███████████████████████████████████████████████████████▊ | 614/892 [57:43<30:38, 6.61s/it]g-point operations will not be computed-17 15:47:57,172 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 69%|███████████████████████████████████████████████████████▊ | 614/892 [57:43<30:38, 6.61s/it]g-point operations will not be computed-17 15:47:57,172 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 69%|███████████████████████████████████████████████████████▊ | 615/892 [57:50<30:25, 6.59s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:48:30,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 69%|███████████████████████████████████████████████████████▊ | 615/892 [57:50<30:25, 6.59s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:48:30,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 69%|███████████████████████████████████████████████████████▊ | 615/892 [57:50<30:25, 6.59s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:48:30,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 69%|███████████████████████████████████████████████████████▊ | 615/892 [57:50<30:25, 6.59s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:48:30,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 69%|███████████████████████████████████████████████████████▉ | 616/892 [57:56<30:07, 6.55s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:48:30,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:48:38,164 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:48:30,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:48:38,164 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:48:30,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:48:38,164 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:48:30,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 69%|████████████████████████████████████████████████████████ | 617/892 [58:03<29:49, 6.51s/it]g-point operations will not be computed-17 15:48:30,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:48:44,549 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:48:30,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:48:44,549 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:48:30,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:48:44,549 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:48:30,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 69%|████████████████████████████████████████████████████████ | 618/892 [58:09<29:32, 6.47s/it]g-point operations will not be computed-17 15:48:30,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 69%|████████████████████████████████████████████████████████ | 618/892 [58:09<29:32, 6.47s/it]g-point operations will not be computed-17 15:48:30,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:48:52,465 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:48:30,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:48:52,465 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:48:30,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 69%|████████████████████████████████████████████████████████▏ | 619/892 [58:15<29:14, 6.43s/it]g-point operations will not be computed-17 15:48:30,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 69%|████████████████████████████████████████████████████████▏ | 619/892 [58:15<29:14, 6.43s/it]g-point operations will not be computed-17 15:48:30,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:48:58,781 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:48:30,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:48:58,781 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:48:30,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 70%|████████████████████████████████████████████████████████▎ | 620/892 [58:22<28:59, 6.40s/it]g-point operations will not be computed-17 15:48:30,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 70%|████████████████████████████████████████████████████████▎ | 620/892 [58:22<28:59, 6.40s/it]g-point operations will not be computed-17 15:48:30,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:49:05,123 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:48:30,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 70%|████████████████████████████████████████████████████████▍ | 621/892 [58:28<28:49, 6.38s/it]g-point operations will not be computed-17 15:48:30,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 70%|████████████████████████████████████████████████████████▍ | 621/892 [58:28<28:49, 6.38s/it]g-point operations will not be computed-17 15:48:30,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4912, 'learning_rate': 0.0002119897959183673, 'epoch': 0.7} +[WARNING|modeling_utils.py:388] 2022-03-17 15:49:11,354 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:48:30,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 70%|████████████████████████████████████████████████████████▍ | 622/892 [58:34<28:31, 6.34s/it]g-point operations will not be computed-17 15:48:30,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 70%|████████████████████████████████████████████████████████▍ | 622/892 [58:34<28:31, 6.34s/it]g-point operations will not be computed-17 15:48:30,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.507, 'learning_rate': 0.00021122448979591835, 'epoch': 0.7} + 70%|████████████████████████████████████████████████████████▍ | 622/892 [58:34<28:31, 6.34s/it]g-point operations will not be computed-17 15:48:30,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:49:19,145 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:48:30,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:49:19,145 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:48:30,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.6002, 'learning_rate': 0.0002104591836734694, 'epoch': 0.7} +[WARNING|modeling_utils.py:388] 2022-03-17 15:49:19,145 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:48:30,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:49:25,290 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:48:30,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:49:25,290 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:48:30,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4304, 'learning_rate': 0.0002096938775510204, 'epoch': 0.7} +[WARNING|modeling_utils.py:388] 2022-03-17 15:49:25,290 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:48:30,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:49:25,290 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:48:30,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:49:25,290 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:48:30,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 70%|████████████████████████████████████████████████████████▊ | 625/892 [58:54<29:02, 6.53s/it]g-point operations will not be computed-17 15:48:30,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:49:35,560 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:48:30,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:49:35,560 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:48:30,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:49:35,560 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:48:30,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 70%|████████████████████████████████████████████████████████▊ | 626/892 [59:00<28:24, 6.41s/it]g-point operations will not be computed-17 15:48:30,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:49:41,627 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:48:30,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:49:41,627 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:48:30,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:49:41,627 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:48:30,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 70%|████████████████████████████████████████████████████████▉ | 627/892 [59:06<27:43, 6.28s/it]g-point operations will not be computed-17 15:48:30,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:49:47,555 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:48:30,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:49:47,555 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:48:30,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:49:47,555 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:48:30,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 70%|█████████████████████████████████████████████████████████ | 628/892 [59:12<27:09, 6.17s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:49:52,024 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 70%|█████████████████████████████████████████████████████████ | 628/892 [59:12<27:09, 6.17s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:49:52,024 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 70%|█████████████████████████████████████████████████████████ | 628/892 [59:12<27:09, 6.17s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:49:52,024 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 70%|█████████████████████████████████████████████████████████ | 628/892 [59:12<27:09, 6.17s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:49:52,024 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 71%|█████████████████████████████████████████████████████████ | 629/892 [59:18<26:45, 6.10s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:49:57,970 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 71%|█████████████████████████████████████████████████████████ | 629/892 [59:18<26:45, 6.10s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:49:57,970 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:50:02,291 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:49:57,970 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:50:02,291 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:49:57,970 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.6577, 'learning_rate': 0.0002051020408163265, 'epoch': 0.71} +[WARNING|modeling_utils.py:388] 2022-03-17 15:50:02,291 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:49:57,970 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:50:08,178 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:49:57,970 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:50:08,178 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:49:57,970 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.5518, 'learning_rate': 0.00020433673469387754, 'epoch': 0.71} +[WARNING|modeling_utils.py:388] 2022-03-17 15:50:12,489 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:49:57,970 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 71%|█████████████████████████████████████████████████████████▍ | 632/892 [59:35<25:35, 5.91s/it]g-point operations will not be computed-17 15:49:57,970 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 71%|█████████████████████████████████████████████████████████▍ | 632/892 [59:35<25:35, 5.91s/it]g-point operations will not be computed-17 15:49:57,970 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3805, 'learning_rate': 0.00020357142857142856, 'epoch': 0.71} +[WARNING|modeling_utils.py:388] 2022-03-17 15:50:18,109 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:49:57,970 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 71%|█████████████████████████████████████████████████████████▍ | 633/892 [59:41<25:05, 5.81s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:50:20,929 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 71%|█████████████████████████████████████████████████████████▍ | 633/892 [59:41<25:05, 5.81s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:50:20,929 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.5106, 'learning_rate': 0.00020280612244897957, 'epoch': 0.71} + 71%|█████████████████████████████████████████████████████████▍ | 633/892 [59:41<25:05, 5.81s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:50:20,929 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 71%|█████████████████████████████████████████████████████████▍ | 633/892 [59:41<25:05, 5.81s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:50:20,929 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 71%|█████████████████████████████████████████████████████████▌ | 634/892 [59:46<24:43, 5.75s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:50:26,549 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 71%|█████████████████████████████████████████████████████████▌ | 634/892 [59:46<24:43, 5.75s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:50:26,549 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:50:30,573 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:50:26,549 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:50:30,573 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:50:26,549 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.5212, 'learning_rate': 0.00020127551020408162, 'epoch': 0.71} +[WARNING|modeling_utils.py:388] 2022-03-17 15:50:34,684 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:50:26,549 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 71%|███████████████��█████████████████████████████████████████▊ | 636/892 [59:57<23:51, 5.59s/it]g-point operations will not be computed-17 15:50:26,549 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 71%|█████████████████████████████████████████████████████████▊ | 636/892 [59:57<23:51, 5.59s/it]g-point operations will not be computed-17 15:50:26,549 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:50:38,679 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:50:26,549 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:50:38,679 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:50:26,549 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:50:38,679 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:50:26,549 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 71%|████████████████████████████████████████████████████████▍ | 637/892 [1:00:03<23:22, 5.50s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:50:42,640 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:50:45,215 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:50:42,640 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 72%|████████████████████████████████████████████████████████▌ | 638/892 [1:00:08<22:56, 5.42s/it]g-point operations will not be computed-17 15:50:42,640 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 72%|████████████████████████████████████████████████████████▌ | 638/892 [1:00:08<22:56, 5.42s/it]g-point operations will not be computed-17 15:50:42,640 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:50:49,076 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:50:42,640 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:50:49,076 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:50:42,640 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:50:49,076 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:50:42,640 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 72%|████████████████████████████████████████████████████████▌ | 639/892 [1:00:13<22:21, 5.30s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:50:52,835 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:50:55,218 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:50:52,835 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 72%|████████████████████████████████████████████████████████▋ | 640/892 [1:00:18<21:41, 5.17s/it]g-point operations will not be computed-17 15:50:52,835 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 72%|████████████████████████████████████████████████████████▋ | 640/892 [1:00:18<21:41, 5.17s/it]g-point operations will not be computed-17 15:50:52,835 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:50:58,773 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:50:52,835 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:51:00,999 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:50:52,835 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:51:00,999 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:50:52,835 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:51:03,287 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:50:52,835 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:51:05,339 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:50:52,835 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:51:05,339 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:50:52,835 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:51:07,400 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:50:52,835 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:51:09,216 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:50:52,835 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:51:09,216 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:50:52,835 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:51:11,082 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:50:52,835 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:51:12,830 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:50:52,835 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:51:12,830 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:50:52,835 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:51:14,569 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:50:52,835 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:51:14,569 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:50:52,835 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:51:17,741 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:50:52,835 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:51:19,151 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:50:52,835 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:51:19,151 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:50:52,835 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:51:21,827 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:50:52,835 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:51:21,827 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:50:52,835 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:51:23,104 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:50:52,835 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:51:23,104 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:50:52,835 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:51:25,260 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:50:52,835 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:51:25,260 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:50:52,835 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:51:27,055 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:50:52,835 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:51:28,596 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:50:52,835 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:51:28,596 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:50:52,835 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.7388, 'learning_rate': 0.00018979591836734694, 'epoch': 0.73} +[WARNING|modeling_utils.py:388] 2022-03-17 15:51:32,737 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:50:52,835 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:51:32,737 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:50:52,835 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:51:36,333 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:50:52,835 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:51:36,333 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:50:52,835 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:51:39,950 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:50:52,835 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:51:39,950 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:50:52,835 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:51:43,456 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:50:52,835 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:51:43,456 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:50:52,835 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.492, 'learning_rate': 0.00018826530612244896, 'epoch': 0.73} +[WARNING|modeling_utils.py:388] 2022-03-17 15:51:47,017 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:50:52,835 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:51:47,017 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:50:52,835 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:51:47,017 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:50:52,835 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 73%|█████████████████████████████████████████████████████████▊ | 653/892 [1:01:12<22:34, 5.67s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:51:52,375 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 73%|█████████████████████████████████████████████████████████▊ | 653/892 [1:01:12<22:34, 5.67s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:51:52,375 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 73%|█████████████████████████████████████████████████████████▊ | 653/892 [1:01:12<22:34, 5.67s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:51:52,375 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 73%|█████████████████████████████████████████████████████████▉ | 654/892 [1:01:19<24:03, 6.06s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:51:52,375 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 73%|█████████████████████████████████████████████████████████▉ | 654/892 [1:01:19<24:03, 6.06s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:51:52,375 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.0356, 'learning_rate': 0.00018673469387755102, 'epoch': 0.73} +[WARNING|modeling_utils.py:388] 2022-03-17 15:52:02,759 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:51:52,375 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:52:02,759 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:51:52,375 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 73%|██████████████████████████████████████████████████████████ | 655/892 [1:01:26<24:59, 6.33s/it]g-point operations will not be computed-17 15:51:52,375 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 73%|██████████████████████████████████████████████████████████ | 655/892 [1:01:26<24:59, 6.33s/it]g-point operations will not be computed-17 15:51:52,375 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 73%|██████████████████████████████████████████████████████████ | 655/892 [1:01:26<24:59, 6.33s/it]g-point operations will not be computed-17 15:51:52,375 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 73%|██████████████████████████████████████████████████████████ | 655/892 [1:01:26<24:59, 6.33s/it]g-point operations will not be computed-17 15:51:52,375 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 74%|██████████████████████████████████████████████████████████ | 656/892 [1:01:33<25:25, 6.46s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:52:13,028 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 74%|██████████████████████████████████████████████████████████ | 656/892 [1:01:33<25:25, 6.46s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:52:13,028 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.7763, 'learning_rate': 0.00018520408163265304, 'epoch': 0.74} + 74%|██████████████████████████████████████████████████████████ | 656/892 [1:01:33<25:25, 6.46s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:52:13,028 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 74%|██████████████████████████████████████████████████████████▏ | 657/892 [1:01:39<25:43, 6.57s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:52:13,028 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 74%|██████████████████████████████████████████████████████████▏ | 657/892 [1:01:39<25:43, 6.57s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:52:13,028 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.5477, 'learning_rate': 0.00018443877551020405, 'epoch': 0.74} + 74%|██████████████████████████████████████████████████████████▏ | 657/892 [1:01:39<25:43, 6.57s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:52:13,028 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:52:24,879 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:52:13,028 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:52:24,879 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:52:13,028 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.8061, 'learning_rate': 0.0001836734693877551, 'epoch': 0.74} +[WARNING|modeling_utils.py:388] 2022-03-17 15:52:24,879 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:52:13,028 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:52:24,879 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:52:13,028 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:52:24,879 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:52:13,028 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 74%|██████████████████████████████████████████████████████████▎ | 659/892 [1:01:53<25:57, 6.68s/it]g-point operations will not be computed-17 15:52:13,028 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:52:35,063 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:52:13,028 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:52:35,063 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:52:13,028 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:52:35,063 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:52:13,028 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 74%|██████████████████████████████████████████████████████████▍ | 660/892 [1:02:00<25:51, 6.69s/it]g-point operations will not be computed-17 15:52:13,028 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 74%|██████████████████████████████████████████████████████████▍ | 660/892 [1:02:00<25:51, 6.69s/it]g-point operations will not be computed-17 15:52:13,028 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:52:43,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:52:13,028 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:52:43,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:52:13,028 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 74%|██████████████████████████████████████████████████████████▌ | 661/892 [1:02:06<25:46, 6.69s/it]g-point operations will not be computed-17 15:52:13,028 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 74%|██████████████████████████████████████████████████████████▌ | 661/892 [1:02:06<25:46, 6.69s/it]g-point operations will not be computed-17 15:52:13,028 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 74%|██████████████████████████████████████████████████████████▌ | 661/892 [1:02:06<25:46, 6.69s/it]g-point operations will not be computed-17 15:52:13,028 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:52:51,756 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:52:13,028 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:52:51,756 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:52:13,028 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3821, 'learning_rate': 0.00018061224489795917, 'epoch': 0.74} +[WARNING|modeling_utils.py:388] 2022-03-17 15:52:51,756 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:52:13,028 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:52:51,756 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:52:13,028 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:52:51,756 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:52:13,028 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 74%|██████████████████████████████████████████████████████████▋ | 663/892 [1:02:20<25:28, 6.67s/it]g-point operations will not be computed-17 15:52:13,028 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:53:01,731 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:52:13,028 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:53:01,731 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:52:13,028 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:53:01,731 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:52:13,028 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 74%|██████████████████████��███████████████████████████████████▊ | 664/892 [1:02:26<25:14, 6.64s/it]g-point operations will not be computed-17 15:52:13,028 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:53:08,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:52:13,028 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:53:08,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:52:13,028 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:53:08,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:52:13,028 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 75%|██████████████████████████████████████████████████████████▉ | 665/892 [1:02:33<24:58, 6.60s/it]g-point operations will not be computed-17 15:52:13,028 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 75%|██████████████████████████████████████████████████████████▉ | 665/892 [1:02:33<24:58, 6.60s/it]g-point operations will not be computed-17 15:52:13,028 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 75%|██████████████████████████████████████████████████████████▉ | 665/892 [1:02:33<24:58, 6.60s/it]g-point operations will not be computed-17 15:52:13,028 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 75%|██████████████████████████████████████████████████████████▉ | 665/892 [1:02:33<24:58, 6.60s/it]g-point operations will not be computed-17 15:52:13,028 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:53:17,922 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:52:13,028 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:53:17,922 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:52:13,028 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:53:22,779 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:52:13,028 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 75%|███████████████████████████████████████████████████████████ | 667/892 [1:02:46<24:28, 6.53s/it]g-point operations will not be computed-17 15:52:13,028 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 75%|███████████████████████████████████████████████████████████ | 667/892 [1:02:46<24:28, 6.53s/it]g-point operations will not be computed-17 15:52:13,028 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4584, 'learning_rate': 0.00017678571428571428, 'epoch': 0.75} + 75%|███████████████████████████████████████████████████████████ | 667/892 [1:02:46<24:28, 6.53s/it]g-point operations will not be computed-17 15:52:13,028 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:53:30,777 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:52:13,028 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:53:30,777 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:52:13,028 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.5485, 'learning_rate': 0.0001760204081632653, 'epoch': 0.75} +[WARNING|modeling_utils.py:388] 2022-03-17 15:53:30,777 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:52:13,028 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:53:37,128 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:52:13,028 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:53:37,128 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:52:13,028 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.6394, 'learning_rate': 0.0001752551020408163, 'epoch': 0.75} +[WARNING|modeling_utils.py:388] 2022-03-17 15:53:37,128 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:52:13,028 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:53:37,128 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:52:13,028 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:53:37,128 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:52:13,028 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 75%|███████████████████████████████████████████████████████████▎ | 670/892 [1:03:05<23:42, 6.41s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:53:45,093 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 75%|███████████████████████████████████████████████████████████▎ | 670/892 [1:03:05<23:42, 6.41s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:53:45,093 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 75%|███████████████████████████████████████████████████████████▎ | 670/892 [1:03:05<23:42, 6.41s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:53:45,093 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 75%|███████████████████████████████████████████████████████████▎ | 670/892 [1:03:05<23:42, 6.41s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:53:45,093 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 75%|███████████████████████████████████████████████████████████▍ | 671/892 [1:03:11<23:26, 6.36s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:53:45,093 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:53:52,860 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:53:45,093 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:53:52,860 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:53:45,093 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:53:52,860 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:53:45,093 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 75%|███████████████████████████████████████████████████████████▌ | 672/892 [1:03:17<23:12, 6.33s/it]g-point operations will not be computed-17 15:53:45,093 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:53:59,135 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:53:45,093 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:53:59,135 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:53:45,093 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:53:59,135 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:53:45,093 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 75%|███████████████████████████████████████████████████████████▌ | 673/892 [1:03:24<23:00, 6.31s/it]g-point operations will not be computed-17 15:53:45,093 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:54:05,374 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:53:45,093 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:54:05,374 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:53:45,093 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:54:05,374 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:53:45,093 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 76%|███████████████████████████████████████████████████████████▋ | 674/892 [1:03:30<22:48, 6.28s/it]g-point operations will not be computed-17 15:53:45,093 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:54:11,543 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:53:45,093 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:54:11,543 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:53:45,093 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 76%|███████████████████████████████████████████████████████████▊ | 675/892 [1:03:37<23:39, 6.54s/it]g-point operations will not be computed-17 15:53:45,093 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 76%|███████████████████████████████████████████████████████████▊ | 675/892 [1:03:37<23:39, 6.54s/it]g-point operations will not be computed-17 15:53:45,093 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3872, 'learning_rate': 0.00017066326530612244, 'epoch': 0.76} + 76%|███████████████████████████████████████████████████████████▊ | 675/892 [1:03:37<23:39, 6.54s/it]g-point operations will not be computed-17 15:53:45,093 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:54:21,639 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:53:45,093 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:54:21,639 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:53:45,093 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4303, 'learning_rate': 0.00016989795918367345, 'epoch': 0.76} +[WARNING|modeling_utils.py:388] 2022-03-17 15:54:26,176 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:53:45,093 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 76%|███████████████████████████████████████████████████████████▉ | 677/892 [1:03:49<22:31, 6.29s/it]g-point operations will not be computed-17 15:53:45,093 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 76%|███████████████████████████████████████████████████████████▉ | 677/892 [1:03:49<22:31, 6.29s/it]g-point operations will not be computed-17 15:53:45,093 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3736, 'learning_rate': 0.0001691326530612245, 'epoch': 0.76} +[WARNING|modeling_utils.py:388] 2022-03-17 15:54:32,181 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:53:45,093 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 76%|████████████████████████████████████████████████████████████ | 678/892 [1:03:55<22:06, 6.20s/it]g-point operations will not be computed-17 15:53:45,093 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 76%|████████████████████████████████████████████████████████████ | 678/892 [1:03:55<22:06, 6.20s/it]g-point operations will not be computed-17 15:53:45,093 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1379, 'learning_rate': 0.00016836734693877547, 'epoch': 0.76} +[WARNING|modeling_utils.py:388] 2022-03-17 15:54:38,120 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:53:45,093 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 76%|████████████████████████████████████████████████████████████▏ | 679/892 [1:04:01<21:43, 6.12s/it]g-point operations will not be computed-17 15:53:45,093 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 76%|████████████████████████████████████████████████████████████▏ | 679/892 [1:04:01<21:43, 6.12s/it]g-point operations will not be computed-17 15:53:45,093 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:54:42,580 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:53:45,093 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:54:42,580 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:53:45,093 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:54:42,580 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:53:45,093 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 76%|████████████████████████████████████████████████████████████▏ | 680/892 [1:04:07<21:18, 6.03s/it]g-point operations will not be computed-17 15:53:45,093 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:54:48,398 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:53:45,093 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:54:48,398 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:53:45,093 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:54:48,398 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:53:45,093 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 76%|████████████████████████████████████████████████████████████▎ | 681/892 [1:04:13<21:01, 5.98s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:54:52,798 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 76%|████████████████████████████████████████████████████████████▎ | 681/892 [1:04:13<21:01, 5.98s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:54:52,798 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:54:57,017 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:54:52,798 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:54:57,017 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:54:52,798 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2144, 'learning_rate': 0.00016530612244897955, 'epoch': 0.76} +[WARNING|modeling_utils.py:388] 2022-03-17 15:54:57,017 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:54:52,798 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:55:02,737 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:54:52,798 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:55:02,737 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:54:52,798 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3885, 'learning_rate': 0.0001645408163265306, 'epoch': 0.77} +[WARNING|modeling_utils.py:388] 2022-03-17 15:55:07,029 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:54:52,798 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 77%|████████████████████████████████████████████████████████████▌ | 684/892 [1:04:30<20:03, 5.78s/it]g-point operations will not be computed-17 15:54:52,798 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 77%|████████████████████████████████████████████████████████████▌ | 684/892 [1:04:30<20:03, 5.78s/it]g-point operations will not be computed-17 15:54:52,798 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:55:11,112 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:54:52,798 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:55:11,112 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:54:52,798 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:55:11,112 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:54:52,798 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 77%|████████████████████████████████████████████████████████████▋ | 685/892 [1:04:35<19:36, 5.69s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:55:15,229 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 77%|████████████████████████████████████████████████████████████▋ | 685/892 [1:04:35<19:36, 5.69s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:55:15,229 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:55:19,219 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:55:15,229 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:55:19,219 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:55:15,229 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3419, 'learning_rate': 0.00016224489795918368, 'epoch': 0.77} +[WARNING|modeling_utils.py:388] 2022-03-17 15:55:23,220 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:55:15,229 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 77%|████████████████████████████████████████████████████████████▊ | 687/892 [1:04:46<18:50, 5.51s/it]g-point operations will not be computed-17 15:55:15,229 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 77%|████████████████████████████████████████████████████████████▊ | 687/892 [1:04:46<18:50, 5.51s/it]g-point operations will not be computed-17 15:55:15,229 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:55:27,191 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:55:15,229 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:55:27,191 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:55:15,229 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:55:27,191 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:55:15,229 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 77%|████████████████████████████████████████████████████████████▉ | 688/892 [1:04:51<18:26, 5.42s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:55:31,074 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:55:33,551 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:55:31,074 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 77%|█████████████████████████████████████████████████████████████ | 689/892 [1:04:56<17:57, 5.31s/it]g-point operations will not be computed-17 15:55:31,074 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 77%|█████████████████████████████████████████████████████████████ | 689/892 [1:04:56<17:57, 5.31s/it]g-point operations will not be computed-17 15:55:31,074 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:55:37,244 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:55:31,074 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:55:39,581 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:55:31,074 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:55:39,581 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:55:31,074 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.5397, 'learning_rate': 0.00015918367346938776, 'epoch': 0.77} +[WARNING|modeling_utils.py:388] 2022-03-17 15:55:43,083 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:55:31,074 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:55:43,083 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:55:31,074 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 77%|█████████████████████████████████████████████████████████████▏ | 691/892 [1:05:06<16:44, 5.00s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:55:45,423 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:55:47,533 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:55:45,423 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 78%|█████████████████████████████████████████████████████████████▎ | 692/892 [1:05:10<15:59, 4.80s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:55:49,626 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 78%|█████████████████████████████████████████████████████████████▎ | 692/892 [1:05:10<15:59, 4.80s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:55:49,626 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:55:51,532 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:55:49,626 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:55:51,532 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:55:49,626 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 78%|█████████████████████████████████████████████████████████████▍ | 693/892 [1:05:14<15:01, 4.53s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:55:53,434 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 78%|█████████████████████████████████████████████████████████████▍ | 694/892 [1:05:17<13:56, 4.23s/it]g-point operations will not be computed-17 15:55:53,434 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 78%|█████████████████████████████████████████████████████████████▍ | 694/892 [1:05:17<13:56, 4.23s/it]g-point operations will not be computed-17 15:55:53,434 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 78%|█████████████████████████████████████████████████████████████▍ | 694/892 [1:05:17<13:56, 4.23s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:55:56,862 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 78%|█████████████████████████████████████████████████████████████▌ | 695/892 [1:05:21<12:52, 3.92s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:55:59,997 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 78%|█████████████████████████████████████████████████��███████████▌ | 695/892 [1:05:21<12:52, 3.92s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:55:59,997 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 78%|█████████████████████████████████████████████████████████████▋ | 696/892 [1:05:23<11:46, 3.61s/it]g-point operations will not be computed-17 15:55:59,997 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 78%|█████████████████████████████████████████████████████████████▋ | 696/892 [1:05:23<11:46, 3.61s/it]g-point operations will not be computed-17 15:55:59,997 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:56:04,037 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:56:02,784 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:56:04,037 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:56:02,784 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 78%|█████████████████████████████████████████████████████████████▋ | 697/892 [1:05:26<10:43, 3.30s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:56:05,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:56:08,320 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:56:07,423 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:56:08,320 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:56:07,423 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.7754, 'learning_rate': 0.0001530612244897959, 'epoch': 0.78} +[WARNING|modeling_utils.py:388] 2022-03-17 15:56:10,047 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:56:09,269 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 78%|█████████████████████████████████████████████████████████████▉ | 700/892 [1:05:33<08:18, 2.60s/it]g-point operations will not be computed-17 15:56:09,269 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 78%|█████████████████████████████████████████████████████████████▉ | 700/892 [1:05:33<08:18, 2.60s/it]g-point operations will not be computed-17 15:56:09,269 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 78%|█████████████████████████████████████████████████████████████▉ | 700/892 [1:05:33<08:18, 2.60s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:56:13,206 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 78%|█████████████████████████████████████████████████████████████▉ | 700/892 [1:05:33<08:18, 2.60s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:56:13,206 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:56:16,806 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:56:13,206 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:56:16,806 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:56:13,206 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 79%|██████████████████████████████████████████████████████████████ | 701/892 [1:05:40<12:50, 4.04s/it]g-point operations will not be computed-17 15:56:13,206 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 79%|██████████████████████████████████████████████████████████████ | 701/892 [1:05:40<12:50, 4.04s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:56:20,428 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:56:23,968 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:56:20,428 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 79%|██████████████████████████████████████████████████████████████▏ | 702/892 [1:05:47<15:44, 4.97s/it]g-point operations will not be computed-17 15:56:20,428 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 79%|██████████████████████████████████████████████████████████████▏ | 702/892 [1:05:47<15:44, 4.97s/it]g-point operations will not be computed-17 15:56:20,428 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 79%|██████████████████████████████████████████████████████████████▏ | 702/892 [1:05:47<15:44, 4.97s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:56:27,568 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 79%|██████████████████████████████████████████████████████████████▏ | 702/892 [1:05:47<15:44, 4.97s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:56:27,568 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:56:31,048 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:56:27,568 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:56:31,048 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:56:27,568 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 79%|██████████████████████████████████████████████████████████████▎ | 703/892 [1:05:54<17:31, 5.57s/it]g-point operations will not be computed-17 15:56:27,568 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:56:36,208 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:56:27,568 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:56:36,208 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:56:27,568 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 79%|██████████████████████████████████████████████████████████████▎ | 704/892 [1:06:01<18:41, 5.97s/it]g-point operations will not be computed-17 15:56:27,568 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 79%|██████████████████████████████████████████████████████████████▎ | 704/892 [1:06:01<18:41, 5.97s/it]g-point operations will not be computed-17 15:56:27,568 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.8596, 'learning_rate': 0.00014846938775510204, 'epoch': 0.79} + 79%|██████████████████████████████████████████████████████████████▎ | 704/892 [1:06:01<18:41, 5.97s/it]g-point operations will not be computed-17 15:56:27,568 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:56:46,563 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:56:27,568 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:56:46,563 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:56:27,568 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.7869, 'learning_rate': 0.00014770408163265305, 'epoch': 0.79} +[WARNING|modeling_utils.py:388] 2022-03-17 15:56:46,563 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:56:27,568 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:56:46,563 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:56:27,568 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:56:46,563 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:56:27,568 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 79%|██████████████████████████████████████████████████████████████▌ | 706/892 [1:06:15<19:55, 6.43s/it]g-point operations will not be computed-17 15:56:27,568 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 79%|██████████████████████████████████████████████████████████████▌ | 706/892 [1:06:15<19:55, 6.43s/it]g-point operations will not be computed-17 15:56:27,568 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:56:58,561 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:56:27,568 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 79%|██████████████████████████████████████████████████████████████▌ | 707/892 [1:06:22<20:19, 6.59s/it]g-point operations will not be computed-17 15:56:27,568 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 79%|██████████████████████████████████████████████████████████████▌ | 707/892 [1:06:22<20:19, 6.59s/it]g-point operations will not be computed-17 15:56:27,568 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.759, 'learning_rate': 0.0001461734693877551, 'epoch': 0.79} + 79%|██████████████████████████████████████████████████████████████▌ | 707/892 [1:06:22<20:19, 6.59s/it]g-point operations will not be computed-17 15:56:27,568 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:57:07,139 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:56:27,568 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:57:07,139 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:56:27,568 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.7732, 'learning_rate': 0.00014540816326530611, 'epoch': 0.79} +[WARNING|modeling_utils.py:388] 2022-03-17 15:57:07,139 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:56:27,568 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:57:07,139 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:56:27,568 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 79%|██████████████████████████████████████████████████████████████▊ | 709/892 [1:06:35<20:25, 6.70s/it]g-point operations will not be computed-17 15:56:27,568 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 79%|██████████████████████████████████████████████████████████████▊ | 709/892 [1:06:35<20:25, 6.70s/it]g-point operations will not be computed-17 15:56:27,568 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.6, 'learning_rate': 0.00014464285714285713, 'epoch': 0.79} +[WARNING|modeling_utils.py:388] 2022-03-17 15:57:18,975 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:56:27,568 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 80%|██████████████████████████████████████████████████████████████▉ | 710/892 [1:06:42<20:17, 6.69s/it]g-point operations will not be computed-17 15:56:27,568 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 80%|██████████████████████████████████████████████████████████████▉ | 710/892 [1:06:42<20:17, 6.69s/it]g-point operations will not be computed-17 15:56:27,568 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.5738, 'learning_rate': 0.00014387755102040814, 'epoch': 0.8} + 80%|██████████████████████████████████████████████████████████████▉ | 710/892 [1:06:42<20:17, 6.69s/it]g-point operations will not be computed-17 15:56:27,568 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:57:27,201 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:56:27,568 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:57:27,201 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:56:27,568 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4732, 'learning_rate': 0.00014311224489795918, 'epoch': 0.8} +[WARNING|modeling_utils.py:388] 2022-03-17 15:57:27,201 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:56:27,568 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:57:27,201 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:56:27,568 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:57:27,201 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:56:27,568 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 80%|███████████████████████████████████████████████████████████████ | 712/892 [1:06:55<19:54, 6.63s/it]g-point operations will not be computed-17 15:56:27,568 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:57:37,169 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:56:27,568 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:57:37,169 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:56:27,568 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 80%|███████████████████████████████████████████████████████████████▏ | 713/892 [1:07:02<19:44, 6.62s/it]g-point operations will not be computed-17 15:56:27,568 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 80%|███████████████████████████████████████████████████████████████▏ | 713/892 [1:07:02<19:44, 6.62s/it]g-point operations will not be computed-17 15:56:27,568 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:57:43,728 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:56:27,568 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:57:43,728 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:56:27,568 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 80%|███████████████████████████████████████████████████████████████▏ | 714/892 [1:07:08<19:36, 6.61s/it]g-point operations will not be computed-17 15:56:27,568 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 80%|███████████████████████████████████████████████████████████████▏ | 714/892 [1:07:08<19:36, 6.61s/it]g-point operations will not be computed-17 15:56:27,568 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.6063, 'learning_rate': 0.00014081632653061224, 'epoch': 0.8} +[WARNING|modeling_utils.py:388] 2022-03-17 15:57:51,911 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:56:27,568 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 80%|███████████████████████████████████████████████████████████████▎ | 715/892 [1:07:15<19:25, 6.59s/it]g-point operations will not be computed-17 15:56:27,568 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 80%|███████████████████████████████████████████████████████████████▎ | 715/892 [1:07:15<19:25, 6.59s/it]g-point operations will not be computed-17 15:56:27,568 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.5329, 'learning_rate': 0.00014005102040816326, 'epoch': 0.8} +[WARNING|modeling_utils.py:388] 2022-03-17 15:57:58,304 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:56:27,568 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 80%|███████████████████████████████████████████████████████████████▍ | 716/892 [1:07:21<19:09, 6.53s/it]g-point operations will not be computed-17 15:56:27,568 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 80%|███████████████████████████████████████████████████████████████▍ | 716/892 [1:07:21<19:09, 6.53s/it]g-point operations will not be computed-17 15:56:27,568 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3883, 'learning_rate': 0.00013928571428571427, 'epoch': 0.8} + 80%|███████████████████████████████████████████████████████████████▍ | 716/892 [1:07:21<19:09, 6.53s/it]g-point operations will not be computed-17 15:56:27,568 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 80%|███████████████████████████████████████████████████████████████▍ | 716/892 [1:07:21<19:09, 6.53s/it]g-point operations will not be computed-17 15:56:27,568 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 80%|███████████████████████████████████████████████████████████████▍ | 716/892 [1:07:21<19:09, 6.53s/it]g-point operations will not be computed-17 15:56:27,568 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 80%|███████████████████████████████████████████████████████████████▌ | 717/892 [1:07:28<18:56, 6.49s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:58:07,943 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 80%|███████████████████████████████████████████████████████████████▌ | 717/892 [1:07:28<18:56, 6.49s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:58:07,943 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 80%|███████████████████████████████████████████████████████████████▌ | 717/892 [1:07:28<18:56, 6.49s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:58:07,943 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 80%|███████████████████████████████████████████████████████████████▌ | 717/892 [1:07:28<18:56, 6.49s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:58:07,943 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 80%|███████████████████████████████████████████████████████████████▌ | 718/892 [1:07:34<18:42, 6.45s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:58:14,292 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 80%|███████████████████████████████████████████████████████████████▌ | 718/892 [1:07:34<18:42, 6.45s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:58:14,292 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 80%|███████████████████████████████████████████████████████████████▌ | 718/892 [1:07:34<18:42, 6.45s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:58:14,292 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 80%|███████████████████████████████████████████████████████████████▌ | 718/892 [1:07:34<18:42, 6.45s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:58:14,292 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 81%|███████████████████████████████████████████████████████████████▋ | 719/892 [1:07:40<18:29, 6.41s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:58:20,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 81%|███████████████████████████████████████████████████████████████▋ | 719/892 [1:07:40<18:29, 6.41s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:58:20,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 81%|██████████████████████████████████████████████��████████████████▋ | 719/892 [1:07:40<18:29, 6.41s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:58:20,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 81%|███████████████████████████████████████████████████████████████▊ | 720/892 [1:07:47<18:17, 6.38s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:58:20,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 81%|███████████████████████████████████████████████████████████████▊ | 720/892 [1:07:47<18:17, 6.38s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:58:20,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:58:28,471 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:58:20,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:58:28,471 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:58:20,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 81%|███████████████████████████████████████████████████████████████▊ | 721/892 [1:07:53<18:07, 6.36s/it]g-point operations will not be computed-17 15:58:20,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 81%|███████████████████████████████████████████████████████████████▊ | 721/892 [1:07:53<18:07, 6.36s/it]g-point operations will not be computed-17 15:58:20,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3025, 'learning_rate': 0.00013545918367346936, 'epoch': 0.81} +[WARNING|modeling_utils.py:388] 2022-03-17 15:58:36,391 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:58:20,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 81%|███████████████████████████████████████████████████████████████▉ | 722/892 [1:07:59<17:58, 6.34s/it]g-point operations will not be computed-17 15:58:20,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 81%|███████████████████████████████████████████████████████████████▉ | 722/892 [1:07:59<17:58, 6.34s/it]g-point operations will not be computed-17 15:58:20,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:58:41,059 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:58:20,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:58:41,059 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:58:20,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 81%|████████████████████████████████████████████████████████████████ | 723/892 [1:08:06<17:47, 6.32s/it]g-point operations will not be computed-17 15:58:20,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 81%|████████████████████████████████████████████████████████████████ | 723/892 [1:08:06<17:47, 6.32s/it]g-point operations will not be computed-17 15:58:20,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:58:47,291 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:58:20,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:58:47,291 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:58:20,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 81%|████████████████████████████████████████████████████████████████ | 724/892 [1:08:12<17:30, 6.25s/it]g-point operations will not be computed-17 15:58:20,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 81%|████████████████████████████████████████████████████████████████ | 724/892 [1:08:12<17:30, 6.25s/it]g-point operations will not be computed-17 15:58:20,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:58:53,404 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:58:20,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:58:53,404 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:58:20,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 81%|████████████████████████████████████████████████████████████████▏ | 725/892 [1:08:19<18:08, 6.52s/it]g-point operations will not be computed-17 15:58:20,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 81%|████████████████████████████████████████████████████████████████▏ | 725/892 [1:08:19<18:08, 6.52s/it]g-point operations will not be computed-17 15:58:20,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.361, 'learning_rate': 0.00013239795918367346, 'epoch': 0.81} + 81%|████████████████████████████████████████████████████████████████▏ | 725/892 [1:08:19<18:08, 6.52s/it]g-point operations will not be computed-17 15:58:20,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 81%|████████████████████████████████████████████████████████████████▏ | 725/892 [1:08:19<18:08, 6.52s/it]g-point operations will not be computed-17 15:58:20,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:59:03,591 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:58:20,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:59:03,591 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:58:20,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:59:03,591 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:58:20,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:59:03,591 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:58:20,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:59:09,645 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:58:20,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:59:09,645 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:58:20,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:59:14,118 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:58:20,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:59:14,118 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:58:20,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 82%|████████████████████████████████████████████████████████████████▍ | 728/892 [1:08:37<16:56, 6.20s/it]g-point operations will not be computed-17 15:58:20,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 82%|████████████████████████████████████████████████████████████████▍ | 728/892 [1:08:37<16:56, 6.20s/it]g-point operations will not be computed-17 15:58:20,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:59:19,949 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:58:20,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:59:19,949 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:58:20,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 82%|████████████████████████████████████████████████████████████████▌ | 729/892 [1:08:43<16:31, 6.08s/it]g-point operations will not be computed-17 15:58:20,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:59:24,324 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:58:20,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:59:24,324 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:58:20,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:59:24,324 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:58:20,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 82%|████████████████████████████████████████████████████████████████▋ | 730/892 [1:08:48<16:08, 5.98s/it]g-point operations will not be computed-17 15:58:20,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:59:30,005 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:58:20,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:59:30,005 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:58:20,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:59:30,005 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:58:20,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 82%|████████████████████████████████████████████████████████████████▋ | 731/892 [1:08:54<15:49, 5.90s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:59:34,335 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 82%|███████████████████████████████████████████���████████████████████▋ | 731/892 [1:08:54<15:49, 5.90s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:59:34,335 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:59:38,525 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:59:34,335 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:59:38,525 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:59:34,335 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3405, 'learning_rate': 0.0001270408163265306, 'epoch': 0.82} +[WARNING|modeling_utils.py:388] 2022-03-17 15:59:42,757 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:59:34,335 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:59:42,757 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:59:34,335 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 82%|████████████████████████████████████████████████████████████████▉ | 733/892 [1:09:05<15:15, 5.76s/it]g-point operations will not be computed-17 15:59:34,335 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:59:46,842 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:59:34,335 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:59:46,842 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:59:34,335 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:59:46,842 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:59:34,335 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 82%|█████████████████████████████████████████████████████████████████ | 734/892 [1:09:11<14:50, 5.64s/it][WARNING|modeling_utils.py:388] 2022-03-17 15:59:50,841 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:59:53,439 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:59:50,841 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 82%|█████████████████████████████████████████████████████████████████ | 735/892 [1:09:16<14:28, 5.53s/it]g-point operations will not be computed-17 15:59:50,841 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 82%|█████████████████████████████████████████████████████████████████ | 735/892 [1:09:16<14:28, 5.53s/it]g-point operations will not be computed-17 15:59:50,841 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:59:57,416 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:59:50,841 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:59:57,416 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:59:50,841 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 15:59:57,416 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 15:59:50,841 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 83%|██████████���██████████████████████████████████████████████████████▏ | 736/892 [1:09:21<14:09, 5.45s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:00:01,330 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 83%|█████████████████████████████████████████████████████████████████▏ | 736/892 [1:09:21<14:09, 5.45s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:00:01,330 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:00:05,144 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:00:01,330 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:00:05,144 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:00:01,330 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3069, 'learning_rate': 0.0001232142857142857, 'epoch': 0.83} +[WARNING|modeling_utils.py:388] 2022-03-17 16:00:08,912 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:00:01,330 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:00:08,912 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:00:01,330 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 83%|█████████████████████████████████████████████████████████████████▎ | 738/892 [1:09:31<13:26, 5.24s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:00:11,379 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 83%|█████████████████████████████████████████████████████████████████▎ | 738/892 [1:09:31<13:26, 5.24s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:00:11,379 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:00:14,878 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:00:11,379 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:00:14,878 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:00:11,379 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:00:17,218 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:00:11,379 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:00:19,452 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:00:11,379 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:00:19,452 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:00:11,379 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:00:21,728 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:00:11,379 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:00:23,846 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:00:11,379 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:00:23,846 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:00:11,379 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3386, 'learning_rate': 0.00012015306122448978, 'epoch': 0.83} +[WARNING|modeling_utils.py:388] 2022-03-17 16:00:27,052 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:00:11,379 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:00:27,052 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:00:11,379 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 83%|█████████████████████████████████████████████████████████████████▋ | 742/892 [1:09:49<11:31, 4.61s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:00:29,156 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:00:31,130 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:00:29,156 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:00:31,130 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:00:29,156 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 83%|█████████████████████████████████████████████████████████████████▊ | 743/892 [1:09:53<11:00, 4.43s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:00:33,123 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 83%|█████████████████████████████████████████████████████████████████▉ | 744/892 [1:09:57<10:24, 4.22s/it]g-point operations will not be computed-17 16:00:33,123 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 83%|█████████████████████████████████████████████████████████████████▉ | 744/892 [1:09:57<10:24, 4.22s/it]g-point operations will not be computed-17 16:00:33,123 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 83%|█████████████████████████████████████████████████████████████████▉ | 744/892 [1:09:57<10:24, 4.22s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:00:36,764 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 84%|█████████████████████████████████████████████████████████████████▉ | 745/892 [1:10:01<09:44, 3.98s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:00:40,063 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 84%|█████████████████████████████████████████████████████████████████▉ | 745/892 [1:10:01<09:44, 3.98s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:00:40,063 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:00:41,555 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:00:40,063 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:00:41,555 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:00:40,063 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:00:44,271 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:00:43,000 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 84%|██████████████████████████████████████████████████████████████████▏ | 747/892 [1:10:06<08:09, 3.38s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:00:45,555 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 84%|██████████████████████████████████████████████████████████████████▏ | 747/892 [1:10:06<08:09, 3.38s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:00:45,555 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 84%|██████████████████████████████████████████████████████████████████▏ | 748/892 [1:10:08<07:17, 3.04s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:00:47,689 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 84%|██████████████████████████████████████████████████████████████████▏ | 748/892 [1:10:08<07:17, 3.04s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:00:47,689 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 84%|██████████████████████████████████████████████████████████████████▎ | 749/892 [1:10:10<06:27, 2.71s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:00:49,588 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 84%|██████████████████████████████████████████████████████████████████▎ | 749/892 [1:10:10<06:27, 2.71s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:00:49,588 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 84%|██████████████████████████████████████████████████████████████████▍ | 750/892 [1:10:13<06:13, 2.63s/it]g-point operations will not be computed-17 16:00:49,588 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 84%|██████████████████████████████████████████████████████████████████▍ | 750/892 [1:10:13<06:13, 2.63s/it]g-point operations will not be computed-17 16:00:49,588 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 84%|██████████████████████████████████████████████████████████████████▍ | 750/892 [1:10:13<06:13, 2.63s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:00:53,501 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 84%|██████████████████████████████████████████████████████████████████▍ | 750/892 [1:10:13<06:13, 2.63s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:00:53,501 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:00:57,160 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:00:53,501 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:00:57,160 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:00:53,501 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 84%|██████████████████████████████████████████████████████████████████▌ | 751/892 [1:10:20<09:31, 4.06s/it]g-point operations will not be computed-17 16:00:53,501 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 84%|██████████████████████████████████████████████████████████████████▌ | 751/892 [1:10:20<09:31, 4.06s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:01:00,760 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:01:04,295 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:01:00,760 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 84%|██████████████████████████████████████████████████████████████████▌ | 752/892 [1:10:27<11:38, 4.99s/it]g-point operations will not be computed-17 16:01:00,760 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 84%|██████████████████████████████████████████████████████████████████▌ | 752/892 [1:10:27<11:38, 4.99s/it]g-point operations will not be computed-17 16:01:00,760 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 84%|██████████████████████████████████████████████████████████████████▌ | 752/892 [1:10:27<11:38, 4.99s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:01:07,896 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 84%|██████████████████████████████████████████████████████████████████▌ | 752/892 [1:10:27<11:38, 4.99s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:01:07,896 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:01:11,389 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:01:07,896 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:01:11,389 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:01:07,896 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 84%|██████████████████████████████████████████████████████████████████▋ | 753/892 [1:10:35<13:00, 5.62s/it]g-point operations will not be computed-17 16:01:07,896 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 84%|██████████████████████████████████████████████████████████████████▋ | 753/892 [1:10:35<13:00, 5.62s/it]g-point operations will not be computed-17 16:01:07,896 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:01:18,427 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:01:07,896 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 85%|██████████████████████████████████████████████████████████████████▊ | 754/892 [1:10:42<13:52, 6.03s/it]g-point operations will not be computed-17 16:01:07,896 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 85%|██████████████████████████████████████████████████████████████████▊ | 754/892 [1:10:42<13:52, 6.03s/it]g-point operations will not be computed-17 16:01:07,896 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.7787, 'learning_rate': 0.00011020408163265306, 'epoch': 0.85} + 85%|██████████████████████████████████████████████████████████████████▊ | 754/892 [1:10:42<13:52, 6.03s/it]g-point operations will not be computed-17 16:01:07,896 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 85%|██���███████████████████████████████████████████████████████████████▊ | 754/892 [1:10:42<13:52, 6.03s/it]g-point operations will not be computed-17 16:01:07,896 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 85%|██████████████████████████████████████████████████████████████████▊ | 754/892 [1:10:42<13:52, 6.03s/it]g-point operations will not be computed-17 16:01:07,896 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 85%|██████████████████████████████████████████████████████████████████▊ | 755/892 [1:10:48<14:21, 6.29s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:01:28,853 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 85%|██████████████████████████████████████████████████████████████████▊ | 755/892 [1:10:48<14:21, 6.29s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:01:28,853 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 85%|██████████████████████████████████████████████████████████████████▊ | 755/892 [1:10:48<14:21, 6.29s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:01:28,853 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 85%|██████████████████████████████████████████████████████████████████▉ | 756/892 [1:10:55<14:39, 6.46s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:01:28,853 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 85%|██████████████████████████████████████████████████████████████████▉ | 756/892 [1:10:55<14:39, 6.46s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:01:28,853 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.7847, 'learning_rate': 0.0001086734693877551, 'epoch': 0.85} +[WARNING|modeling_utils.py:388] 2022-03-17 16:01:39,008 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:01:28,853 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 85%|███████████████████████████████████████████████████████████████████ | 757/892 [1:11:02<14:42, 6.54s/it]g-point operations will not be computed-17 16:01:28,853 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 85%|███████████████████████████████████████████████████████████████████ | 757/892 [1:11:02<14:42, 6.54s/it]g-point operations will not be computed-17 16:01:28,853 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.5984, 'learning_rate': 0.00010790816326530611, 'epoch': 0.85} + 85%|███████████████████████████████████████████████████████████████████ | 757/892 [1:11:02<14:42, 6.54s/it]g-point operations will not be computed-17 16:01:28,853 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 85%|███████████████████████████████████████████████████████████████████ | 757/892 [1:11:02<14:42, 6.54s/it]g-point operations will not be computed-17 16:01:28,853 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 85%|████████████████████████████████████████████��██████████████████████ | 757/892 [1:11:02<14:42, 6.54s/it]g-point operations will not be computed-17 16:01:28,853 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 85%|███████████████████████████████████████████████████████████████████▏ | 758/892 [1:11:09<14:47, 6.63s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:01:49,216 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 85%|███████████████████████████████████████████████████████████████████▏ | 758/892 [1:11:09<14:47, 6.63s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:01:49,216 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 85%|███████████████████████████████████████████████████████████████████▏ | 758/892 [1:11:09<14:47, 6.63s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:01:49,216 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 85%|███████████████████████████████████████████████████████████████████▏ | 759/892 [1:11:16<14:47, 6.67s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:01:49,216 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 85%|███████████████████████████████████████████████████████████████████▏ | 759/892 [1:11:16<14:47, 6.67s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:01:49,216 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.5638, 'learning_rate': 0.00010637755102040815, 'epoch': 0.85} +[WARNING|modeling_utils.py:388] 2022-03-17 16:01:59,294 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:01:49,216 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 85%|███████████████████████████████████████████████████████████████████▎ | 760/892 [1:11:22<14:41, 6.68s/it]g-point operations will not be computed-17 16:01:49,216 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 85%|███████████████████████████████████████████████████████████████████▎ | 760/892 [1:11:22<14:41, 6.68s/it]g-point operations will not be computed-17 16:01:49,216 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.5597, 'learning_rate': 0.00010561224489795918, 'epoch': 0.85} + 85%|███████████████████████████████████████████████████████████████████▎ | 760/892 [1:11:22<14:41, 6.68s/it]g-point operations will not be computed-17 16:01:49,216 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:02:07,531 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:01:49,216 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:02:07,531 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:01:49,216 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4244, 'learning_rate': 0.0001048469387755102, 'epoch': 0.85} +[WARNING|modeling_utils.py:388] 2022-03-17 16:02:07,531 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:01:49,216 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:02:14,138 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:01:49,216 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:02:14,138 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:01:49,216 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4303, 'learning_rate': 0.00010408163265306121, 'epoch': 0.85} +[WARNING|modeling_utils.py:388] 2022-03-17 16:02:14,138 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:01:49,216 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:02:14,138 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:01:49,216 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:02:14,138 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:01:49,216 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 86%|███████████████████████████████████████████████████████████████████▌ | 763/892 [1:11:42<14:16, 6.64s/it]g-point operations will not be computed-17 16:01:49,216 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:02:24,127 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:01:49,216 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:02:24,127 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:01:49,216 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:02:24,127 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:01:49,216 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 86%|███████████████████████████████████████████████████████████████████▋ | 764/892 [1:11:49<14:07, 6.62s/it]g-point operations will not be computed-17 16:01:49,216 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:02:30,659 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:01:49,216 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:02:30,659 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:01:49,216 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:02:30,659 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:01:49,216 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 86%|███████████████████████████████████████████████████████████████████▊ | 765/892 [1:11:55<13:57, 6.59s/it]g-point operations will not be computed-17 16:01:49,216 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 86%|███████████████████████████████████████████████████████████████████▊ | 765/892 [1:11:55<13:57, 6.59s/it]g-point operations will not be computed-17 16:01:49,216 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 86%|███████████████████████████████████████████████████████████████████▊ | 765/892 [1:11:55<13:57, 6.59s/it]g-point operations will not be computed-17 16:01:49,216 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 86%|█████████���█████████████████████████████████████████████████████████▊ | 765/892 [1:11:55<13:57, 6.59s/it]g-point operations will not be computed-17 16:01:49,216 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:02:40,325 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:01:49,216 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:02:40,325 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:01:49,216 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:02:40,325 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:01:49,216 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:02:46,748 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:01:49,216 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:02:46,748 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:01:49,216 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2721, 'learning_rate': 0.00010025510204081632, 'epoch': 0.86} +[WARNING|modeling_utils.py:388] 2022-03-17 16:02:46,748 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:01:49,216 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:02:46,748 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:01:49,216 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:02:46,748 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:01:49,216 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 86%|████████████████████████████████████████████████████████████████████ | 768/892 [1:12:15<13:23, 6.48s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:02:54,811 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 86%|████████████████████████████████████████████████████████████████████ | 768/892 [1:12:15<13:23, 6.48s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:02:54,811 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 86%|████████████████████████████████████████████████████████████████████ | 768/892 [1:12:15<13:23, 6.48s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:02:54,811 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 86%|████████████████████████████████████████████████████████████████████ | 768/892 [1:12:15<13:23, 6.48s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:02:54,811 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 86%|████████████████████████████████████████████████████████████████████ | 769/892 [1:12:21<13:12, 6.45s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:03:01,145 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 86%|████████████████████████████████████████████████████████████████████ | 769/892 [1:12:21<13:12, 6.45s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:03:01,145 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 86%|████████████████████████████████████████████████████████████████████ | 769/892 [1:12:21<13:12, 6.45s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:03:01,145 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 86%|████████████████████████████████████████████████████████████████████ | 769/892 [1:12:21<13:12, 6.45s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:03:01,145 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 86%|████████████████████████████████████████████████████████████████████▏ | 770/892 [1:12:27<13:00, 6.40s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:03:07,438 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 86%|████████████████████████████████████████████████████████████████████▏ | 770/892 [1:12:27<13:00, 6.40s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:03:07,438 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 86%|████████████████████████████████████████████████████████████████████▏ | 770/892 [1:12:27<13:00, 6.40s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:03:07,438 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 86%|████████████████████████████████████████████████████████████████████▏ | 770/892 [1:12:27<13:00, 6.40s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:03:07,438 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 86%|████████████████████████████████████████████████████████████████████▎ | 771/892 [1:12:33<12:50, 6.37s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:03:07,438 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:03:15,311 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:03:07,438 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:03:15,311 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:03:07,438 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:03:15,311 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:03:07,438 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 87%|████████████████████████████████████████████████████████████████████▎ | 772/892 [1:12:40<12:41, 6.34s/it]g-point operations will not be computed-17 16:03:07,438 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 87%|████████████████████████████████████████████████████████████████████▎ | 772/892 [1:12:40<12:41, 6.34s/it]g-point operations will not be computed-17 16:03:07,438 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:03:23,135 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:03:07,438 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:03:23,135 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:03:07,438 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 87%|████████████████████████████████████████████████████████████████████▍ | 773/892 [1:12:46<12:33, 6.33s/it]g-point operations will not be computed-17 16:03:07,438 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:03:27,803 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:03:07,438 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:03:27,803 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:03:07,438 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:03:27,803 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:03:07,438 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 87%|████████████████████████████████████████████████████████████████████▌ | 774/892 [1:12:52<12:21, 6.28s/it]g-point operations will not be computed-17 16:03:07,438 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:03:33,983 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:03:07,438 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:03:33,983 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:03:07,438 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 87%|████████████████████████████████████████████████████████████████████▋ | 775/892 [1:12:59<12:41, 6.51s/it]g-point operations will not be computed-17 16:03:07,438 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 87%|████████████████████████████████████████████████████████████████████▋ | 775/892 [1:12:59<12:41, 6.51s/it]g-point operations will not be computed-17 16:03:07,438 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0283, 'learning_rate': 9.413265306122448e-05, 'epoch': 0.87} +[WARNING|modeling_utils.py:388] 2022-03-17 16:03:42,433 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:03:07,438 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 87%|████████████████████████████████████████████████████████████████████▋ | 776/892 [1:13:05<12:17, 6.36s/it]g-point operations will not be computed-17 16:03:07,438 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 87%|████████████████████████████████████████████████████████████████████▋ | 776/892 [1:13:05<12:17, 6.36s/it]g-point operations will not be computed-17 16:03:07,438 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2473, 'learning_rate': 9.336734693877551e-05, 'epoch': 0.87} +[WARNING|modeling_utils.py:388] 2022-03-17 16:03:48,368 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:03:07,438 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:03:48,368 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:03:07,438 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 87%|██████████████████████���█████████████████████████████████████████████▊ | 777/892 [1:13:11<11:56, 6.23s/it]g-point operations will not be computed-17 16:03:07,438 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 87%|████████████████████████████████████████████████████████████████████▊ | 777/892 [1:13:11<11:56, 6.23s/it]g-point operations will not be computed-17 16:03:07,438 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:03:54,303 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:03:07,438 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:03:54,303 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:03:07,438 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 87%|████████████████████████████████████████████████████████████████████▉ | 778/892 [1:13:17<11:40, 6.15s/it]g-point operations will not be computed-17 16:03:07,438 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:03:58,771 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:03:07,438 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:03:58,771 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:03:07,438 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:03:58,771 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:03:07,438 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 87%|████████████████████████████████████████████████████████████████████▉ | 779/892 [1:13:23<11:24, 6.06s/it]g-point operations will not be computed-17 16:03:07,438 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:04:04,616 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:03:07,438 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:04:04,616 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:03:07,438 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:04:04,616 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:03:07,438 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 87%|█████████████████████████████████████████████████████████████████████ | 780/892 [1:13:29<11:09, 5.98s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:04:08,973 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 87%|█████████████████████████████████████████████████████████████████████ | 780/892 [1:13:29<11:09, 5.98s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:04:08,973 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:04:13,255 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:04:08,973 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:04:13,255 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:04:08,973 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1021, 'learning_rate': 8.954081632653061e-05, 'epoch': 0.88} +[WARNING|modeling_utils.py:388] 2022-03-17 16:04:13,255 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:04:08,973 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:04:19,011 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:04:08,973 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:04:19,011 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:04:08,973 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1532, 'learning_rate': 8.877551020408162e-05, 'epoch': 0.88} +[WARNING|modeling_utils.py:388] 2022-03-17 16:04:23,311 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:04:08,973 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 88%|█████████████████████████████████████████████████████████████████████▎ | 783/892 [1:13:46<10:33, 5.82s/it]g-point operations will not be computed-17 16:04:08,973 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 88%|█████████████████████████████████████████████████████████████████████▎ | 783/892 [1:13:46<10:33, 5.82s/it]g-point operations will not be computed-17 16:04:08,973 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2019, 'learning_rate': 8.801020408163265e-05, 'epoch': 0.88} +[WARNING|modeling_utils.py:388] 2022-03-17 16:04:28,837 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:04:08,973 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:04:28,837 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:04:08,973 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 88%|█████████████████████████████████████████████████████████████████████▍ | 784/892 [1:13:52<10:16, 5.71s/it]g-point operations will not be computed-17 16:04:08,973 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:04:32,881 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:04:08,973 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:04:35,517 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:04:08,973 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:04:35,517 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:04:08,973 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1634, 'learning_rate': 8.647959183673469e-05, 'epoch': 0.88} +[WARNING|modeling_utils.py:388] 2022-03-17 16:04:39,561 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:04:08,973 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 88%|█████████████████████████████████████████████████████████████████████▌ | 786/892 [1:14:02<09:45, 5.53s/it]g-point operations will not be computed-17 16:04:08,973 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 88%|█████████████████████████████████████████████████████████████████��███▌ | 786/892 [1:14:02<09:45, 5.53s/it]g-point operations will not be computed-17 16:04:08,973 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:04:43,444 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:04:08,973 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:04:43,444 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:04:08,973 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:04:43,444 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:04:08,973 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 88%|█████████████████████████████████████████████████████████████████████▋ | 787/892 [1:14:07<09:26, 5.40s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:04:47,271 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:04:49,745 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:04:47,271 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 88%|█████████████████████████████████████████████████████████████████████▊ | 788/892 [1:14:12<09:09, 5.29s/it]g-point operations will not be computed-17 16:04:47,271 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 88%|█████████████████████████████████████████████████████████████████████▊ | 788/892 [1:14:12<09:09, 5.29s/it]g-point operations will not be computed-17 16:04:47,271 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:04:53,446 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:04:47,271 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:04:55,862 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:04:47,271 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:04:55,862 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:04:47,271 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1432, 'learning_rate': 8.341836734693876e-05, 'epoch': 0.88} +[WARNING|modeling_utils.py:388] 2022-03-17 16:04:59,501 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:04:47,271 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 89%|█████████████████████████████████████████████████████████████████████▉ | 790/892 [1:14:22<08:35, 5.05s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:05:01,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 89%|█████████████████████████████████████████████████████████████████████▉ | 790/892 [1:14:22<08:35, 5.05s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:05:01,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:05:04,181 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:05:01,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 89%|██████████████████████████████████████████████████████████████████████ | 791/892 [1:14:27<08:18, 4.93s/it]g-point operations will not be computed-17 16:05:01,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 89%|██████████████████████████████████████████████████████████████████████ | 791/892 [1:14:27<08:18, 4.93s/it]g-point operations will not be computed-17 16:05:01,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:05:07,586 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:05:01,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:05:09,661 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:05:01,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:05:09,661 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:05:01,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:05:11,760 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:05:01,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:05:13,683 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:05:01,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:05:13,683 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:05:01,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:05:15,605 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:05:01,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:05:17,335 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:05:01,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:05:17,335 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:05:01,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:05:20,614 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:05:01,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:05:20,614 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:05:01,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:05:22,192 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:05:01,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:05:23,554 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:05:01,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:05:23,554 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:05:01,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:05:26,081 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:05:01,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:05:26,081 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:05:01,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:05:28,334 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:05:01,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:05:28,334 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:05:01,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:05:30,303 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:05:01,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:05:30,303 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:05:01,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:05:31,215 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:05:01,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:05:31,215 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:05:01,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:05:32,845 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:05:01,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:05:36,817 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:05:01,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:05:36,817 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:05:01,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:05:40,432 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:05:01,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:05:40,432 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:05:01,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.0181, 'learning_rate': 7.423469387755102e-05, 'epoch': 0.9} +[WARNING|modeling_utils.py:388] 2022-03-17 16:05:44,059 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:05:01,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:05:44,059 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:05:01,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:05:44,059 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:05:01,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:05:47,529 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:05:01,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:05:51,065 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:05:01,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:05:51,065 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:05:01,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:05:51,065 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:05:01,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:05:54,452 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:05:01,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:05:54,452 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:05:01,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:05:59,641 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:05:01,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:05:59,641 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:05:01,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 90%|███████████████████████████████████████████████████████████████████████▏ | 804/892 [1:15:23<08:45, 5.97s/it]g-point operations will not be computed-17 16:05:01,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 90%|███████████████████████████████████████████████████████████████████████▏ | 804/892 [1:15:23<08:45, 5.97s/it]g-point operations will not be computed-17 16:05:01,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 90%|███████████████████████████████████████████████████████████████████████▏ | 804/892 [1:15:23<08:45, 5.97s/it]g-point operations will not be computed-17 16:05:01,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 90%|███████████████████████████████████████████████████████████████████████▏ | 804/892 [1:15:23<08:45, 5.97s/it]g-point operations will not be computed-17 16:05:01,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 90%|███████████████████████████████████████████████████████████████████████▏ | 804/892 [1:15:23<08:45, 5.97s/it]g-point operations will not be computed-17 16:05:01,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 90%|███████████████████████████████████████████████████████████████████████▎ | 805/892 [1:15:30<09:02, 6.23s/it]g-point operations will not be computed-17 16:05:01,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 90%|███████████████████████████████████████████████████████████████████████▎ | 805/892 [1:15:30<09:02, 6.23s/it]g-point operations will not be computed-17 16:05:01,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:06:13,265 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:05:01,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:06:13,265 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:05:01,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 90%|███████████████████████████████████████████████████████████████████████▍ | 806/892 [1:15:36<09:10, 6.41s/it]g-point operations will not be computed-17 16:05:01,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 90%|███████████████████████████████████████████████████████████████████████▍ | 806/892 [1:15:36<09:10, 6.41s/it]g-point operations will not be computed-17 16:05:01,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 90%|███████████████████████████████████████████████████████████████████████▍ | 806/892 [1:15:36<09:10, 6.41s/it]g-point operations will not be computed-17 16:05:01,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 90%|███████████████████████████████████████████████████████████████████████▍ | 806/892 [1:15:36<09:10, 6.41s/it]g-point operations will not be computed-17 16:05:01,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:06:21,770 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:05:01,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:06:21,770 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:05:01,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:06:21,770 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:05:01,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:06:21,770 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:05:01,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:06:21,770 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:05:01,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 91%|███████████████████████████████████████████████████████████████████████▌ | 808/892 [1:15:50<09:13, 6.58s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:06:30,228 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 91%|███████████████████████████████████████████████████████████████████████▌ | 808/892 [1:15:50<09:13, 6.58s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:06:30,228 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 91%|███████████████████████████████████████████████████████████████████████▌ | 808/892 [1:15:50<09:13, 6.58s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:06:30,228 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 91%|███████████████████████████████████████████████████████████████████████▌ | 808/892 [1:15:50<09:13, 6.58s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:06:30,228 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 91%|███████████████████████████████████████████████████████████████████████▋ | 809/892 [1:15:56<09:07, 6.60s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:06:30,228 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 91%|███████████████████████████████████████████████████████████████████████▋ | 809/892 [1:15:56<09:07, 6.60s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:06:30,228 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:06:40,145 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:06:30,228 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:06:40,145 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:06:30,228 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 91%|███████████████████████████████████████████████████████████████████████▋ | 810/892 [1:16:03<09:02, 6.62s/it]g-point operations will not be computed-17 16:06:30,228 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 91%|███████████████████████████████████████████████████████████████████████▋ | 810/892 [1:16:03<09:02, 6.62s/it]g-point operations will not be computed-17 16:06:30,228 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 91%|███████████████████████████████████████████████████████████████████████▋ | 810/892 [1:16:03<09:02, 6.62s/it]g-point operations will not be computed-17 16:06:30,228 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:06:48,377 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:06:30,228 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:06:48,377 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:06:30,228 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4591, 'learning_rate': 6.658163265306122e-05, 'epoch': 0.91} +[WARNING|modeling_utils.py:388] 2022-03-17 16:06:48,377 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:06:30,228 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:06:48,377 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:06:30,228 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:06:48,377 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:06:30,228 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 91%|███████████████████████████████████████████████████████████████████████▉ | 812/892 [1:16:16<08:47, 6.59s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:06:56,626 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 91%|███████████████████████████████████████████████████████████████████████▉ | 812/892 [1:16:16<08:47, 6.59s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:06:56,626 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 91%|███████████████████████████████████████████████████████████████████████▉ | 812/892 [1:16:16<08:47, 6.59s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:06:56,626 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 91%|███████████████████████████████████████████████████████████████████████▉ | 812/892 [1:16:16<08:47, 6.59s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:06:56,626 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 91%|████████████████████████████████████████████████████████████████████████ | 813/892 [1:16:23<08:37, 6.55s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:06:56,626 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:07:04,649 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:06:56,626 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:07:04,649 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:06:56,626 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:07:04,649 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:06:56,626 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 91%|████████████████████████████████████████████████████████████████████████ | 814/892 [1:16:29<08:27, 6.51s/it]g-point operations will not be computed-17 16:06:56,626 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:07:11,037 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:06:56,626 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:07:11,037 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:06:56,626 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:07:11,037 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:06:56,626 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 91%|████████████████████████████████████████████████████████████████████████▏ | 815/892 [1:16:36<08:20, 6.49s/it]g-point operations will not be computed-17 16:06:56,626 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:07:17,498 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:06:56,626 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:07:17,498 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:06:56,626 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:07:17,498 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:06:56,626 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 91%|████████████████████████████████████████████████████████████████████████▎ | 816/892 [1:16:42<08:11, 6.47s/it]g-point operations will not be computed-17 16:06:56,626 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 91%|████████████████████████████████████████████████████████████████████████▎ | 816/892 [1:16:42<08:11, 6.47s/it]g-point operations will not be computed-17 16:06:56,626 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 91%|████████████████████████████████████████████████████████████████████████▎ | 816/892 [1:16:42<08:11, 6.47s/it]g-point operations will not be computed-17 16:06:56,626 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:07:27,025 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:06:56,626 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:07:27,025 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:06:56,626 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1727, 'learning_rate': 6.198979591836734e-05, 'epoch': 0.92} +[WARNING|modeling_utils.py:388] 2022-03-17 16:07:27,025 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:06:56,626 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:07:33,316 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:06:56,626 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:07:33,316 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:06:56,626 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1451, 'learning_rate': 6.122448979591836e-05, 'epoch': 0.92} +[WARNING|modeling_utils.py:388] 2022-03-17 16:07:33,316 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:06:56,626 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:07:39,580 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:06:56,626 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:07:39,580 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:06:56,626 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0258, 'learning_rate': 6.045918367346938e-05, 'epoch': 0.92} +[WARNING|modeling_utils.py:388] 2022-03-17 16:07:39,580 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:06:56,626 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:07:45,766 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:06:56,626 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:07:45,766 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:06:56,626 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1776, 'learning_rate': 5.96938775510204e-05, 'epoch': 0.92} +[WARNING|modeling_utils.py:388] 2022-03-17 16:07:45,766 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:06:56,626 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:07:51,968 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:06:56,626 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:07:51,968 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:06:56,626 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0993, 'learning_rate': 5.892857142857142e-05, 'epoch': 0.92} +[WARNING|modeling_utils.py:388] 2022-03-17 16:07:51,968 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:06:56,626 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:07:58,133 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:06:56,626 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:07:58,133 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:06:56,626 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0599, 'learning_rate': 5.816326530612244e-05, 'epoch': 0.92} +[WARNING|modeling_utils.py:388] 2022-03-17 16:07:58,133 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:06:56,626 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:07:58,133 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:06:56,626 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:07:58,133 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:06:56,626 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 92%|████████████████████████████████████████████████████████████████████████▉ | 823/892 [1:17:26<07:07, 6.19s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:08:05,760 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 92%|████████████████████████████████████████████████████████████████████████▉ | 823/892 [1:17:26<07:07, 6.19s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:08:05,760 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:08:10,220 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:08:05,760 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:08:10,220 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:08:05,760 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1469, 'learning_rate': 5.663265306122448e-05, 'epoch': 0.92} +[WARNING|modeling_utils.py:388] 2022-03-17 16:08:10,220 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:08:05,760 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:08:10,220 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:08:05,760 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 92%|█████████████████████████████████████████████████████████████████████████ | 825/892 [1:17:39<07:07, 6.39s/it]g-point operations will not be computed-17 16:08:05,760 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 92%|█████████████████████████████████████████████████████████████████████████ | 825/892 [1:17:39<07:07, 6.39s/it]g-point operations will not be computed-17 16:08:05,760 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:08:20,261 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:08:05,760 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:08:20,261 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:08:05,760 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:08:20,261 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:08:05,760 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 93%|█████████████████████████████████████████████████████████████████████████▏ | 826/892 [1:17:45<06:54, 6.28s/it]g-point operations will not be computed-17 16:08:05,760 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 93%|█████████��███████████████████████████████████████████████████████████████▏ | 826/892 [1:17:45<06:54, 6.28s/it]g-point operations will not be computed-17 16:08:05,760 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:08:27,665 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:08:05,760 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:08:27,665 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:08:05,760 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 93%|█████████████████████████████████████████████████████████████████████████▏ | 827/892 [1:17:50<06:40, 6.16s/it]g-point operations will not be computed-17 16:08:05,760 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:08:32,013 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:08:05,760 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:08:32,013 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:08:05,760 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:08:32,013 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:08:05,760 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 93%|█████████████████████████████████████████████████████████████████████████▎ | 828/892 [1:17:56<06:26, 6.05s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:08:36,382 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 93%|█████████████████████████████████████████████████████████████████████████▎ | 828/892 [1:17:56<06:26, 6.05s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:08:36,382 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 93%|█████████████████████████████████████████████████████████████████████████▎ | 828/892 [1:17:56<06:26, 6.05s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:08:36,382 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 93%|█████████████████████████████████████████████████████████████████████████▎ | 828/892 [1:17:56<06:26, 6.05s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:08:36,382 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 93%|█████████████████████████████████████████████████████████████████████████▍ | 829/892 [1:18:02<06:16, 5.98s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:08:42,210 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 93%|█████████████████████████████████████████████████████████████████████████▍ | 829/892 [1:18:02<06:16, 5.98s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:08:42,210 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:08:46,453 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:08:42,210 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:08:46,453 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:08:42,210 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1883, 'learning_rate': 5.204081632653061e-05, 'epoch': 0.93} +[WARNING|modeling_utils.py:388] 2022-03-17 16:08:50,761 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:08:42,210 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 93%|█████████████████████████████████████████████████████████████████████████▌ | 831/892 [1:18:14<05:57, 5.86s/it]g-point operations will not be computed-17 16:08:42,210 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 93%|█████████████████████████████████████████████████████████████████████████▌ | 831/892 [1:18:14<05:57, 5.86s/it]g-point operations will not be computed-17 16:08:42,210 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.9742, 'learning_rate': 5.1275510204081626e-05, 'epoch': 0.93} +[WARNING|modeling_utils.py:388] 2022-03-17 16:08:56,495 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:08:42,210 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 93%|█████████████████████████████████████████████████████████████████████████▋ | 832/892 [1:18:19<05:48, 5.81s/it]g-point operations will not be computed-17 16:08:42,210 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 93%|█████████████████████████████████████████████████████████████████████████▋ | 832/892 [1:18:19<05:48, 5.81s/it]g-point operations will not be computed-17 16:08:42,210 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:09:00,729 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:08:42,210 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:09:00,729 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:08:42,210 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:09:00,729 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:08:42,210 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 93%|█████████████████████████████████████████████████████████████████████████▊ | 833/892 [1:18:25<05:39, 5.76s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:09:04,934 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 93%|█████████████████████████████████████████████████████████████████████████▊ | 833/892 [1:18:25<05:39, 5.76s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:09:04,934 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:09:08,980 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:09:04,934 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:09:08,980 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:09:04,934 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0522, 'learning_rate': 4.897959183673468e-05, 'epoch': 0.93} +[WARNING|modeling_utils.py:388] 2022-03-17 16:09:12,986 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:09:04,934 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 94%|█████████████████████████████████████████████████████████████████████████▉ | 835/892 [1:18:36<05:16, 5.56s/it]g-point operations will not be computed-17 16:09:04,934 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 94%|█████████████████████████████████████████████████████████████████████████▉ | 835/892 [1:18:36<05:16, 5.56s/it]g-point operations will not be computed-17 16:09:04,934 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:09:16,957 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:09:04,934 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:09:16,957 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:09:04,934 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:09:16,957 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:09:04,934 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 94%|██████████████████████████████████████████████████████████████████████████ | 836/892 [1:18:41<05:05, 5.46s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:09:20,853 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 94%|██████████████████████████████████████████████████████████████████████████ | 836/892 [1:18:41<05:05, 5.46s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:09:20,853 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:09:24,603 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:09:20,853 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:09:24,603 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:09:20,853 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:09:27,160 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:09:20,853 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:09:27,160 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:09:20,853 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:09:27,160 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:09:20,853 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 94%|██████████████████████████████████████████████████████████████████████████▏ | 838/892 [1:18:51<04:42, 5.23s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:09:30,838 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:09:33,167 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:09:30,838 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 94%|██████████████████████████████████████████████████████████████████████████▎ | 839/892 [1:18:56<04:29, 5.09s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:09:35,479 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 94%|██████████████████████████████████████████████████████████████████████████▎ | 839/892 [1:18:56<04:29, 5.09s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:09:35,479 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:09:37,677 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:09:35,479 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 94%|██████████████████████████████████████████████████████████████████████████▍ | 840/892 [1:19:00<04:14, 4.89s/it]g-point operations will not be computed-17 16:09:35,479 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 94%|██████████████████████████████████████████████████████████████████████████▍ | 840/892 [1:19:00<04:14, 4.89s/it]g-point operations will not be computed-17 16:09:35,479 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:09:40,913 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:09:35,479 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:09:42,958 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:09:35,479 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:09:42,958 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:09:35,479 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:09:45,004 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:09:35,479 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:09:46,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:09:35,479 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:09:46,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:09:35,479 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:09:48,750 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:09:35,479 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:09:50,476 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:09:35,479 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:09:50,476 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:09:35,479 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:09:53,802 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:09:35,479 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:09:53,802 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:09:35,479 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:09:55,338 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:09:35,479 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:09:58,098 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:09:35,479 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:09:58,098 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:09:35,479 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:09:59,334 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:09:35,479 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:09:59,334 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:09:35,479 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:10:01,682 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:09:35,479 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:10:01,682 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:09:35,479 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:10:03,811 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:09:35,479 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:10:03,811 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:09:35,479 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:10:05,731 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:09:35,479 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:10:05,731 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:09:35,479 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:10:06,702 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:09:35,479 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:10:06,702 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:09:35,479 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:10:08,347 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:09:35,479 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:10:12,199 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:09:35,479 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:10:12,199 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:09:35,479 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:10:12,199 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:09:35,479 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:10:15,779 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:09:35,479 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:10:15,779 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:09:35,479 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:10:19,410 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:09:35,479 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:10:19,410 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:09:35,479 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:10:19,410 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:09:35,479 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:10:22,938 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:09:35,479 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:10:26,514 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:09:35,479 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:10:26,514 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:09:35,479 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:10:26,514 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:09:35,479 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:10:29,975 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:09:35,479 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:10:29,975 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:09:35,479 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:10:33,535 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:09:35,479 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:10:33,535 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:09:35,479 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:10:33,535 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:09:35,479 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 96%|███████████████████████████████████████████████████████████████████████████▋ | 854/892 [1:19:58<03:48, 6.00s/it]g-point operations will not be computed-17 16:09:35,479 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:10:40,503 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:09:35,479 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:10:40,503 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:09:35,479 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:10:40,503 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:09:35,479 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 96%|███████████████████████████████████████████████████████████████████████████▋ | 855/892 [1:20:05<03:52, 6.29s/it]g-point operations will not be computed-17 16:09:35,479 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 96%|██████████████████████████████████████��████████████████████████████████████▋ | 855/892 [1:20:05<03:52, 6.29s/it]g-point operations will not be computed-17 16:09:35,479 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:10:49,104 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:09:35,479 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 96%|███████████████████████████████████████████████████████████████████████████▊ | 856/892 [1:20:12<03:52, 6.46s/it]g-point operations will not be computed-17 16:09:35,479 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 96%|███████████████████████████████████████████████████████████████████████████▊ | 856/892 [1:20:12<03:52, 6.46s/it]g-point operations will not be computed-17 16:09:35,479 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4819, 'learning_rate': 3.214285714285714e-05, 'epoch': 0.96} + 96%|███████████████████████████████████████████████████████████████████████████▊ | 856/892 [1:20:12<03:52, 6.46s/it]g-point operations will not be computed-17 16:09:35,479 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 96%|███████████████████████████████████████████████████████████████████████████▊ | 856/892 [1:20:12<03:52, 6.46s/it]g-point operations will not be computed-17 16:09:35,479 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 96%|███████████████████████████████████████████████████████████████████████████▊ | 856/892 [1:20:12<03:52, 6.46s/it]g-point operations will not be computed-17 16:09:35,479 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 96%|███████████████████████████████████████████████████████████████████████████▉ | 857/892 [1:20:19<03:49, 6.57s/it]g-point operations will not be computed-17 16:09:35,479 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:11:01,062 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:09:35,479 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:11:01,062 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:09:35,479 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:11:01,062 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:09:35,479 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 96%|███████████████████████████████████████████████████████████████████████████▉ | 858/892 [1:20:26<03:45, 6.64s/it]g-point operations will not be computed-17 16:09:35,479 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 96%|███████████████████████████████████████████████████████████████████████████▉ | 858/892 [1:20:26<03:45, 6.64s/it]g-point operations will not be computed-17 16:09:35,479 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 96%|███████████████████████████████████████████████���███████████████████████████▉ | 858/892 [1:20:26<03:45, 6.64s/it]g-point operations will not be computed-17 16:09:35,479 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:11:11,064 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:09:35,479 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:11:11,064 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:09:35,479 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.201, 'learning_rate': 2.98469387755102e-05, 'epoch': 0.96} +[WARNING|modeling_utils.py:388] 2022-03-17 16:11:11,064 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:09:35,479 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:11:11,064 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:09:35,479 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:11:11,064 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:09:35,479 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 96%|████████████████████████████████████████████████████████████████████████████▏ | 860/892 [1:20:40<03:41, 6.94s/it]g-point operations will not be computed-17 16:09:35,479 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 96%|████████████████████████████████████████████████████████████████████████████▏ | 860/892 [1:20:40<03:41, 6.94s/it]g-point operations will not be computed-17 16:09:35,479 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 96%|████████████████████████████████████████████████████████████████████████████▏ | 860/892 [1:20:40<03:41, 6.94s/it]g-point operations will not be computed-17 16:09:35,479 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:11:25,587 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:09:35,479 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:11:25,587 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:09:35,479 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.41, 'learning_rate': 2.831632653061224e-05, 'epoch': 0.97} +[WARNING|modeling_utils.py:388] 2022-03-17 16:11:25,587 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:09:35,479 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:11:25,587 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:09:35,479 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:11:25,587 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:09:35,479 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 97%|████████████████████████████████████████████████████████████████████████████▎ | 862/892 [1:20:53<03:23, 6.79s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:11:33,762 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 97%|█████████████████████████████████████████████��██████████████████████████████▎ | 862/892 [1:20:53<03:23, 6.79s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:11:33,762 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 97%|████████████████████████████████████████████████████████████████████████████▎ | 862/892 [1:20:53<03:23, 6.79s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:11:33,762 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 97%|████████████████████████████████████████████████████████████████████████████▎ | 862/892 [1:20:53<03:23, 6.79s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:11:33,762 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 97%|████████████████████████████████████████████████████████████████████████████▍ | 863/892 [1:21:00<03:14, 6.71s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:11:33,762 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:11:41,827 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:11:33,762 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:11:41,827 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:11:33,762 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:11:41,827 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:11:33,762 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 97%|████████████████████████████████████████████████████████████████████████████▌ | 864/892 [1:21:06<03:05, 6.61s/it]g-point operations will not be computed-17 16:11:33,762 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:11:48,198 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:11:33,762 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:11:48,198 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:11:33,762 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:11:48,198 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:11:33,762 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 97%|████████████████████████████████████████████████████████████████████████████▌ | 865/892 [1:21:13<02:56, 6.53s/it]g-point operations will not be computed-17 16:11:33,762 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 97%|████████████████████████████████████████████████████████████████████████████▌ | 865/892 [1:21:13<02:56, 6.53s/it]g-point operations will not be computed-17 16:11:33,762 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:11:56,339 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:11:33,762 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 97%|████████████████████████████████████████████████████████████████████████████▋ | 866/892 [1:21:19<02:50, 6.55s/it]g-point operations will not be computed-17 16:11:33,762 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 97%|████████████████████████████████████████████████████████████████████████████▋ | 866/892 [1:21:19<02:50, 6.55s/it]g-point operations will not be computed-17 16:11:33,762 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.9931, 'learning_rate': 2.448979591836734e-05, 'epoch': 0.97} +[WARNING|modeling_utils.py:388] 2022-03-17 16:12:02,643 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:11:33,762 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 97%|████████████████████████████████████████████████████████████████████████████▊ | 867/892 [1:21:26<02:41, 6.48s/it]g-point operations will not be computed-17 16:11:33,762 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 97%|████████████████████████████████████████████████████████████████████████████▊ | 867/892 [1:21:26<02:41, 6.48s/it]g-point operations will not be computed-17 16:11:33,762 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.201, 'learning_rate': 2.3724489795918367e-05, 'epoch': 0.97} +[WARNING|modeling_utils.py:388] 2022-03-17 16:12:08,992 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:11:33,762 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + g-point operations will not be computed-17 16:11:33,762 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + g-point operations will not be computed-17 16:11:33,762 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0319, 'learning_rate': 2.2959183673469387e-05, 'epoch': 0.97} + g-point operations will not be computed-17 16:11:33,762 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:12:16,778 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:11:33,762 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:12:16,778 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:11:33,762 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.9311, 'learning_rate': 2.2193877551020406e-05, 'epoch': 0.97} +[WARNING|modeling_utils.py:388] 2022-03-17 16:12:16,778 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:11:33,762 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:12:22,905 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:11:33,762 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:12:22,905 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:11:33,762 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2493, 'learning_rate': 2.1428571428571425e-05, 'epoch': 0.98} +[WARNING|modeling_utils.py:388] 2022-03-17 16:12:22,905 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:11:33,762 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:12:29,200 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:11:33,762 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:12:29,200 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:11:33,762 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.9831, 'learning_rate': 2.0663265306122444e-05, 'epoch': 0.98} +[WARNING|modeling_utils.py:388] 2022-03-17 16:12:29,200 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:11:33,762 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:12:35,204 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:11:33,762 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:12:35,204 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:11:33,762 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0472, 'learning_rate': 1.989795918367347e-05, 'epoch': 0.98} +[WARNING|modeling_utils.py:388] 2022-03-17 16:12:35,204 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:11:33,762 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:12:41,241 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:11:33,762 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:12:41,241 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:11:33,762 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1426, 'learning_rate': 1.913265306122449e-05, 'epoch': 0.98} +[WARNING|modeling_utils.py:388] 2022-03-17 16:12:45,704 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:11:33,762 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 98%|█████████████████████████████████████████████████████████████████████████████▍ | 874/892 [1:22:09<01:49, 6.08s/it]g-point operations will not be computed-17 16:11:33,762 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 98%|█████████████████████████████████████████████████████████████████████████████▍ | 874/892 [1:22:09<01:49, 6.08s/it]g-point operations will not be computed-17 16:11:33,762 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0451, 'learning_rate': 1.8367346938775508e-05, 'epoch': 0.98} +[WARNING|modeling_utils.py:388] 2022-03-17 16:12:51,574 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:11:33,762 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:12:51,574 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:11:33,762 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:12:51,574 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:11:33,762 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1395, 'learning_rate': 1.760204081632653e-05, 'epoch': 0.98} +[WARNING|modeling_utils.py:388] 2022-03-17 16:12:51,574 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:11:33,762 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:12:59,813 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:11:33,762 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:12:59,813 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:11:33,762 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.9079, 'learning_rate': 1.683673469387755e-05, 'epoch': 0.98} +[WARNING|modeling_utils.py:388] 2022-03-17 16:13:04,208 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:11:33,762 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 98%|█████████████████████████████████████████████████████████████████████████████▋ | 877/892 [1:22:27<01:30, 6.06s/it]g-point operations will not be computed-17 16:11:33,762 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 98%|█████████████████████████████████████████████████████████████████████████████▋ | 877/892 [1:22:27<01:30, 6.06s/it]g-point operations will not be computed-17 16:11:33,762 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.9106, 'learning_rate': 1.607142857142857e-05, 'epoch': 0.98} +[WARNING|modeling_utils.py:388] 2022-03-17 16:13:09,857 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:11:33,762 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 98%|█████████████████████████████████████████████████████████████████████████████▊ | 878/892 [1:22:33<01:22, 5.92s/it]g-point operations will not be computed-17 16:11:33,762 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 98%|█████████████████████████████████████████████████████████████████████████████▊ | 878/892 [1:22:33<01:22, 5.92s/it]g-point operations will not be computed-17 16:11:33,762 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:13:14,025 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:11:33,762 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:13:14,025 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:11:33,762 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:13:14,025 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:11:33,762 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 99%|█████████████████████████████████████████████████████████████████████████████▊ | 879/892 [1:22:38<01:15, 5.80s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:13:18,145 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:13:20,784 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:13:18,145 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 99%|█████████████████████████████████████████████████████████████████████████████▉ | 880/892 [1:22:43<01:08, 5.67s/it]g-point operations will not be computed-17 16:13:18,145 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 99%|█████████████████████████████████████████████████████████████████████████████▉ | 880/892 [1:22:43<01:08, 5.67s/it]g-point operations will not be computed-17 16:13:18,145 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:13:24,793 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:13:18,145 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:13:24,793 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:13:18,145 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:13:24,793 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:13:18,145 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 99%|██████████████████████████████████████████████████████████████████████████████ | 881/892 [1:22:49<01:00, 5.53s/it]g-point operations will not be computed-17 16:13:18,145 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:13:29,929 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:13:18,145 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:13:32,408 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:13:18,145 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:13:32,408 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:13:18,145 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.0127, 'learning_rate': 1.224489795918367e-05, 'epoch': 0.99} +[WARNING|modeling_utils.py:388] 2022-03-17 16:13:36,184 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:13:18,145 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:13:36,184 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:13:18,145 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 99%|██████████████████████████████████████████████████████████████████████████████▏| 883/892 [1:22:59<00:47, 5.26s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:13:38,588 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:13:40,827 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:13:38,588 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 99%|██████████████████████████████████████████████████████████████████████████████▎| 884/892 [1:23:03<00:40, 5.05s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:13:43,042 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 99%|██████████████████████████████████████████████████████████████████████████████▎| 884/892 [1:23:03<00:40, 5.05s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:13:43,042 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:13:45,082 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:13:43,042 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 99%|██████████████████████████████████████████████████████████████████████████████▍| 885/892 [1:23:07<00:33, 4.78s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:13:47,107 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 99%|██████████████████████████████████���███████████████████████████████████████████▍| 885/892 [1:23:07<00:33, 4.78s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:13:47,107 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:13:48,989 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:13:47,107 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 99%|██████████████████████████████████████████████████████████████████████████████▍| 886/892 [1:23:11<00:27, 4.50s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:13:50,884 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 99%|██████████████████████████████████████████████████████████████████████████████▍| 886/892 [1:23:11<00:27, 4.50s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:13:50,884 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:13:52,606 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:13:50,884 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:13:52,606 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:13:50,884 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 99%|██████████████████████████████████████████████████████████████████████████████▌| 887/892 [1:23:15<00:21, 4.21s/it][WARNING|modeling_utils.py:388] 2022-03-17 16:13:54,307 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +100%|██████████████████████████████████████████████████████████████████████████████▋| 888/892 [1:23:18<00:15, 3.87s/it]g-point operations will not be computed-17 16:13:54,307 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +100%|██████████████████████████████████████████████████████████████████████████████▋| 888/892 [1:23:18<00:15, 3.87s/it]g-point operations will not be computed-17 16:13:54,307 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:13:58,619 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:13:57,302 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:13:58,619 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:13:57,302 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:14:01,063 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:13:59,924 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:14:01,063 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:13:59,924 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:14:03,116 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:14:02,184 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-17 16:14:03,116 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-17 16:14:02,184 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[INFO|trainer.py:2114] 2022-03-17 16:14:05,221 >> Saving model checkpoint to ./=)███| 892/892 [1:23:26<00:00, 2.44s/it][INFO|trainer.py:1492] 2022-03-17 16:14:05,218 >> 4,047 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[INFO|trainer.py:2114] 2022-03-17 16:14:05,221 >> Saving model checkpoint to ./=)███| 892/892 [1:23:26<00:00, 2.44s/it][INFO|trainer.py:1492] 2022-03-17 16:14:05,218 >> 4,047 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 3.0179, 'learning_rate': 4.591836734693877e-06, 'epoch': 1.0} +[INFO|trainer.py:2114] 2022-03-17 16:14:17,880 >> Saving model checkpoint to ./ ./pytorch_model.bin:26<00:00, 2.44s/it][INFO|trainer.py:1492] 2022-03-17 16:14:05,218 >> 4,047 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +Adding files tracked by Git LFS: ['wandb/run-20220317_145036-3tnpukko/run-3tnpukko.wandb']. This may take a bit of time if the files are large.2022-03-17 16:14:05,218 >> 4,047 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +Adding files tracked by Git LFS: ['wandb/run-20220317_145036-3tnpukko/run-3tnpukko.wandb']. This may take a bit of time if the files are large.2022-03-17 16:14:05,218 >> 4,047 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed