diff --git "a/wandb/run-20220303_033953-1eigbhyo/files/output.log" "b/wandb/run-20220303_033953-1eigbhyo/files/output.log" new file mode 100644--- /dev/null +++ "b/wandb/run-20220303_033953-1eigbhyo/files/output.log" @@ -0,0 +1,2305 @@ + + + 0%| | 0/892 [00:00> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:39:59,420 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:40:01,391 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.7965, 'learning_rate': 0.0, 'epoch': 0.0} +[WARNING|modeling_utils.py:388] 2022-03-03 03:40:03,254 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + + 0%| | 1/892 [00:08<2:01:09, 8.16s/it][WARNING|modeling_utils.py:388] 2022-03-03 03:40:05,163 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:40:06,993 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:40:08,826 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.0502, 'learning_rate': 0.0, 'epoch': 0.0} +[WARNING|modeling_utils.py:388] 2022-03-03 03:40:10,745 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + + 0%|▏ | 2/892 [00:15<1:55:12, 7.77s/it][WARNING|modeling_utils.py:388] 2022-03-03 03:40:12,607 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:40:14,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:40:16,244 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.9118, 'learning_rate': 2e-06, 'epoch': 0.0} +[WARNING|modeling_utils.py:388] 2022-03-03 03:40:18,063 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + + 0%|▎ | 3/892 [00:23<1:52:51, 7.62s/it][WARNING|modeling_utils.py:388] 2022-03-03 03:40:20,009 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:40:21,814 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:40:23,612 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.8924, 'learning_rate': 4e-06, 'epoch': 0.0} +[WARNING|modeling_utils.py:388] 2022-03-03 03:40:25,392 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 4/892 [00:30<1:50:39, 7.48s/it][WARNING|modeling_utils.py:388] 2022-03-03 03:40:27,321 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:40:29,111 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:40:30,880 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.713, 'learning_rate': 6e-06, 'epoch': 0.01} +[WARNING|modeling_utils.py:388] 2022-03-03 03:40:32,632 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + + 1%|▍ | 5/892 [00:37<1:49:17, 7.39s/it][WARNING|modeling_utils.py:388] 2022-03-03 03:40:34,548 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:40:36,343 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:40:38,147 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.7862, 'learning_rate': 8e-06, 'epoch': 0.01} +[WARNING|modeling_utils.py:388] 2022-03-03 03:40:39,891 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 6/892 [00:44<1:48:29, 7.35s/it][WARNING|modeling_utils.py:388] 2022-03-03 03:40:41,784 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:40:43,517 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:40:45,281 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.7066, 'learning_rate': 1e-05, 'epoch': 0.01} +[WARNING|modeling_utils.py:388] 2022-03-03 03:40:47,099 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + + 1%|▋ | 7/892 [00:52<1:47:41, 7.30s/it][WARNING|modeling_utils.py:388] 2022-03-03 03:40:49,006 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:40:50,749 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:40:52,520 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:40:54,288 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.5681, 'learning_rate': 1.2e-05, 'epoch': 0.01} + 1%|▋ | 8/892 [00:59<1:47:03, 7.27s/it][WARNING|modeling_utils.py:388] 2022-03-03 03:40:56,169 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:40:57,908 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:40:59,672 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.6685, 'learning_rate': 1.4e-05, 'epoch': 0.01} +[WARNING|modeling_utils.py:388] 2022-03-03 03:41:01,402 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + + 1%|▊ | 9/892 [01:06<1:46:12, 7.22s/it][WARNING|modeling_utils.py:388] 2022-03-03 03:41:03,283 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:41:05,021 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:41:06,784 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:41:08,504 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4888, 'learning_rate': 1.6e-05, 'epoch': 0.01} + 1%|▉ | 10/892 [01:13<1:45:34, 7.18s/it][WARNING|modeling_utils.py:388] 2022-03-03 03:41:10,366 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:41:12,065 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:41:13,792 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.566, 'learning_rate': 1.8e-05, 'epoch': 0.01} +[WARNING|modeling_utils.py:388] 2022-03-03 03:41:15,483 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + + 1%|▉ | 11/892 [01:20<1:44:32, 7.12s/it][WARNING|modeling_utils.py:388] 2022-03-03 03:41:17,298 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:41:18,995 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:41:20,718 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:41:22,412 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█ | 12/892 [01:27<1:43:34, 7.06s/it] + + 1%|█ | 12/892 [01:27<1:43:34, 7.06s/it][WARNING|modeling_utils.py:388] 2022-03-03 03:41:24,244 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:41:26,016 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:41:27,752 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4308, 'learning_rate': 2.2e-05, 'epoch': 0.01} +[WARNING|modeling_utils.py:388] 2022-03-03 03:41:29,495 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + + 1%|█▏ | 13/892 [01:34<1:43:33, 7.07s/it][WARNING|modeling_utils.py:388] 2022-03-03 03:41:31,319 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:41:33,065 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:41:34,811 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:41:36,547 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 14/892 [01:41<1:43:21, 7.06s/it] + + 2%|█▎ | 14/892 [01:41<1:43:21, 7.06s/it][WARNING|modeling_utils.py:388] 2022-03-03 03:41:38,426 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:41:40,160 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:41:41,841 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3274, 'learning_rate': 2.6e-05, 'epoch': 0.02} +[WARNING|modeling_utils.py:388] 2022-03-03 03:41:43,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 15/892 [01:48<1:42:49, 7.04s/it][WARNING|modeling_utils.py:388] 2022-03-03 03:41:45,302 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:41:47,010 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:41:48,688 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:41:50,355 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▍ | 16/892 [01:55<1:41:50, 6.98s/it] + + 2%|█▍ | 16/892 [01:55<1:41:50, 6.98s/it][WARNING|modeling_utils.py:388] 2022-03-03 03:41:52,141 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:41:53,817 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:41:55,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:41:57,194 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 17/892 [02:02<1:41:07, 6.93s/it] + + 2%|█▌ | 17/892 [02:02<1:41:07, 6.93s/it][WARNING|modeling_utils.py:388] 2022-03-03 03:41:58,940 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:42:00,565 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:42:02,250 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.5591, 'learning_rate': 3.2e-05, 'epoch': 0.02} +[WARNING|modeling_utils.py:388] 2022-03-03 03:42:03,916 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 18/892 [02:08<1:40:05, 6.87s/it][WARNING|modeling_utils.py:388] 2022-03-03 03:42:05,679 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:42:07,344 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:42:09,026 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2522, 'learning_rate': 3.4000000000000007e-05, 'epoch': 0.02} +[WARNING|modeling_utils.py:388] 2022-03-03 03:42:10,708 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + + 2%|█▋ | 19/892 [02:15<1:39:38, 6.85s/it][WARNING|modeling_utils.py:388] 2022-03-03 03:42:12,477 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:42:14,136 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:42:15,737 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:42:17,386 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 20/892 [02:22<1:38:46, 6.80s/it] + + 2%|█▊ | 20/892 [02:22<1:38:46, 6.80s/it][WARNING|modeling_utils.py:388] 2022-03-03 03:42:19,099 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:42:20,734 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:42:22,322 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:42:23,901 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▉ | 21/892 [02:28<1:37:26, 6.71s/it] + + 2%|█▉ | 21/892 [02:28<1:37:26, 6.71s/it][WARNING|modeling_utils.py:388] 2022-03-03 03:42:25,636 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:42:27,214 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:42:28,827 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:42:30,414 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3206, 'learning_rate': 4e-05, 'epoch': 0.02} + 2%|█▉ | 22/892 [02:35<1:36:27, 6.65s/it][WARNING|modeling_utils.py:388] 2022-03-03 03:42:32,088 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:42:33,666 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:42:35,291 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3652, 'learning_rate': 4.2000000000000004e-05, 'epoch': 0.03} +[WARNING|modeling_utils.py:388] 2022-03-03 03:42:36,867 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 23/892 [02:41<1:35:29, 6.59s/it][WARNING|modeling_utils.py:388] 2022-03-03 03:42:38,586 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:42:40,212 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:42:41,798 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:42:43,381 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 24/892 [02:48<1:35:02, 6.57s/it] + 3%|██▏ | 24/892 [02:48<1:35:02, 6.57s/it][WARNING|modeling_utils.py:388] 2022-03-03 03:42:45,049 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:42:46,604 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:42:48,173 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:42:50,259 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 25/892 [02:55<1:36:15, 6.66s/it] + 3%|██▏ | 25/892 [02:55<1:36:15, 6.66s/it][WARNING|modeling_utils.py:388] 2022-03-03 03:42:51,987 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:42:53,546 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:42:51,987 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:42:56,681 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:42:51,987 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:42:56,681 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:42:51,987 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 26/892 [03:01<1:35:06, 6.59s/it] + 3%|██▎ | 26/892 [03:01<1:35:06, 6.59s/it][WARNING|modeling_utils.py:388] 2022-03-03 03:42:58,358 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 26/892 [03:01<1:35:06, 6.59s/it][WARNING|modeling_utils.py:388] 2022-03-03 03:42:58,358 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + g-point operations will not be computed-03 03:42:58,358 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + g-point operations will not be computed-03 03:42:58,358 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 27/892 [03:07<1:33:54, 6.51s/it][WARNING|modeling_utils.py:388] 2022-03-03 03:43:04,653 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 27/892 [03:07<1:33:54, 6.51s/it][WARNING|modeling_utils.py:388] 2022-03-03 03:43:04,653 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:43:07,775 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:43:04,653 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 28/892 [03:14<1:32:58, 6.46s/it][WARNING|modeling_utils.py:388] 2022-03-03 03:43:11,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 28/892 [03:14<1:32:58, 6.46s/it][WARNING|modeling_utils.py:388] 2022-03-03 03:43:11,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1507, 'learning_rate': 5.2e-05, 'epoch': 0.03} +[WARNING|modeling_utils.py:388] 2022-03-03 03:43:14,086 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:43:11,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 29/892 [03:20<1:32:08, 6.41s/it][WARNING|modeling_utils.py:388] 2022-03-03 03:43:17,275 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 29/892 [03:20<1:32:08, 6.41s/it][WARNING|modeling_utils.py:388] 2022-03-03 03:43:17,275 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.1699, 'learning_rate': 5.4e-05, 'epoch': 0.03} +[WARNING|modeling_utils.py:388] 2022-03-03 03:43:20,284 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:43:17,275 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▋ | 30/892 [03:26<1:30:54, 6.33s/it][WARNING|modeling_utils.py:388] 2022-03-03 03:43:23,386 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▋ | 30/892 [03:26<1:30:54, 6.33s/it][WARNING|modeling_utils.py:388] 2022-03-03 03:43:23,386 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3846, 'learning_rate': 5.6e-05, 'epoch': 0.03} +[WARNING|modeling_utils.py:388] 2022-03-03 03:43:26,368 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:43:23,386 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:43:26,368 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:43:23,386 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▊ | 31/892 [03:32<1:29:47, 6.26s/it][WARNING|modeling_utils.py:388] 2022-03-03 03:43:29,464 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▊ | 31/892 [03:32<1:29:47, 6.26s/it][WARNING|modeling_utils.py:388] 2022-03-03 03:43:29,464 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 32/892 [03:38<1:28:43, 6.19s/it]g-point operations will not be computed-03 03:43:29,464 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 32/892 [03:38<1:28:43, 6.19s/it]g-point operations will not be computed-03 03:43:29,464 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 32/892 [03:38<1:28:43, 6.19s/it][WARNING|modeling_utils.py:388] 2022-03-03 03:43:35,487 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 32/892 [03:38<1:28:43, 6.19s/it][WARNING|modeling_utils.py:388] 2022-03-03 03:43:35,487 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 33/892 [03:44<1:27:39, 6.12s/it]g-point operations will not be computed-03 03:43:35,487 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 33/892 [03:44<1:27:39, 6.12s/it]g-point operations will not be computed-03 03:43:35,487 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 33/892 [03:44<1:27:39, 6.12s/it][WARNING|modeling_utils.py:388] 2022-03-03 03:43:41,393 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:43:44,213 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:43:41,393 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:43:44,213 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:43:41,393 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███ | 34/892 [03:50<1:25:55, 6.01s/it]g-point operations will not be computed-03 03:43:41,393 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███ | 34/892 [03:50<1:25:55, 6.01s/it][WARNING|modeling_utils.py:388] 2022-03-03 03:43:47,123 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:43:49,905 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:43:47,123 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:43:49,905 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:43:47,123 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 35/892 [03:56<1:24:24, 5.91s/it]g-point operations will not be computed-03 03:43:47,123 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 35/892 [03:56<1:24:24, 5.91s/it][WARNING|modeling_utils.py:388] 2022-03-03 03:43:52,807 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:43:55,575 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:43:52,807 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:43:55,575 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:43:52,807 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 36/892 [04:01<1:23:11, 5.83s/it][WARNING|modeling_utils.py:388] 2022-03-03 03:43:58,386 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 36/892 [04:01<1:23:11, 5.83s/it][WARNING|modeling_utils.py:388] 2022-03-03 03:43:58,386 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 36/892 [04:01<1:23:11, 5.83s/it][WARNING|modeling_utils.py:388] 2022-03-03 03:43:58,386 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▎ | 37/892 [04:07<1:21:19, 5.71s/it]g-point operations will not be computed-03 03:43:58,386 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▎ | 37/892 [04:07<1:21:19, 5.71s/it][WARNING|modeling_utils.py:388] 2022-03-03 03:44:03,781 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:44:06,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:44:03,781 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:44:06,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:44:03,781 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▍ | 38/892 [04:12<1:19:45, 5.60s/it][WARNING|modeling_utils.py:388] 2022-03-03 03:44:09,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▍ | 38/892 [04:12<1:19:45, 5.60s/it][WARNING|modeling_utils.py:388] 2022-03-03 03:44:09,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▍ | 39/892 [04:17<1:18:07, 5.50s/it]g-point operations will not be computed-03 03:44:09,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▍ | 39/892 [04:17<1:18:07, 5.50s/it]g-point operations will not be computed-03 03:44:09,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▍ | 39/892 [04:17<1:18:07, 5.50s/it][WARNING|modeling_utils.py:388] 2022-03-03 03:44:14,320 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:44:16,782 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:44:14,320 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:44:16,782 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:44:14,320 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▌ | 40/892 [04:22<1:16:06, 5.36s/it][WARNING|modeling_utils.py:388] 2022-03-03 03:44:19,316 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▌ | 40/892 [04:22<1:16:06, 5.36s/it][WARNING|modeling_utils.py:388] 2022-03-03 03:44:19,316 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 41/892 [04:27<1:14:14, 5.23s/it]g-point operations will not be computed-03 03:44:19,316 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 41/892 [04:27<1:14:14, 5.23s/it]g-point operations will not be computed-03 03:44:19,316 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 41/892 [04:27<1:14:14, 5.23s/it][WARNING|modeling_utils.py:388] 2022-03-03 03:44:24,184 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 42/892 [04:32<1:11:16, 5.03s/it]g-point operations will not be computed-03 03:44:24,184 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 42/892 [04:32<1:11:16, 5.03s/it]g-point operations will not be computed-03 03:44:24,184 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 42/892 [04:32<1:11:16, 5.03s/it][WARNING|modeling_utils.py:388] 2022-03-03 03:44:28,688 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + g-point operations will not be computed-03 03:44:28,688 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + g-point operations will not be computed-03 03:44:28,688 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 43/892 [04:36<1:08:06, 4.81s/it][WARNING|modeling_utils.py:388] 2022-03-03 03:44:32,913 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 44/892 [04:40<1:04:25, 4.56s/it]g-point operations will not be computed-03 03:44:32,913 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 44/892 [04:40<1:04:25, 4.56s/it]g-point operations will not be computed-03 03:44:32,913 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 44/892 [04:40<1:04:25, 4.56s/it][WARNING|modeling_utils.py:388] 2022-03-03 03:44:36,781 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|████ | 45/892 [04:44<1:00:07, 4.26s/it]g-point operations will not be computed-03 03:44:36,781 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|████ | 45/892 [04:44<1:00:07, 4.26s/it]g-point operations will not be computed-03 03:44:36,781 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:44:41,807 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:44:40,237 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:44:41,807 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:44:40,237 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|████▏ | 46/892 [04:47<55:39, 3.95s/it][WARNING|modeling_utils.py:388] 2022-03-03 03:44:43,380 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|████▎ | 47/892 [04:50<51:13, 3.64s/it]g-point operations will not be computed-03 03:44:43,380 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|████▎ | 47/892 [04:50<51:13, 3.64s/it]g-point operations will not be computed-03 03:44:43,380 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|████▍ | 48/892 [04:53<46:47, 3.33s/it]g-point operations will not be computed-03 03:44:46,210 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|████▍ | 48/892 [04:53<46:47, 3.33s/it]g-point operations will not be computed-03 03:44:46,210 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:44:49,868 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:44:48,771 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:44:49,868 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:44:48,771 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:44:52,175 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:44:51,118 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 50/892 [04:58<41:40, 2.97s/it]g-point operations will not be computed-03 03:44:51,118 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 50/892 [04:58<41:40, 2.97s/it]g-point operations will not be computed-03 03:44:51,118 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 50/892 [04:58<41:40, 2.97s/it][WARNING|modeling_utils.py:388] 2022-03-03 03:44:55,307 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 50/892 [04:58<41:40, 2.97s/it][WARNING|modeling_utils.py:388] 2022-03-03 03:44:55,307 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:44:59,047 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:44:55,307 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 51/892 [05:05<1:01:11, 4.37s/it]g-point operations will not be computed-03 03:44:55,307 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 51/892 [05:05<1:01:11, 4.37s/it]g-point operations will not be computed-03 03:44:55,307 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 51/892 [05:05<1:01:11, 4.37s/it][WARNING|modeling_utils.py:388] 2022-03-03 03:45:02,790 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 51/892 [05:05<1:01:11, 4.37s/it][WARNING|modeling_utils.py:388] 2022-03-03 03:45:02,790 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 52/892 [05:13<1:13:38, 5.26s/it]g-point operations will not be computed-03 03:45:02,790 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 52/892 [05:13<1:13:38, 5.26s/it]g-point operations will not be computed-03 03:45:02,790 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 52/892 [05:13<1:13:38, 5.26s/it][WARNING|modeling_utils.py:388] 2022-03-03 03:45:10,136 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 52/892 [05:13<1:13:38, 5.26s/it][WARNING|modeling_utils.py:388] 2022-03-03 03:45:10,136 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:45:13,772 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:45:10,136 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▊ | 53/892 [05:20<1:22:24, 5.89s/it]g-point operations will not be computed-03 03:45:10,136 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▊ | 53/892 [05:20<1:22:24, 5.89s/it]g-point operations will not be computed-03 03:45:10,136 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▊ | 53/892 [05:20<1:22:24, 5.89s/it][WARNING|modeling_utils.py:388] 2022-03-03 03:45:17,462 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▊ | 53/892 [05:20<1:22:24, 5.89s/it][WARNING|modeling_utils.py:388] 2022-03-03 03:45:17,462 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:45:20,984 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:45:17,462 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:45:20,984 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:45:17,462 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▊ | 54/892 [05:27<1:27:40, 6.28s/it][WARNING|modeling_utils.py:388] 2022-03-03 03:45:24,637 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▊ | 54/892 [05:27<1:27:40, 6.28s/it][WARNING|modeling_utils.py:388] 2022-03-03 03:45:24,637 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:45:28,175 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:45:24,637 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▉ | 55/892 [05:34<1:31:15, 6.54s/it]g-point operations will not be computed-03 03:45:24,637 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▉ | 55/892 [05:34<1:31:15, 6.54s/it]g-point operations will not be computed-03 03:45:24,637 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▉ | 55/892 [05:34<1:31:15, 6.54s/it][WARNING|modeling_utils.py:388] 2022-03-03 03:45:31,863 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▉ | 55/892 [05:34<1:31:15, 6.54s/it][WARNING|modeling_utils.py:388] 2022-03-03 03:45:31,863 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:45:35,365 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:45:31,863 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:45:35,365 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:45:31,863 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|█████ | 56/892 [05:42<1:33:52, 6.74s/it]g-point operations will not be computed-03 03:45:31,863 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|█████ | 56/892 [05:42<1:33:52, 6.74s/it][WARNING|modeling_utils.py:388] 2022-03-03 03:45:38,997 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:45:42,461 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:45:38,997 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|█████ | 57/892 [05:49<1:35:24, 6.86s/it]g-point operations will not be computed-03 03:45:38,997 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|█████ | 57/892 [05:49<1:35:24, 6.86s/it]g-point operations will not be computed-03 03:45:38,997 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|█████ | 57/892 [05:49<1:35:24, 6.86s/it][WARNING|modeling_utils.py:388] 2022-03-03 03:45:46,082 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|█████ | 57/892 [05:49<1:35:24, 6.86s/it][WARNING|modeling_utils.py:388] 2022-03-03 03:45:46,082 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:45:49,583 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:45:46,082 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:45:49,583 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:45:46,082 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 58/892 [05:56<1:36:04, 6.91s/it][WARNING|modeling_utils.py:388] 2022-03-03 03:45:53,151 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 58/892 [05:56<1:36:04, 6.91s/it][WARNING|modeling_utils.py:388] 2022-03-03 03:45:53,151 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:45:56,629 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:45:53,151 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 59/892 [06:03<1:36:45, 6.97s/it]g-point operations will not be computed-03 03:45:53,151 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 59/892 [06:03<1:36:45, 6.97s/it]g-point operations will not be computed-03 03:45:53,151 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 59/892 [06:03<1:36:45, 6.97s/it][WARNING|modeling_utils.py:388] 2022-03-03 03:46:00,183 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 59/892 [06:03<1:36:45, 6.97s/it][WARNING|modeling_utils.py:388] 2022-03-03 03:46:00,183 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:46:03,649 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:46:00,183 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:46:03,649 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:46:00,183 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▍ | 60/892 [06:10<1:36:37, 6.97s/it][WARNING|modeling_utils.py:388] 2022-03-03 03:46:07,180 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▍ | 60/892 [06:10<1:36:37, 6.97s/it][WARNING|modeling_utils.py:388] 2022-03-03 03:46:07,180 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:46:10,596 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:46:07,180 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▍ | 61/892 [06:17<1:36:21, 6.96s/it]g-point operations will not be computed-03 03:46:07,180 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▍ | 61/892 [06:17<1:36:21, 6.96s/it]g-point operations will not be computed-03 03:46:07,180 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▍ | 61/892 [06:17<1:36:21, 6.96s/it][WARNING|modeling_utils.py:388] 2022-03-03 03:46:14,100 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▍ | 61/892 [06:17<1:36:21, 6.96s/it][WARNING|modeling_utils.py:388] 2022-03-03 03:46:14,100 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▌ | 62/892 [06:24<1:36:06, 6.95s/it]g-point operations will not be computed-03 03:46:14,100 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▌ | 62/892 [06:24<1:36:06, 6.95s/it]g-point operations will not be computed-03 03:46:14,100 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▌ | 62/892 [06:24<1:36:06, 6.95s/it][WARNING|modeling_utils.py:388] 2022-03-03 03:46:20,987 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▌ | 62/892 [06:24<1:36:06, 6.95s/it][WARNING|modeling_utils.py:388] 2022-03-03 03:46:20,987 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:46:24,316 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:46:20,987 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▋ | 63/892 [06:30<1:35:13, 6.89s/it][WARNING|modeling_utils.py:388] 2022-03-03 03:46:27,747 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▋ | 63/892 [06:30<1:35:13, 6.89s/it][WARNING|modeling_utils.py:388] 2022-03-03 03:46:27,747 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2169, 'learning_rate': 0.000122, 'epoch': 0.07} +[WARNING|modeling_utils.py:388] 2022-03-03 03:46:31,135 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:46:27,747 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▋ | 64/892 [06:37<1:34:54, 6.88s/it]g-point operations will not be computed-03 03:46:27,747 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▋ | 64/892 [06:37<1:34:54, 6.88s/it]g-point operations will not be computed-03 03:46:27,747 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▋ | 64/892 [06:37<1:34:54, 6.88s/it][WARNING|modeling_utils.py:388] 2022-03-03 03:46:34,603 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:46:37,908 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:46:34,603 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:46:37,908 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:46:34,603 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▊ | 65/892 [06:44<1:34:15, 6.84s/it]g-point operations will not be computed-03 03:46:34,603 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▊ | 65/892 [06:44<1:34:15, 6.84s/it][WARNING|modeling_utils.py:388] 2022-03-03 03:46:41,300 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:46:44,551 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:46:41,300 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▉ | 66/892 [06:51<1:33:17, 6.78s/it]g-point operations will not be computed-03 03:46:41,300 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▉ | 66/892 [06:51<1:33:17, 6.78s/it]g-point operations will not be computed-03 03:46:41,300 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▉ | 66/892 [06:51<1:33:17, 6.78s/it][WARNING|modeling_utils.py:388] 2022-03-03 03:46:47,947 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▉ | 66/892 [06:51<1:33:17, 6.78s/it][WARNING|modeling_utils.py:388] 2022-03-03 03:46:47,947 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:46:51,265 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:46:47,947 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:46:51,265 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:46:47,947 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 67/892 [06:57<1:32:59, 6.76s/it][WARNING|modeling_utils.py:388] 2022-03-03 03:46:54,687 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 67/892 [06:57<1:32:59, 6.76s/it][WARNING|modeling_utils.py:388] 2022-03-03 03:46:54,687 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:46:57,943 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:46:54,687 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:46:57,943 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:46:54,687 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 68/892 [07:04<1:32:36, 6.74s/it]g-point operations will not be computed-03 03:46:54,687 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 68/892 [07:04<1:32:36, 6.74s/it][WARNING|modeling_utils.py:388] 2022-03-03 03:47:01,351 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:47:04,633 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:47:01,351 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:47:04,633 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:47:01,351 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████▏ | 69/892 [07:11<1:32:11, 6.72s/it]g-point operations will not be computed-03 03:47:01,351 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████▏ | 69/892 [07:11<1:32:11, 6.72s/it][WARNING|modeling_utils.py:388] 2022-03-03 03:47:08,087 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████▏ | 69/892 [07:11<1:32:11, 6.72s/it][WARNING|modeling_utils.py:388] 2022-03-03 03:47:08,087 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:47:11,330 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:47:08,087 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:47:11,330 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:47:08,087 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████▎ | 70/892 [07:17<1:31:42, 6.69s/it][WARNING|modeling_utils.py:388] 2022-03-03 03:47:14,657 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████▎ | 70/892 [07:17<1:31:42, 6.69s/it][WARNING|modeling_utils.py:388] 2022-03-03 03:47:14,657 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:47:17,883 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:47:14,657 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:47:17,883 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:47:14,657 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████▎ | 71/892 [07:24<1:31:02, 6.65s/it]g-point operations will not be computed-03 03:47:14,657 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████▎ | 71/892 [07:24<1:31:02, 6.65s/it][WARNING|modeling_utils.py:388] 2022-03-03 03:47:21,230 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:47:24,447 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:47:21,230 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:47:24,447 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:47:21,230 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████▍ | 72/892 [07:31<1:30:37, 6.63s/it]g-point operations will not be computed-03 03:47:21,230 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████▍ | 72/892 [07:31<1:30:37, 6.63s/it][WARNING|modeling_utils.py:388] 2022-03-03 03:47:27,753 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:47:30,937 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:47:27,753 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:47:30,937 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:47:27,753 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████▌ | 73/892 [07:37<1:29:47, 6.58s/it]g-point operations will not be computed-03 03:47:27,753 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████▌ | 73/892 [07:37<1:29:47, 6.58s/it][WARNING|modeling_utils.py:388] 2022-03-03 03:47:34,223 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:47:37,397 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:47:34,223 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:47:37,397 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:47:34,223 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████▋ | 74/892 [07:43<1:29:13, 6.54s/it]g-point operations will not be computed-03 03:47:34,223 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████▋ | 74/892 [07:43<1:29:13, 6.54s/it][WARNING|modeling_utils.py:388] 2022-03-03 03:47:40,659 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████▋ | 74/892 [07:43<1:29:13, 6.54s/it][WARNING|modeling_utils.py:388] 2022-03-03 03:47:40,659 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:47:43,745 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:47:40,659 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:47:43,745 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:47:40,659 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████▋ | 75/892 [07:50<1:30:15, 6.63s/it][WARNING|modeling_utils.py:388] 2022-03-03 03:47:47,519 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████▋ | 75/892 [07:50<1:30:15, 6.63s/it][WARNING|modeling_utils.py:388] 2022-03-03 03:47:47,519 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:47:50,624 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:47:47,519 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:47:50,624 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:47:47,519 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▊ | 76/892 [07:57<1:28:55, 6.54s/it][WARNING|modeling_utils.py:388] 2022-03-03 03:47:53,794 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▊ | 76/892 [07:57<1:28:55, 6.54s/it][WARNING|modeling_utils.py:388] 2022-03-03 03:47:53,794 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:47:56,947 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:47:53,794 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:47:56,947 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:47:53,794 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▉ | 77/892 [08:03<1:28:03, 6.48s/it][WARNING|modeling_utils.py:388] 2022-03-03 03:48:00,124 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▉ | 77/892 [08:03<1:28:03, 6.48s/it][WARNING|modeling_utils.py:388] 2022-03-03 03:48:00,124 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:48:03,166 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:48:00,124 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:48:03,166 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:48:00,124 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▉ | 78/892 [08:09<1:26:44, 6.39s/it][WARNING|modeling_utils.py:388] 2022-03-03 03:48:06,260 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|██████▉ | 78/892 [08:09<1:26:44, 6.39s/it][WARNING|modeling_utils.py:388] 2022-03-03 03:48:06,260 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:48:09,304 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:48:06,260 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:48:09,304 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:48:06,260 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|███████ | 79/892 [08:15<1:25:41, 6.32s/it][WARNING|modeling_utils.py:388] 2022-03-03 03:48:12,469 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|███████ | 79/892 [08:15<1:25:41, 6.32s/it][WARNING|modeling_utils.py:388] 2022-03-03 03:48:12,469 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:48:15,480 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:48:12,469 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:48:15,480 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:48:12,469 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|███████▏ | 80/892 [08:21<1:24:49, 6.27s/it][WARNING|modeling_utils.py:388] 2022-03-03 03:48:18,552 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|███████▏ | 80/892 [08:21<1:24:49, 6.27s/it][WARNING|modeling_utils.py:388] 2022-03-03 03:48:18,552 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:48:21,509 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:48:18,552 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:48:21,509 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:48:18,552 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|███████▎ | 81/892 [08:27<1:23:41, 6.19s/it][WARNING|modeling_utils.py:388] 2022-03-03 03:48:24,555 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|███████▎ | 81/892 [08:27<1:23:41, 6.19s/it][WARNING|modeling_utils.py:388] 2022-03-03 03:48:24,555 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:48:28,943 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:48:24,555 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:48:28,943 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:48:24,555 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2937, 'learning_rate': 0.00016, 'epoch': 0.09} +[WARNING|modeling_utils.py:388] 2022-03-03 03:48:28,943 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:48:24,555 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:48:28,943 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:48:24,555 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:48:28,943 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:48:24,555 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|███████▍ | 83/892 [08:39<1:22:00, 6.08s/it][WARNING|modeling_utils.py:388] 2022-03-03 03:48:36,455 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|███████▍ | 83/892 [08:39<1:22:00, 6.08s/it][WARNING|modeling_utils.py:388] 2022-03-03 03:48:36,455 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:48:40,653 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:48:36,455 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:48:40,653 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:48:36,455 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4215, 'learning_rate': 0.000164, 'epoch': 0.09} +[WARNING|modeling_utils.py:388] 2022-03-03 03:48:45,002 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:48:36,455 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▌ | 85/892 [08:51<1:19:33, 5.91s/it]g-point operations will not be computed-03 03:48:36,455 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▌ | 85/892 [08:51<1:19:33, 5.91s/it]g-point operations will not be computed-03 03:48:36,455 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4092, 'learning_rate': 0.00016600000000000002, 'epoch': 0.1} +[WARNING|modeling_utils.py:388] 2022-03-03 03:48:50,654 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:48:36,455 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:48:50,654 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:48:36,455 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▋ | 86/892 [08:56<1:18:11, 5.82s/it]g-point operations will not be computed-03 03:48:36,455 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:48:54,849 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:48:36,455 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:48:57,599 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:48:36,455 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:48:57,599 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:48:36,455 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3505, 'learning_rate': 0.00017, 'epoch': 0.1} +[WARNING|modeling_utils.py:388] 2022-03-03 03:49:01,619 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:48:36,455 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▉ | 88/892 [09:07<1:15:23, 5.63s/it]g-point operations will not be computed-03 03:48:36,455 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▉ | 88/892 [09:07<1:15:23, 5.63s/it]g-point operations will not be computed-03 03:48:36,455 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:49:05,655 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:48:36,455 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:49:05,655 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:48:36,455 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:49:05,655 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:48:36,455 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▉ | 89/892 [09:13<1:13:41, 5.51s/it][WARNING|modeling_utils.py:388] 2022-03-03 03:49:09,557 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▉ | 89/892 [09:13<1:13:41, 5.51s/it][WARNING|modeling_utils.py:388] 2022-03-03 03:49:09,557 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:49:13,308 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:49:09,557 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:49:13,308 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:49:09,557 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:49:15,781 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:49:09,557 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:49:18,082 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:49:09,557 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:49:18,082 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:49:09,557 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.7094, 'learning_rate': 0.000178, 'epoch': 0.1} +[WARNING|modeling_utils.py:388] 2022-03-03 03:49:21,546 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:49:09,557 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|████████▎ | 92/892 [09:27<1:06:50, 5.01s/it][WARNING|modeling_utils.py:388] 2022-03-03 03:49:23,831 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|████████▎ | 92/892 [09:27<1:06:50, 5.01s/it][WARNING|modeling_utils.py:388] 2022-03-03 03:49:23,831 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:49:25,890 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:49:23,831 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|████████▎ | 93/892 [09:31<1:03:51, 4.80s/it][WARNING|modeling_utils.py:388] 2022-03-03 03:49:28,036 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|████████▎ | 93/892 [09:31<1:03:51, 4.80s/it][WARNING|modeling_utils.py:388] 2022-03-03 03:49:28,036 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:49:29,925 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:49:28,036 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▍ | 94/892 [09:35<1:00:22, 4.54s/it][WARNING|modeling_utils.py:388] 2022-03-03 03:49:31,882 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▍ | 94/892 [09:35<1:00:22, 4.54s/it][WARNING|modeling_utils.py:388] 2022-03-03 03:49:31,882 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:49:33,690 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:49:31,882 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:49:33,690 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:49:31,882 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▋ | 95/892 [09:39<56:53, 4.28s/it][WARNING|modeling_utils.py:388] 2022-03-03 03:49:35,512 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:49:37,164 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:49:35,512 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:49:37,164 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:49:35,512 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▊ | 96/892 [09:42<53:14, 4.01s/it][WARNING|modeling_utils.py:388] 2022-03-03 03:49:38,785 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▊ | 96/892 [09:42<53:14, 4.01s/it][WARNING|modeling_utils.py:388] 2022-03-03 03:49:38,785 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▉ | 97/892 [09:45<48:55, 3.69s/it][WARNING|modeling_utils.py:388] 2022-03-03 03:49:41,661 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|█████████ | 98/892 [09:48<44:53, 3.39s/it]g-point operations will not be computed-03 03:49:41,661 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|█████████ | 98/892 [09:48<44:53, 3.39s/it]g-point operations will not be computed-03 03:49:41,661 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|█████████ | 99/892 [09:50<40:55, 3.10s/it]g-point operations will not be computed-03 03:49:44,278 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|█████████ | 99/892 [09:50<40:55, 3.10s/it]g-point operations will not be computed-03 03:49:44,278 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:49:47,602 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:49:46,626 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:49:47,602 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:49:46,626 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|█████████ | 100/892 [09:53<39:00, 2.96s/it]g-point operations will not be computed-03 03:49:46,626 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|█████████ | 100/892 [09:53<39:00, 2.96s/it][WARNING|modeling_utils.py:388] 2022-03-03 03:49:50,715 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|█████████ | 100/892 [09:53<39:00, 2.96s/it][WARNING|modeling_utils.py:388] 2022-03-03 03:49:50,715 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:49:54,506 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:49:50,715 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:49:54,506 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:49:50,715 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|█████████▏ | 101/892 [10:01<57:51, 4.39s/it][WARNING|modeling_utils.py:388] 2022-03-03 03:49:58,263 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|█████████▏ | 101/892 [10:01<57:51, 4.39s/it][WARNING|modeling_utils.py:388] 2022-03-03 03:49:58,263 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:50:01,927 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:49:58,263 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|█████████ | 102/892 [10:08<1:09:45, 5.30s/it]g-point operations will not be computed-03 03:49:58,263 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|█████████ | 102/892 [10:08<1:09:45, 5.30s/it]g-point operations will not be computed-03 03:49:58,263 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.6228, 'learning_rate': 0.0002, 'epoch': 0.11} + 11%|█████████ | 102/892 [10:08<1:09:45, 5.30s/it]g-point operations will not be computed-03 03:49:58,263 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|█████████ | 102/892 [10:08<1:09:45, 5.30s/it]g-point operations will not be computed-03 03:49:58,263 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|█████████ | 102/892 [10:08<1:09:45, 5.30s/it]g-point operations will not be computed-03 03:49:58,263 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|█████████ | 103/892 [10:15<1:17:00, 5.86s/it]g-point operations will not be computed-03 03:49:58,263 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:50:14,627 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:49:58,263 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:50:14,627 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:49:58,263 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|█████████▏ | 104/892 [10:23<1:22:21, 6.27s/it]g-point operations will not be computed-03 03:49:58,263 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|█████████▏ | 104/892 [10:23<1:22:21, 6.27s/it]g-point operations will not be computed-03 03:49:58,263 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4669, 'learning_rate': 0.000204, 'epoch': 0.12} + 12%|█████████▏ | 104/892 [10:23<1:22:21, 6.27s/it]g-point operations will not be computed-03 03:49:58,263 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|█████████▏ | 104/892 [10:23<1:22:21, 6.27s/it]g-point operations will not be computed-03 03:49:58,263 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|█████████▎ | 105/892 [10:30<1:26:06, 6.56s/it]g-point operations will not be computed-03 03:49:58,263 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|█████████▎ | 105/892 [10:30<1:26:06, 6.56s/it]g-point operations will not be computed-03 03:49:58,263 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:50:28,984 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:49:58,263 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:50:28,984 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:49:58,263 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|█████████▍ | 106/892 [10:37<1:27:53, 6.71s/it]g-point operations will not be computed-03 03:49:58,263 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|█████████▍ | 106/892 [10:37<1:27:53, 6.71s/it]g-point operations will not be computed-03 03:49:58,263 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4893, 'learning_rate': 0.000208, 'epoch': 0.12} + 12%|█████████▍ | 106/892 [10:37<1:27:53, 6.71s/it]g-point operations will not be computed-03 03:49:58,263 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|█████████▍ | 106/892 [10:37<1:27:53, 6.71s/it]g-point operations will not be computed-03 03:49:58,263 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|█████████▍ | 106/892 [10:37<1:27:53, 6.71s/it]g-point operations will not be computed-03 03:49:58,263 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|█████████▍ | 107/892 [10:44<1:28:42, 6.78s/it][WARNING|modeling_utils.py:388] 2022-03-03 03:50:41,234 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|█████████▍ | 107/892 [10:44<1:28:42, 6.78s/it][WARNING|modeling_utils.py:388] 2022-03-03 03:50:41,234 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|█████████▍ | 107/892 [10:44<1:28:42, 6.78s/it][WARNING|modeling_utils.py:388] 2022-03-03 03:50:41,234 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|█████████▌ | 108/892 [10:51<1:29:23, 6.84s/it][WARNING|modeling_utils.py:388] 2022-03-03 03:50:41,234 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|█████████▌ | 108/892 [10:51<1:29:23, 6.84s/it][WARNING|modeling_utils.py:388] 2022-03-03 03:50:41,234 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.6778, 'learning_rate': 0.000212, 'epoch': 0.12} + 12%|█████████▌ | 108/892 [10:51<1:29:23, 6.84s/it][WARNING|modeling_utils.py:388] 2022-03-03 03:50:41,234 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:50:53,472 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:50:41,234 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:50:53,472 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:50:41,234 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.2605, 'learning_rate': 0.000214, 'epoch': 0.12} +[WARNING|modeling_utils.py:388] 2022-03-03 03:50:53,472 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:50:41,234 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:50:53,472 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:50:41,234 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|█████████▋ | 110/892 [11:05<1:30:26, 6.94s/it]g-point operations will not be computed-03 03:50:41,234 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|█████████▋ | 110/892 [11:05<1:30:26, 6.94s/it]g-point operations will not be computed-03 03:50:41,234 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.431, 'learning_rate': 0.000216, 'epoch': 0.12} +[WARNING|modeling_utils.py:388] 2022-03-03 03:51:05,648 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:50:41,234 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|█████████▊ | 111/892 [11:12<1:29:57, 6.91s/it]g-point operations will not be computed-03 03:50:41,234 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|█████████▊ | 111/892 [11:12<1:29:57, 6.91s/it]g-point operations will not be computed-03 03:50:41,234 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.52, 'learning_rate': 0.000218, 'epoch': 0.12} + 12%|█████████▊ | 111/892 [11:12<1:29:57, 6.91s/it]g-point operations will not be computed-03 03:50:41,234 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:51:14,097 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:50:41,234 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:51:14,097 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:50:41,234 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.5446, 'learning_rate': 0.00022, 'epoch': 0.13} +[WARNING|modeling_utils.py:388] 2022-03-03 03:51:14,097 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:50:41,234 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:51:14,097 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:50:41,234 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|██████████ | 113/892 [11:25<1:29:06, 6.86s/it]g-point operations will not be computed-03 03:50:41,234 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|██████████ | 113/892 [11:25<1:29:06, 6.86s/it]g-point operations will not be computed-03 03:50:41,234 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:51:24,389 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:50:41,234 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:51:24,389 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:50:41,234 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|██████████ | 114/892 [11:32<1:28:41, 6.84s/it]g-point operations will not be computed-03 03:50:41,234 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|██████████ | 114/892 [11:32<1:28:41, 6.84s/it]g-point operations will not be computed-03 03:50:41,234 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.3684, 'learning_rate': 0.000224, 'epoch': 0.13} + 13%|██████████ | 114/892 [11:32<1:28:41, 6.84s/it]g-point operations will not be computed-03 03:50:41,234 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:51:34,441 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:50:41,234 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:51:34,441 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:50:41,234 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.5161, 'learning_rate': 0.00022600000000000002, 'epoch': 0.13} +[WARNING|modeling_utils.py:388] 2022-03-03 03:51:34,441 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:50:41,234 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:51:34,441 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:50:41,234 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:51:34,441 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:50:41,234 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|██████████▎ | 116/892 [11:46<1:27:26, 6.76s/it]g-point operations will not be computed-03 03:50:41,234 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:51:44,488 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:50:41,234 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:51:44,488 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:50:41,234 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:51:44,488 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:50:41,234 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|██████████▎ | 117/892 [11:52<1:27:00, 6.74s/it]g-point operations will not be computed-03 03:50:41,234 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|██████████▎ | 117/892 [11:52<1:27:00, 6.74s/it]g-point operations will not be computed-03 03:50:41,234 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:51:52,725 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:50:41,234 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:51:52,725 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:50:41,234 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|██████████▍ | 118/892 [11:59<1:26:15, 6.69s/it]g-point operations will not be computed-03 03:50:41,234 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|██████████▍ | 118/892 [11:59<1:26:15, 6.69s/it]g-point operations will not be computed-03 03:50:41,234 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|██████████▍ | 118/892 [11:59<1:26:15, 6.69s/it]g-point operations will not be computed-03 03:50:41,234 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:52:00,969 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:50:41,234 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:52:00,969 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:50:41,234 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.5091, 'learning_rate': 0.00023400000000000002, 'epoch': 0.13} +[WARNING|modeling_utils.py:388] 2022-03-03 03:52:00,969 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:50:41,234 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:52:00,969 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:50:41,234 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:52:00,969 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:50:41,234 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|██████████▋ | 120/892 [12:12<1:25:29, 6.64s/it][WARNING|modeling_utils.py:388] 2022-03-03 03:52:09,310 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|██████████▋ | 120/892 [12:12<1:25:29, 6.64s/it][WARNING|modeling_utils.py:388] 2022-03-03 03:52:09,310 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|██████████▋ | 120/892 [12:12<1:25:29, 6.64s/it][WARNING|modeling_utils.py:388] 2022-03-03 03:52:09,310 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|██████████▋ | 120/892 [12:12<1:25:29, 6.64s/it][WARNING|modeling_utils.py:388] 2022-03-03 03:52:09,310 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████▋ | 121/892 [12:19<1:25:13, 6.63s/it][WARNING|modeling_utils.py:388] 2022-03-03 03:52:09,310 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:52:17,455 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:52:09,310 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:52:17,455 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:52:09,310 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:52:17,455 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:52:09,310 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████▊ | 122/892 [12:25<1:24:19, 6.57s/it]g-point operations will not be computed-03 03:52:09,310 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:52:23,862 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:52:09,310 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:52:23,862 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:52:09,310 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:52:23,862 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:52:09,310 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████▉ | 123/892 [12:31<1:23:39, 6.53s/it]g-point operations will not be computed-03 03:52:09,310 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████▉ | 123/892 [12:31<1:23:39, 6.53s/it]g-point operations will not be computed-03 03:52:09,310 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:52:31,832 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:52:09,310 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████▉ | 124/892 [12:38<1:22:56, 6.48s/it]g-point operations will not be computed-03 03:52:09,310 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|██████████▉ | 124/892 [12:38<1:22:56, 6.48s/it]g-point operations will not be computed-03 03:52:09,310 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4989, 'learning_rate': 0.000244, 'epoch': 0.14} +[WARNING|modeling_utils.py:388] 2022-03-03 03:52:38,152 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:52:09,310 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|███████████ | 125/892 [12:45<1:24:15, 6.59s/it]g-point operations will not be computed-03 03:52:09,310 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|███████████ | 125/892 [12:45<1:24:15, 6.59s/it]g-point operations will not be computed-03 03:52:09,310 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.55, 'learning_rate': 0.000246, 'epoch': 0.14} + 14%|███████████ | 125/892 [12:45<1:24:15, 6.59s/it]g-point operations will not be computed-03 03:52:09,310 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:52:46,603 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:52:09,310 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:52:46,603 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:52:09,310 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.5464, 'learning_rate': 0.000248, 'epoch': 0.14} +[WARNING|modeling_utils.py:388] 2022-03-03 03:52:46,603 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:52:09,310 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:52:46,603 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:52:09,310 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:52:46,603 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:52:09,310 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|███████████▏ | 127/892 [12:57<1:22:36, 6.48s/it][WARNING|modeling_utils.py:388] 2022-03-03 03:52:54,626 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|███████████▏ | 127/892 [12:57<1:22:36, 6.48s/it][WARNING|modeling_utils.py:388] 2022-03-03 03:52:54,626 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|███████████▏ | 127/892 [12:57<1:22:36, 6.48s/it][WARNING|modeling_utils.py:388] 2022-03-03 03:52:54,626 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|███████████▏ | 127/892 [12:57<1:22:36, 6.48s/it][WARNING|modeling_utils.py:388] 2022-03-03 03:52:54,626 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|███████████▎ | 128/892 [13:04<1:21:19, 6.39s/it][WARNING|modeling_utils.py:388] 2022-03-03 03:53:00,792 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|███████████▎ | 128/892 [13:04<1:21:19, 6.39s/it][WARNING|modeling_utils.py:388] 2022-03-03 03:53:00,792 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|███████████▎ | 128/892 [13:04<1:21:19, 6.39s/it][WARNING|modeling_utils.py:388] 2022-03-03 03:53:00,792 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|███████████▎ | 128/892 [13:04<1:21:19, 6.39s/it][WARNING|modeling_utils.py:388] 2022-03-03 03:53:00,792 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|███████████▍ | 129/892 [13:10<1:20:28, 6.33s/it][WARNING|modeling_utils.py:388] 2022-03-03 03:53:06,906 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|███████████▍ | 129/892 [13:10<1:20:28, 6.33s/it][WARNING|modeling_utils.py:388] 2022-03-03 03:53:06,906 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|███████████▍ | 129/892 [13:10<1:20:28, 6.33s/it][WARNING|modeling_utils.py:388] 2022-03-03 03:53:06,906 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|███████████▍ | 129/892 [13:10<1:20:28, 6.33s/it][WARNING|modeling_utils.py:388] 2022-03-03 03:53:06,906 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 15%|███████████▌ | 130/892 [13:16<1:19:12, 6.24s/it][WARNING|modeling_utils.py:388] 2022-03-03 03:53:13,014 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 15%|███████████▌ | 130/892 [13:16<1:19:12, 6.24s/it][WARNING|modeling_utils.py:388] 2022-03-03 03:53:13,014 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:53:17,454 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:53:13,014 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:53:17,454 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:53:13,014 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4956, 'learning_rate': 0.00025800000000000004, 'epoch': 0.15} +[WARNING|modeling_utils.py:388] 2022-03-03 03:53:17,454 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:53:13,014 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:53:23,499 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:53:13,014 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:53:23,499 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:53:13,014 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.6595, 'learning_rate': 0.00026000000000000003, 'epoch': 0.15} +[WARNING|modeling_utils.py:388] 2022-03-03 03:53:23,499 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:53:13,014 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:53:29,389 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:53:13,014 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:53:29,389 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:53:13,014 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.5596, 'learning_rate': 0.000262, 'epoch': 0.15} +[WARNING|modeling_utils.py:388] 2022-03-03 03:53:33,721 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:53:13,014 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 15%|███████████▊ | 134/892 [13:40<1:15:19, 5.96s/it]g-point operations will not be computed-03 03:53:13,014 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 15%|███████████▊ | 134/892 [13:40<1:15:19, 5.96s/it]g-point operations will not be computed-03 03:53:13,014 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.6203, 'learning_rate': 0.000264, 'epoch': 0.15} +[WARNING|modeling_utils.py:388] 2022-03-03 03:53:39,399 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:53:13,014 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:53:39,399 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:53:13,014 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 15%|███████████▉ | 135/892 [13:45<1:14:12, 5.88s/it]g-point operations will not be computed-03 03:53:13,014 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:53:43,610 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:53:13,014 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:53:43,610 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:53:13,014 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:53:43,610 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:53:13,014 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 15%|████████████ | 136/892 [13:51<1:12:45, 5.78s/it][WARNING|modeling_utils.py:388] 2022-03-03 03:53:47,741 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:53:50,405 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:53:47,741 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:53:50,405 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:53:47,741 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 15%|████████████▏ | 137/892 [13:56<1:11:14, 5.66s/it]g-point operations will not be computed-03 03:53:47,741 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:53:54,439 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:53:47,741 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:53:54,439 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:53:47,741 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:53:54,439 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:53:47,741 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 15%|████████████▏ | 138/892 [14:01<1:09:39, 5.54s/it][WARNING|modeling_utils.py:388] 2022-03-03 03:53:58,383 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 15%|████████████▏ | 138/892 [14:01<1:09:39, 5.54s/it][WARNING|modeling_utils.py:388] 2022-03-03 03:53:58,383 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 15%|████████████▏ | 138/892 [14:01<1:09:39, 5.54s/it][WARNING|modeling_utils.py:388] 2022-03-03 03:53:58,383 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:54:02,110 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:53:58,383 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:54:04,562 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:53:58,383 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:54:06,889 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:53:58,383 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:54:06,889 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:53:58,383 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.4214, 'learning_rate': 0.00027600000000000004, 'epoch': 0.16} +[WARNING|modeling_utils.py:388] 2022-03-03 03:54:10,342 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:53:58,383 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:54:10,342 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:53:58,383 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 16%|████████████▍ | 141/892 [14:16<1:02:46, 5.02s/it][WARNING|modeling_utils.py:388] 2022-03-03 03:54:12,534 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:54:14,578 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:54:12,534 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:54:14,578 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:54:12,534 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 16%|████████████▉ | 142/892 [14:20<59:34, 4.77s/it][WARNING|modeling_utils.py:388] 2022-03-03 03:54:16,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 16%|████████████▉ | 142/892 [14:20<59:34, 4.77s/it][WARNING|modeling_utils.py:388] 2022-03-03 03:54:16,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 16%|████████████▉ | 142/892 [14:20<59:34, 4.77s/it][WARNING|modeling_utils.py:388] 2022-03-03 03:54:16,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:54:19,599 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:54:16,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:54:21,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:54:16,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:54:21,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:54:16,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:54:23,303 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:54:16,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:54:23,303 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:54:16,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:54:26,697 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:54:16,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:54:28,356 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:54:16,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:54:28,356 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:54:16,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:54:31,301 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:54:16,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:54:31,301 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:54:16,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:54:32,639 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:54:16,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:54:35,218 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:54:16,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:54:35,218 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:54:16,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:54:36,449 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:54:16,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:54:36,449 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:54:16,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:54:38,769 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:54:16,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:54:38,769 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:54:16,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:54:40,262 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:54:16,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:54:40,262 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:54:16,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:54:44,165 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:54:16,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:54:44,165 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:54:16,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:54:44,165 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:54:16,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:54:47,880 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:54:16,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:54:47,880 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:54:16,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:54:51,622 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:54:16,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:54:55,188 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:54:16,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:54:55,188 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:54:16,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.9597, 'learning_rate': 0.0003, 'epoch': 0.17} +[WARNING|modeling_utils.py:388] 2022-03-03 03:54:58,837 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:54:16,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:54:58,837 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:54:16,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:54:58,837 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:54:16,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 17%|█████████████▌ | 153/892 [15:07<1:11:04, 5.77s/it]g-point operations will not be computed-03 03:54:16,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 17%|█████████████▌ | 153/892 [15:07<1:11:04, 5.77s/it]g-point operations will not be computed-03 03:54:16,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:55:07,675 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:54:16,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 17%|█████████████▋ | 154/892 [15:14<1:16:03, 6.18s/it]g-point operations will not be computed-03 03:54:16,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 17%|█████████████▋ | 154/892 [15:14<1:16:03, 6.18s/it]g-point operations will not be computed-03 03:54:16,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.5698, 'learning_rate': 0.000304, 'epoch': 0.17} + 17%|█████████████▋ | 154/892 [15:14<1:16:03, 6.18s/it]g-point operations will not be computed-03 03:54:16,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 17%|█████████████▋ | 154/892 [15:14<1:16:03, 6.18s/it]g-point operations will not be computed-03 03:54:16,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 17%|█████████████▋ | 154/892 [15:14<1:16:03, 6.18s/it]g-point operations will not be computed-03 03:54:16,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 17%|█████████████▋ | 155/892 [15:21<1:19:17, 6.46s/it]g-point operations will not be computed-03 03:54:16,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:55:20,074 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:54:16,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:55:20,074 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:54:16,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 17%|█████████████▊ | 156/892 [15:28<1:21:17, 6.63s/it]g-point operations will not be computed-03 03:54:16,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 17%|█████████████▊ | 156/892 [15:28<1:21:17, 6.63s/it]g-point operations will not be computed-03 03:54:16,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.7222, 'learning_rate': 0.000308, 'epoch': 0.17} + 17%|█████████████▊ | 156/892 [15:28<1:21:17, 6.63s/it]g-point operations will not be computed-03 03:54:16,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:55:30,541 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:54:16,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:55:30,541 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:54:16,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.0516, 'learning_rate': 0.00031, 'epoch': 0.18} +[WARNING|modeling_utils.py:388] 2022-03-03 03:55:30,541 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:54:16,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:55:30,541 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:54:16,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 18%|█████████████▉ | 158/892 [15:42<1:23:25, 6.82s/it]g-point operations will not be computed-03 03:54:16,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 18%|█████████████▉ | 158/892 [15:42<1:23:25, 6.82s/it]g-point operations will not be computed-03 03:54:16,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.8873, 'learning_rate': 0.000312, 'epoch': 0.18} + 18%|█████████████▉ | 158/892 [15:42<1:23:25, 6.82s/it]g-point operations will not be computed-03 03:54:16,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:55:44,566 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:54:16,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:55:44,566 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:54:16,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.9982, 'learning_rate': 0.000314, 'epoch': 0.18} +[WARNING|modeling_utils.py:388] 2022-03-03 03:55:44,566 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:54:16,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:55:44,566 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:54:16,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:55:44,566 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:54:16,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 18%|██████████████▏ | 160/892 [15:56<1:24:11, 6.90s/it]g-point operations will not be computed-03 03:54:16,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:55:54,982 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:54:16,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:55:54,982 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:54:16,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 18%|████��█████████▎ | 161/892 [16:03<1:23:42, 6.87s/it]g-point operations will not be computed-03 03:54:16,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 18%|██████████████▎ | 161/892 [16:03<1:23:42, 6.87s/it]g-point operations will not be computed-03 03:54:16,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.6326, 'learning_rate': 0.00031800000000000003, 'epoch': 0.18} + 18%|██████████████▎ | 161/892 [16:03<1:23:42, 6.87s/it]g-point operations will not be computed-03 03:54:16,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 18%|██████████████▎ | 161/892 [16:03<1:23:42, 6.87s/it]g-point operations will not be computed-03 03:54:16,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 18%|██████████████▎ | 161/892 [16:03<1:23:42, 6.87s/it]g-point operations will not be computed-03 03:54:16,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 18%|██████████████▎ | 162/892 [16:10<1:23:22, 6.85s/it][WARNING|modeling_utils.py:388] 2022-03-03 03:56:06,920 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 18%|██████████████▎ | 162/892 [16:10<1:23:22, 6.85s/it][WARNING|modeling_utils.py:388] 2022-03-03 03:56:06,920 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 18%|██████████████▎ | 162/892 [16:10<1:23:22, 6.85s/it][WARNING|modeling_utils.py:388] 2022-03-03 03:56:06,920 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 18%|██████████████▎ | 162/892 [16:10<1:23:22, 6.85s/it][WARNING|modeling_utils.py:388] 2022-03-03 03:56:06,920 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 18%|██████████████▍ | 163/892 [16:16<1:22:55, 6.83s/it][WARNING|modeling_utils.py:388] 2022-03-03 03:56:06,920 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:56:15,328 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:56:06,920 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:56:15,328 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:56:06,920 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 18%|██████████████▌ | 164/892 [16:23<1:22:31, 6.80s/it]g-point operations will not be computed-03 03:56:06,920 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 18%|██████████████▌ | 164/892 [16:23<1:22:31, 6.80s/it]g-point operations will not be computed-03 03:56:06,920 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.8179, 'learning_rate': 0.000324, 'epoch': 0.18} + 18%|██████████████▌ | 164/892 [16:23<1:22:31, 6.80s/it]g-point operations will not be computed-03 03:56:06,920 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:56:25,404 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:56:06,920 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:56:25,404 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:56:06,920 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.6294, 'learning_rate': 0.000326, 'epoch': 0.18} +[WARNING|modeling_utils.py:388] 2022-03-03 03:56:25,404 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:56:06,920 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:56:25,404 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:56:06,920 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:56:25,404 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:56:06,920 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 19%|██████████████▋ | 166/892 [16:37<1:21:39, 6.75s/it][WARNING|modeling_utils.py:388] 2022-03-03 03:56:33,769 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 19%|██████████████▋ | 166/892 [16:37<1:21:39, 6.75s/it][WARNING|modeling_utils.py:388] 2022-03-03 03:56:33,769 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 19%|██████████████▋ | 166/892 [16:37<1:21:39, 6.75s/it][WARNING|modeling_utils.py:388] 2022-03-03 03:56:33,769 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 19%|██████████████▊ | 167/892 [16:43<1:21:01, 6.71s/it][WARNING|modeling_utils.py:388] 2022-03-03 03:56:33,769 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 19%|██████████████▊ | 167/892 [16:43<1:21:01, 6.71s/it][WARNING|modeling_utils.py:388] 2022-03-03 03:56:33,769 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:56:41,994 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:56:33,769 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:56:41,994 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:56:33,769 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 19%|██████████████▉ | 168/892 [16:50<1:20:26, 6.67s/it]g-point operations will not be computed-03 03:56:33,769 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 19%|██████████████▉ | 168/892 [16:50<1:20:26, 6.67s/it]g-point operations will not be computed-03 03:56:33,769 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.5294, 'learning_rate': 0.00033200000000000005, 'epoch': 0.19} +[WARNING|modeling_utils.py:388] 2022-03-03 03:56:50,151 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:56:33,769 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 19%|██████████████▉ | 169/892 [16:56<1:19:40, 6.61s/it]g-point operations will not be computed-03 03:56:33,769 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 19%|██████████████▉ | 169/892 [16:56<1:19:40, 6.61s/it]g-point operations will not be computed-03 03:56:33,769 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.4458, 'learning_rate': 0.00033400000000000004, 'epoch': 0.19} +[WARNING|modeling_utils.py:388] 2022-03-03 03:56:56,661 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:56:33,769 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 19%|███████████████ | 170/892 [17:03<1:19:26, 6.60s/it]g-point operations will not be computed-03 03:56:33,769 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 19%|███████████████ | 170/892 [17:03<1:19:26, 6.60s/it]g-point operations will not be computed-03 03:56:33,769 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.7599, 'learning_rate': 0.00033600000000000004, 'epoch': 0.19} + 19%|███████████████ | 170/892 [17:03<1:19:26, 6.60s/it]g-point operations will not be computed-03 03:56:33,769 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:57:04,814 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:56:33,769 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:57:04,814 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:56:33,769 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.8152, 'learning_rate': 0.00033800000000000003, 'epoch': 0.19} +[WARNING|modeling_utils.py:388] 2022-03-03 03:57:04,814 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:56:33,769 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:57:04,814 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:56:33,769 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 19%|███████████████▏ | 172/892 [17:16<1:18:35, 6.55s/it]g-point operations will not be computed-03 03:56:33,769 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 19%|███████████████▏ | 172/892 [17:16<1:18:35, 6.55s/it]g-point operations will not be computed-03 03:56:33,769 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:57:14,595 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:56:33,769 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:57:14,595 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:56:33,769 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 19%|███████████████▎ | 173/892 [17:22<1:17:54, 6.50s/it]g-point operations will not be computed-03 03:56:33,769 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 19%|███████████████▎ | 173/892 [17:22<1:17:54, 6.50s/it]g-point operations will not be computed-03 03:56:33,769 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:57:20,905 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:56:33,769 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:57:20,905 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:56:33,769 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 20%|███████████████▍ | 174/892 [17:28<1:17:05, 6.44s/it]g-point operations will not be computed-03 03:56:33,769 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 20%|███████████████▍ | 174/892 [17:28<1:17:05, 6.44s/it]g-point operations will not be computed-03 03:56:33,769 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:57:27,194 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:56:33,769 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:57:27,194 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:56:33,769 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 20%|███████████████▍ | 175/892 [17:35<1:18:15, 6.55s/it]g-point operations will not be computed-03 03:56:33,769 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 20%|███████████████▍ | 175/892 [17:35<1:18:15, 6.55s/it]g-point operations will not be computed-03 03:56:33,769 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.5978, 'learning_rate': 0.000346, 'epoch': 0.2} +[WARNING|modeling_utils.py:388] 2022-03-03 03:57:35,567 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:56:33,769 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 20%|███████████████▌ | 176/892 [17:42<1:17:18, 6.48s/it]g-point operations will not be computed-03 03:56:33,769 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 20%|███████████████▌ | 176/892 [17:42<1:17:18, 6.48s/it]g-point operations will not be computed-03 03:56:33,769 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.6663, 'learning_rate': 0.000348, 'epoch': 0.2} + 20%|███████████████▌ | 176/892 [17:42<1:17:18, 6.48s/it]g-point operations will not be computed-03 03:56:33,769 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 20%|███████████████▌ | 176/892 [17:42<1:17:18, 6.48s/it]g-point operations will not be computed-03 03:56:33,769 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:57:43,259 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:56:33,769 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:57:43,259 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:56:33,769 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:57:43,259 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:56:33,769 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:57:43,259 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:56:33,769 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:57:49,403 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:56:33,769 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:57:49,403 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:56:33,769 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:57:49,403 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:56:33,769 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:57:49,403 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:56:33,769 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:57:55,433 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:56:33,769 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:57:55,433 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:56:33,769 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:58:00,061 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:56:33,769 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:58:00,061 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:56:33,769 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 20%|███████████████▉ | 180/892 [18:06<1:13:24, 6.19s/it]g-point operations will not be computed-03 03:56:33,769 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 20%|███████████████▉ | 180/892 [18:06<1:13:24, 6.19s/it]g-point operations will not be computed-03 03:56:33,769 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:58:06,039 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:56:33,769 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:58:06,039 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:56:33,769 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 20%|████████████████ | 181/892 [18:12<1:12:30, 6.12s/it]g-point operations will not be computed-03 03:56:33,769 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 20%|████████████████ | 181/892 [18:12<1:12:30, 6.12s/it]g-point operations will not be computed-03 03:56:33,769 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:58:11,956 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:56:33,769 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:58:11,956 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:56:33,769 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 20%|████████████████ | 182/892 [18:18<1:11:50, 6.07s/it]g-point operations will not be computed-03 03:56:33,769 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 20%|████████████████ | 182/892 [18:18<1:11:50, 6.07s/it]g-point operations will not be computed-03 03:56:33,769 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:58:17,818 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:56:33,769 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:58:17,818 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:56:33,769 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 21%|████████████████▏ | 183/892 [18:24<1:10:45, 5.99s/it]g-point operations will not be computed-03 03:56:33,769 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:58:22,129 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:56:33,769 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:58:22,129 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:56:33,769 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:58:22,129 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:56:33,769 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 21%|████████████████▎ | 184/892 [18:29<1:09:32, 5.89s/it]g-point operations will not be computed-03 03:56:33,769 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:58:27,752 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:56:33,769 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:58:30,476 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:56:33,769 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:58:30,476 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:56:33,769 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.8057, 'learning_rate': 0.000366, 'epoch': 0.21} +[WARNING|modeling_utils.py:388] 2022-03-03 03:58:34,609 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:56:33,769 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:58:34,609 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:56:33,769 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 21%|████████████████▍ | 186/892 [18:40<1:07:02, 5.70s/it]g-point operations will not be computed-03 03:56:33,769 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:58:38,686 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:56:33,769 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:58:38,686 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:56:33,769 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:58:38,686 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:56:33,769 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 21%|████████████████▌ | 187/892 [18:46<1:05:53, 5.61s/it][WARNING|modeling_utils.py:388] 2022-03-03 03:58:42,793 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 21%|████████████████▌ | 187/892 [18:46<1:05:53, 5.61s/it][WARNING|modeling_utils.py:388] 2022-03-03 03:58:42,793 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:58:46,678 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:58:42,793 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:58:46,678 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:58:42,793 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.5574, 'learning_rate': 0.000372, 'epoch': 0.21} +[WARNING|modeling_utils.py:388] 2022-03-03 03:58:50,597 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:58:42,793 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:58:50,597 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:58:42,793 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 21%|████████████████▋ | 189/892 [18:56<1:03:24, 5.41s/it]g-point operations will not be computed-03 03:58:42,793 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:58:54,391 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:58:42,793 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:58:56,826 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:58:42,793 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:58:56,826 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:58:42,793 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.6756, 'learning_rate': 0.00037600000000000003, 'epoch': 0.21} +[WARNING|modeling_utils.py:388] 2022-03-03 03:59:00,510 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:58:42,793 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:59:00,510 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:58:42,793 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 21%|████████████████▉ | 191/892 [19:06<1:00:11, 5.15s/it][WARNING|modeling_utils.py:388] 2022-03-03 03:59:02,887 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:59:05,088 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:59:02,887 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:59:05,088 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:59:02,887 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 22%|█████████████████▍ | 192/892 [19:11<57:53, 4.96s/it]g-point operations will not be computed-03 03:59:02,887 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:59:08,422 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:59:02,887 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:59:08,422 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:59:02,887 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:59:10,492 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:59:02,887 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:59:12,564 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:59:02,887 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:59:12,564 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:59:02,887 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:59:14,413 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:59:02,887 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:59:16,319 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:59:02,887 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:59:16,319 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:59:02,887 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:59:18,031 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:59:02,887 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:59:21,388 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:59:02,887 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:59:21,388 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:59:02,887 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:59:22,935 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:59:02,887 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:59:22,935 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:59:02,887 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:59:24,248 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:59:02,887 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:59:26,775 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:59:02,887 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:59:26,775 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:59:02,887 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:59:29,047 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:59:02,887 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:59:29,047 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:59:02,887 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:59:30,152 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:59:02,887 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:59:30,152 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:59:02,887 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:59:31,658 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:59:02,887 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:59:35,545 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:59:02,887 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:59:35,545 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:59:02,887 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:59:39,221 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:59:02,887 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:59:39,221 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:59:02,887 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.9359, 'learning_rate': 0.000398, 'epoch': 0.23} +[WARNING|modeling_utils.py:388] 2022-03-03 03:59:42,940 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:59:02,887 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:59:42,940 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:59:02,887 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:59:42,940 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:59:02,887 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:59:46,562 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:59:02,887 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:59:46,562 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:59:02,887 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 03:59:52,032 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:59:02,887 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 23%|█████████████████▉ | 203/892 [19:58<1:06:47, 5.82s/it]g-point operations will not be computed-03 03:59:02,887 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 23%|█████████████████▉ | 203/892 [19:58<1:06:47, 5.82s/it]g-point operations will not be computed-03 03:59:02,887 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.4457, 'learning_rate': 0.000402, 'epoch': 0.23} + 23%|█████████████████▉ | 203/892 [19:58<1:06:47, 5.82s/it]g-point operations will not be computed-03 03:59:02,887 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 23%|█████████████████▉ | 203/892 [19:58<1:06:47, 5.82s/it]g-point operations will not be computed-03 03:59:02,887 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 23%|█████████████████▉ | 203/892 [19:58<1:06:47, 5.82s/it]g-point operations will not be computed-03 03:59:02,887 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 23%|██████████████████ | 204/892 [20:05<1:11:02, 6.20s/it]g-point operations will not be computed-03 03:59:02,887 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:00:04,451 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:59:02,887 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:00:04,451 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 03:59:02,887 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 23%|██████████████████▏ | 205/892 [20:12<1:13:49, 6.45s/it]g-point operations will not be computed-03 03:59:02,887 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 23%|██████████████████▏ | 205/892 [20:12<1:13:49, 6.45s/it]g-point operations will not be computed-03 03:59:02,887 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.7054, 'learning_rate': 0.00040600000000000006, 'epoch': 0.23} + 23%|██████████████████▏ | 205/892 [20:12<1:13:49, 6.45s/it]g-point operations will not be computed-03 03:59:02,887 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 23%|██████████████████▏ | 205/892 [20:12<1:13:49, 6.45s/it]g-point operations will not be computed-03 03:59:02,887 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 23%|██████████████████▏ | 205/892 [20:12<1:13:49, 6.45s/it]g-point operations will not be computed-03 03:59:02,887 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 23%|██████████████████▏ | 206/892 [20:20<1:16:04, 6.65s/it][WARNING|modeling_utils.py:388] 2022-03-03 04:00:16,881 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 23%|██████████████████▏ | 206/892 [20:20<1:16:04, 6.65s/it][WARNING|modeling_utils.py:388] 2022-03-03 04:00:16,881 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 23%|██████████████████▏ | 206/892 [20:20<1:16:04, 6.65s/it][WARNING|modeling_utils.py:388] 2022-03-03 04:00:16,881 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 23%|██████████████████▎ | 207/892 [20:27<1:17:16, 6.77s/it][WARNING|modeling_utils.py:388] 2022-03-03 04:00:16,881 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 23%|██████████████████▎ | 207/892 [20:27<1:17:16, 6.77s/it][WARNING|modeling_utils.py:388] 2022-03-03 04:00:16,881 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.7219, 'learning_rate': 0.00041, 'epoch': 0.23} +[WARNING|modeling_utils.py:388] 2022-03-03 04:00:27,338 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:00:16,881 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 23%|██████████████████▍ | 208/892 [20:34<1:17:57, 6.84s/it]g-point operations will not be computed-03 04:00:16,881 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 23%|██████████████████▍ | 208/892 [20:34<1:17:57, 6.84s/it]g-point operations will not be computed-03 04:00:16,881 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.5005, 'learning_rate': 0.000412, 'epoch': 0.23} + 23%|██████████████████▍ | 208/892 [20:34<1:17:57, 6.84s/it]g-point operations will not be computed-03 04:00:16,881 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 23%|██████████████████▍ | 208/892 [20:34<1:17:57, 6.84s/it]g-point operations will not be computed-03 04:00:16,881 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 23%|██████████████████▌ | 209/892 [20:40<1:18:05, 6.86s/it]g-point operations will not be computed-03 04:00:16,881 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 23%|██████████████████▌ | 209/892 [20:40<1:18:05, 6.86s/it]g-point operations will not be computed-03 04:00:16,881 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.7144, 'learning_rate': 0.000414, 'epoch': 0.23} +[WARNING|modeling_utils.py:388] 2022-03-03 04:00:41,253 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:00:16,881 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 24%|██████████████████▌ | 210/892 [20:47<1:18:14, 6.88s/it]g-point operations will not be computed-03 04:00:16,881 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 24%|██████████████████▌ | 210/892 [20:47<1:18:14, 6.88s/it]g-point operations will not be computed-03 04:00:16,881 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.8477, 'learning_rate': 0.000416, 'epoch': 0.24} + 24%|██████████████████▌ | 210/892 [20:47<1:18:14, 6.88s/it]g-point operations will not be computed-03 04:00:16,881 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:00:49,863 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:00:16,881 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:00:49,863 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:00:16,881 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:00:49,863 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:00:16,881 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:00:53,301 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:00:16,881 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:00:53,301 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:00:16,881 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 24%|██████████████████▊ | 212/892 [21:01<1:17:42, 6.86s/it]g-point operations will not be computed-03 04:00:16,881 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 24%|██████████████████▊ | 212/892 [21:01<1:17:42, 6.86s/it]g-point operations will not be computed-03 04:00:16,881 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.8034, 'learning_rate': 0.00042, 'epoch': 0.24} + 24%|██████████████████▊ | 212/892 [21:01<1:17:42, 6.86s/it]g-point operations will not be computed-03 04:00:16,881 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:01:03,470 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:00:16,881 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:01:03,470 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:00:16,881 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.9817, 'learning_rate': 0.000422, 'epoch': 0.24} +[WARNING|modeling_utils.py:388] 2022-03-03 04:01:03,470 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:00:16,881 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:01:03,470 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:00:16,881 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 24%|██████████████████▉ | 214/892 [21:15<1:17:02, 6.82s/it][WARNING|modeling_utils.py:388] 2022-03-03 04:01:12,047 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 24%|██████████████████▉ | 214/892 [21:15<1:17:02, 6.82s/it][WARNING|modeling_utils.py:388] 2022-03-03 04:01:12,047 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.8543, 'learning_rate': 0.000424, 'epoch': 0.24} + 24%|██████████████████▉ | 214/892 [21:15<1:17:02, 6.82s/it][WARNING|modeling_utils.py:388] 2022-03-03 04:01:12,047 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 24%|███████████████████ | 215/892 [21:21<1:16:57, 6.82s/it][WARNING|modeling_utils.py:388] 2022-03-03 04:01:12,047 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 24%|███████████████████ | 215/892 [21:21<1:16:57, 6.82s/it][WARNING|modeling_utils.py:388] 2022-03-03 04:01:12,047 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:01:20,405 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:01:12,047 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:01:20,405 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:01:12,047 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 24%|███████████████████▏ | 216/892 [21:28<1:16:21, 6.78s/it]g-point operations will not be computed-03 04:01:12,047 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 24%|███████████████████▏ | 216/892 [21:28<1:16:21, 6.78s/it]g-point operations will not be computed-03 04:01:12,047 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.8308, 'learning_rate': 0.000428, 'epoch': 0.24} + 24%|███████████████████▏ | 216/892 [21:28<1:16:21, 6.78s/it]g-point operations will not be computed-03 04:01:12,047 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 24%|███████████████████▏ | 216/892 [21:28<1:16:21, 6.78s/it]g-point operations will not be computed-03 04:01:12,047 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:01:30,301 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:01:12,047 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:01:30,301 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:01:12,047 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:01:30,301 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:01:12,047 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:01:30,301 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:01:12,047 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:01:30,301 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:01:12,047 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 24%|███████████████████▎ | 218/892 [21:41<1:15:08, 6.69s/it][WARNING|modeling_utils.py:388] 2022-03-03 04:01:38,639 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 24%|███████████████████▎ | 218/892 [21:41<1:15:08, 6.69s/it][WARNING|modeling_utils.py:388] 2022-03-03 04:01:38,639 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 24%|███████████████████▎ | 218/892 [21:41<1:15:08, 6.69s/it][WARNING|modeling_utils.py:388] 2022-03-03 04:01:38,639 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 24%|███████████████████▎ | 218/892 [21:41<1:15:08, 6.69s/it][WARNING|modeling_utils.py:388] 2022-03-03 04:01:38,639 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 25%|███████████████████▍ | 219/892 [21:48<1:14:30, 6.64s/it][WARNING|modeling_utils.py:388] 2022-03-03 04:01:38,639 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:01:46,778 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:01:38,639 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:01:46,778 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:01:38,639 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:01:46,778 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:01:38,639 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 25%|███████████████████▍ | 220/892 [21:55<1:14:17, 6.63s/it]g-point operations will not be computed-03 04:01:38,639 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:01:53,394 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:01:38,639 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:01:53,394 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:01:38,639 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:01:53,394 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:01:38,639 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 25%|███████████████████▌ | 221/892 [22:01<1:13:48, 6.60s/it]g-point operations will not be computed-03 04:01:38,639 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 25%|███████████████████▌ | 221/892 [22:01<1:13:48, 6.60s/it]g-point operations will not be computed-03 04:01:38,639 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 25%|███████████████████▌ | 221/892 [22:01<1:13:48, 6.60s/it]g-point operations will not be computed-03 04:01:38,639 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:02:03,050 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:01:38,639 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:02:03,050 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:01:38,639 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.7249, 'learning_rate': 0.00044, 'epoch': 0.25} +[WARNING|modeling_utils.py:388] 2022-03-03 04:02:03,050 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:01:38,639 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:02:09,464 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:01:38,639 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:02:09,464 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:01:38,639 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.9072, 'learning_rate': 0.000442, 'epoch': 0.25} +[WARNING|modeling_utils.py:388] 2022-03-03 04:02:09,464 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:01:38,639 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:02:09,464 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:01:38,639 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:02:09,464 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:01:38,639 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 25%|███████████████████▊ | 224/892 [22:20<1:12:01, 6.47s/it][WARNING|modeling_utils.py:388] 2022-03-03 04:02:17,436 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 25%|███████████████████▊ | 224/892 [22:20<1:12:01, 6.47s/it][WARNING|modeling_utils.py:388] 2022-03-03 04:02:17,436 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 25%|███████████████████▊ | 224/892 [22:20<1:12:01, 6.47s/it][WARNING|modeling_utils.py:388] 2022-03-03 04:02:17,436 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 25%|███████████████████▊ | 224/892 [22:20<1:12:01, 6.47s/it][WARNING|modeling_utils.py:388] 2022-03-03 04:02:17,436 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 25%|███████████████████▉ | 225/892 [22:27<1:12:46, 6.55s/it][WARNING|modeling_utils.py:388] 2022-03-03 04:02:17,436 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:02:25,793 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:02:17,436 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:02:25,793 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:02:17,436 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:02:25,793 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:02:17,436 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 25%|████████████████████ | 226/892 [22:33<1:11:58, 6.48s/it]g-point operations will not be computed-03 04:02:17,436 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:02:32,166 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:02:17,436 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:02:32,166 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:02:17,436 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:02:32,166 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:02:17,436 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 25%|████████████████████ | 227/892 [22:40<1:11:01, 6.41s/it]g-point operations will not be computed-03 04:02:17,436 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:02:38,240 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:02:17,436 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:02:38,240 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:02:17,436 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:02:38,240 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:02:17,436 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 26%|████████████████████▏ | 228/892 [22:46<1:10:03, 6.33s/it]g-point operations will not be computed-03 04:02:17,436 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:02:44,385 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:02:17,436 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:02:44,385 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:02:17,436 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:02:44,385 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:02:17,436 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 26%|████████████████████▎ | 229/892 [22:52<1:09:08, 6.26s/it]g-point operations will not be computed-03 04:02:17,436 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:02:50,391 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:02:17,436 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:02:50,391 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:02:17,436 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:02:50,391 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:02:17,436 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 26%|████████████████████▎ | 230/892 [22:58<1:08:19, 6.19s/it][WARNING|modeling_utils.py:388] 2022-03-03 04:02:54,977 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 26%|████████████████████▎ | 230/892 [22:58<1:08:19, 6.19s/it][WARNING|modeling_utils.py:388] 2022-03-03 04:02:54,977 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 26%|████████████████████▎ | 230/892 [22:58<1:08:19, 6.19s/it][WARNING|modeling_utils.py:388] 2022-03-03 04:02:54,977 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 26%|████████████████████▎ | 230/892 [22:58<1:08:19, 6.19s/it][WARNING|modeling_utils.py:388] 2022-03-03 04:02:54,977 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 26%|████████████████████▍ | 231/892 [23:04<1:07:40, 6.14s/it][WARNING|modeling_utils.py:388] 2022-03-03 04:03:01,008 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 26%|████████████████████▍ | 231/892 [23:04<1:07:40, 6.14s/it][WARNING|modeling_utils.py:388] 2022-03-03 04:03:01,008 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 26%|████████████████████▍ | 231/892 [23:04<1:07:40, 6.14s/it][WARNING|modeling_utils.py:388] 2022-03-03 04:03:01,008 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 26%|████████████████████▍ | 231/892 [23:04<1:07:40, 6.14s/it][WARNING|modeling_utils.py:388] 2022-03-03 04:03:01,008 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 26%|████████████████████▌ | 232/892 [23:10<1:07:02, 6.10s/it][WARNING|modeling_utils.py:388] 2022-03-03 04:03:01,008 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:03:08,374 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:03:01,008 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:03:08,374 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:03:01,008 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:03:08,374 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:03:01,008 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 26%|████████████████████▋ | 233/892 [23:16<1:05:58, 6.01s/it][WARNING|modeling_utils.py:388] 2022-03-03 04:03:12,714 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 26%|████████████████████▋ | 233/892 [23:16<1:05:58, 6.01s/it][WARNING|modeling_utils.py:388] 2022-03-03 04:03:12,714 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:03:16,868 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:03:12,714 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:03:16,868 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:03:12,714 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.9863, 'learning_rate': 0.00046400000000000006, 'epoch': 0.26} +[WARNING|modeling_utils.py:388] 2022-03-03 04:03:21,079 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:03:12,714 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 26%|████████████████████▊ | 235/892 [23:27<1:03:37, 5.81s/it]g-point operations will not be computed-03 04:03:12,714 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 26%|████████████████████▊ | 235/892 [23:27<1:03:37, 5.81s/it]g-point operations will not be computed-03 04:03:12,714 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:03:25,300 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:03:12,714 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:03:25,300 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:03:12,714 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:03:25,300 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:03:12,714 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 26%|████████████████████▉ | 236/892 [23:32<1:02:34, 5.72s/it][WARNING|modeling_utils.py:388] 2022-03-03 04:03:29,406 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 26%|████████████████████▉ | 236/892 [23:32<1:02:34, 5.72s/it][WARNING|modeling_utils.py:388] 2022-03-03 04:03:29,406 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:03:33,374 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:03:29,406 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:03:33,374 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:03:29,406 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.703, 'learning_rate': 0.00047, 'epoch': 0.27} +[WARNING|modeling_utils.py:388] 2022-03-03 04:03:37,362 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:03:29,406 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 27%|█████████████████████ | 238/892 [23:43<1:00:11, 5.52s/it]g-point operations will not be computed-03 04:03:29,406 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 27%|█████████████████████ | 238/892 [23:43<1:00:11, 5.52s/it]g-point operations will not be computed-03 04:03:29,406 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:03:41,314 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:03:29,406 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:03:41,314 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:03:29,406 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:03:41,314 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:03:29,406 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 27%|█████████████████████▋ | 239/892 [23:48<58:53, 5.41s/it][WARNING|modeling_utils.py:388] 2022-03-03 04:03:45,156 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:03:47,615 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:03:45,156 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 27%|█████████████████████▊ | 240/892 [23:53<57:24, 5.28s/it]g-point operations will not be computed-03 04:03:45,156 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 27%|█████████████████████▊ | 240/892 [23:53<57:24, 5.28s/it]g-point operations will not be computed-03 04:03:45,156 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:03:51,271 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:03:45,156 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:03:53,569 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:03:45,156 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:03:53,569 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:03:45,156 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:03:55,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:03:45,156 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:03:57,927 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:03:45,156 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:03:57,927 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:03:45,156 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.3981, 'learning_rate': 0.00048, 'epoch': 0.27} +[WARNING|modeling_utils.py:388] 2022-03-03 04:04:01,120 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:03:45,156 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:04:01,120 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:03:45,156 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 27%|██████████████████████ | 243/892 [24:07<50:35, 4.68s/it][WARNING|modeling_utils.py:388] 2022-03-03 04:04:03,151 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 27%|██████████████████████▏ | 244/892 [24:10<47:43, 4.42s/it]g-point operations will not be computed-03 04:04:03,151 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 27%|██████████████████████▏ | 244/892 [24:10<47:43, 4.42s/it]g-point operations will not be computed-03 04:04:03,151 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 27%|██████████████████████▏ | 244/892 [24:10<47:43, 4.42s/it][WARNING|modeling_utils.py:388] 2022-03-03 04:04:06,894 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 27%|██████████████████████▏ | 245/892 [24:14<44:50, 4.16s/it]g-point operations will not be computed-03 04:04:06,894 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 27%|██████████████████████▏ | 245/892 [24:14<44:50, 4.16s/it]g-point operations will not be computed-03 04:04:06,894 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:04:11,931 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:04:10,371 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 28%|██████████████████████▎ | 246/892 [24:17<41:45, 3.88s/it][WARNING|modeling_utils.py:388] 2022-03-03 04:04:13,544 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 28%|██████████████████████▎ | 246/892 [24:17<41:45, 3.88s/it][WARNING|modeling_utils.py:388] 2022-03-03 04:04:13,544 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 28%|██████████████████████▍ | 247/892 [24:20<38:34, 3.59s/it]g-point operations will not be computed-03 04:04:13,544 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 28%|██████████████████████▍ | 247/892 [24:20<38:34, 3.59s/it]g-point operations will not be computed-03 04:04:13,544 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 28%|██████████████████████▌ | 248/892 [24:23<35:20, 3.29s/it]g-point operations will not be computed-03 04:04:16,338 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 28%|██████████████████████▌ | 248/892 [24:23<35:20, 3.29s/it]g-point operations will not be computed-03 04:04:16,338 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:04:19,947 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:04:18,859 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:04:22,106 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:04:21,102 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:04:22,106 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:04:21,102 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 28%|██████████████████████▋ | 250/892 [24:28<30:50, 2.88s/it]g-point operations will not be computed-03 04:04:21,102 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 28%|██████████████████████▋ | 250/892 [24:28<30:50, 2.88s/it]g-point operations will not be computed-03 04:04:21,102 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 28%|██████████████████████▋ | 250/892 [24:28<30:50, 2.88s/it][WARNING|modeling_utils.py:388] 2022-03-03 04:04:25,135 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 28%|██████████████████████▋ | 250/892 [24:28<30:50, 2.88s/it][WARNING|modeling_utils.py:388] 2022-03-03 04:04:25,135 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:04:28,833 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:04:25,135 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 28%|██████████████████████▊ | 251/892 [24:35<45:52, 4.29s/it]g-point operations will not be computed-03 04:04:25,135 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 28%|██████████████████████▊ | 251/892 [24:35<45:52, 4.29s/it]g-point operations will not be computed-03 04:04:25,135 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 28%|██████████████████████▊ | 251/892 [24:35<45:52, 4.29s/it][WARNING|modeling_utils.py:388] 2022-03-03 04:04:32,655 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:04:36,225 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:04:32,655 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 28%|██████████████████████▉ | 252/892 [24:42<55:30, 5.20s/it]g-point operations will not be computed-03 04:04:32,655 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 28%|██████████████████████▉ | 252/892 [24:42<55:30, 5.20s/it]g-point operations will not be computed-03 04:04:32,655 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 28%|██████████████████████▉ | 252/892 [24:42<55:30, 5.20s/it][WARNING|modeling_utils.py:388] 2022-03-03 04:04:39,932 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 28%|██��███████████████████▉ | 252/892 [24:42<55:30, 5.20s/it][WARNING|modeling_utils.py:388] 2022-03-03 04:04:39,932 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 28%|██████████████████████▉ | 252/892 [24:42<55:30, 5.20s/it][WARNING|modeling_utils.py:388] 2022-03-03 04:04:39,932 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 28%|██████████████████████▍ | 253/892 [24:50<1:01:55, 5.81s/it][WARNING|modeling_utils.py:388] 2022-03-03 04:04:39,932 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 28%|██████████████████████▍ | 253/892 [24:50<1:01:55, 5.81s/it][WARNING|modeling_utils.py:388] 2022-03-03 04:04:39,932 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.0797, 'learning_rate': 0.0005020000000000001, 'epoch': 0.28} +[WARNING|modeling_utils.py:388] 2022-03-03 04:04:50,594 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:04:39,932 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 28%|██████████████████████▍ | 254/892 [24:57<1:05:56, 6.20s/it]g-point operations will not be computed-03 04:04:39,932 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 28%|██████████████████████▍ | 254/892 [24:57<1:05:56, 6.20s/it]g-point operations will not be computed-03 04:04:39,932 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.8901, 'learning_rate': 0.000504, 'epoch': 0.28} + 28%|██████████████████████▍ | 254/892 [24:57<1:05:56, 6.20s/it]g-point operations will not be computed-03 04:04:39,932 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 28%|██████████████████████▍ | 254/892 [24:57<1:05:56, 6.20s/it]g-point operations will not be computed-03 04:04:39,932 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 28%|██████████████████████▍ | 254/892 [24:57<1:05:56, 6.20s/it]g-point operations will not be computed-03 04:04:39,932 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 29%|██████████████████████▌ | 255/892 [25:04<1:08:40, 6.47s/it]g-point operations will not be computed-03 04:04:39,932 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:05:03,048 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:04:39,932 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:05:03,048 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:04:39,932 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:05:03,048 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:04:39,932 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 29%|██████████████████████▋ | 256/892 [25:11<1:10:31, 6.65s/it]g-point operations will not be computed-03 04:04:39,932 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 29%|██████████████████████▋ | 256/892 [25:11<1:10:31, 6.65s/it]g-point operations will not be computed-03 04:04:39,932 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 29%|██████████████████████▋ | 256/892 [25:11<1:10:31, 6.65s/it]g-point operations will not be computed-03 04:04:39,932 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:05:13,557 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:04:39,932 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:05:13,557 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:04:39,932 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.1246, 'learning_rate': 0.00051, 'epoch': 0.29} +[WARNING|modeling_utils.py:388] 2022-03-03 04:05:13,557 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:04:39,932 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:05:13,557 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:04:39,932 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:05:13,557 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:04:39,932 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 29%|██████████████████████▊ | 258/892 [25:25<1:12:17, 6.84s/it]g-point operations will not be computed-03 04:04:39,932 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 29%|██████████████████████▊ | 258/892 [25:25<1:12:17, 6.84s/it]g-point operations will not be computed-03 04:04:39,932 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:05:25,820 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:04:39,932 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 29%|██████████████████████▉ | 259/892 [25:32<1:12:33, 6.88s/it]g-point operations will not be computed-03 04:04:39,932 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 29%|██████████████████████▉ | 259/892 [25:32<1:12:33, 6.88s/it]g-point operations will not be computed-03 04:04:39,932 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.8121, 'learning_rate': 0.000514, 'epoch': 0.29} + 29%|██████████████████████▉ | 259/892 [25:32<1:12:33, 6.88s/it]g-point operations will not be computed-03 04:04:39,932 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 29%|██████████████████████▉ | 259/892 [25:32<1:12:33, 6.88s/it]g-point operations will not be computed-03 04:04:39,932 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 29%|██████████████████████▉ | 259/892 [25:32<1:12:33, 6.88s/it]g-point operations will not be computed-03 04:04:39,932 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 29%|███████████████████████ | 260/892 [25:39<1:12:47, 6.91s/it]g-point operations will not be computed-03 04:04:39,932 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:05:38,111 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:04:39,932 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:05:38,111 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:04:39,932 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 29%|███████████████████████ | 261/892 [25:46<1:12:52, 6.93s/it]g-point operations will not be computed-03 04:04:39,932 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 29%|███████████████████████ | 261/892 [25:46<1:12:52, 6.93s/it]g-point operations will not be computed-03 04:04:39,932 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.8734, 'learning_rate': 0.000518, 'epoch': 0.29} +[WARNING|modeling_utils.py:388] 2022-03-03 04:05:46,641 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:04:39,932 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 29%|███████████████████████▏ | 262/892 [25:53<1:12:21, 6.89s/it]g-point operations will not be computed-03 04:04:39,932 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 29%|███████████████████████▏ | 262/892 [25:53<1:12:21, 6.89s/it]g-point operations will not be computed-03 04:04:39,932 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.9371, 'learning_rate': 0.0005200000000000001, 'epoch': 0.29} + 29%|███████████████████████▏ | 262/892 [25:53<1:12:21, 6.89s/it]g-point operations will not be computed-03 04:04:39,932 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 29%|███████████████████████▏ | 262/892 [25:53<1:12:21, 6.89s/it]g-point operations will not be computed-03 04:04:39,932 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 29%|███████████████████████▏ | 262/892 [25:53<1:12:21, 6.89s/it]g-point operations will not be computed-03 04:04:39,932 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 29%|███████████████████████▎ | 263/892 [26:00<1:11:58, 6.87s/it][WARNING|modeling_utils.py:388] 2022-03-03 04:05:56,898 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 29%|███████████████████████▎ | 263/892 [26:00<1:11:58, 6.87s/it][WARNING|modeling_utils.py:388] 2022-03-03 04:05:56,898 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 29%|███████████████████████▎ | 263/892 [26:00<1:11:58, 6.87s/it][WARNING|modeling_utils.py:388] 2022-03-03 04:05:56,898 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 30%|███████████████████████▍ | 264/892 [26:06<1:11:29, 6.83s/it][WARNING|modeling_utils.py:388] 2022-03-03 04:05:56,898 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 30%|███████████████████████▍ | 264/892 [26:06<1:11:29, 6.83s/it][WARNING|modeling_utils.py:388] 2022-03-03 04:05:56,898 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.8513, 'learning_rate': 0.000524, 'epoch': 0.3} + 30%|███████████████████████▍ | 264/892 [26:06<1:11:29, 6.83s/it][WARNING|modeling_utils.py:388] 2022-03-03 04:05:56,898 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:06:08,664 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:05:56,898 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:06:08,664 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:05:56,898 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.242, 'learning_rate': 0.000526, 'epoch': 0.3} +[WARNING|modeling_utils.py:388] 2022-03-03 04:06:08,664 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:05:56,898 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:06:15,424 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:05:56,898 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:06:15,424 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:05:56,898 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.0909, 'learning_rate': 0.000528, 'epoch': 0.3} +[WARNING|modeling_utils.py:388] 2022-03-03 04:06:15,424 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:05:56,898 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:06:15,424 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:05:56,898 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 30%|███████████████████████▋ | 267/892 [26:27<1:10:29, 6.77s/it]g-point operations will not be computed-03 04:05:56,898 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 30%|███████████████████████▋ | 267/892 [26:27<1:10:29, 6.77s/it]g-point operations will not be computed-03 04:05:56,898 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:06:25,495 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:05:56,898 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:06:25,495 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:05:56,898 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 30%|███████████████████████▋ | 268/892 [26:33<1:10:02, 6.74s/it]g-point operations will not be computed-03 04:05:56,898 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 30%|███████████████████████▋ | 268/892 [26:33<1:10:02, 6.74s/it]g-point operations will not be computed-03 04:05:56,898 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.2137, 'learning_rate': 0.000532, 'epoch': 0.3} + 30%|███████████████████████▋ | 268/892 [26:33<1:10:02, 6.74s/it]g-point operations will not be computed-03 04:05:56,898 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:06:35,387 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:05:56,898 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:06:35,387 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:05:56,898 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.7544, 'learning_rate': 0.0005340000000000001, 'epoch': 0.3} +[WARNING|modeling_utils.py:388] 2022-03-03 04:06:35,387 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:05:56,898 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:06:42,020 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:05:56,898 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:06:42,020 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:05:56,898 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.0531, 'learning_rate': 0.000536, 'epoch': 0.3} +[WARNING|modeling_utils.py:388] 2022-03-03 04:06:42,020 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:05:56,898 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:06:42,020 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:05:56,898 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:06:42,020 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:05:56,898 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 30%|████████████████████████ | 271/892 [26:53<1:08:54, 6.66s/it][WARNING|modeling_utils.py:388] 2022-03-03 04:06:50,352 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 30%|████████████████████████ | 271/892 [26:53<1:08:54, 6.66s/it][WARNING|modeling_utils.py:388] 2022-03-03 04:06:50,352 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 30%|████████████████████████ | 271/892 [26:53<1:08:54, 6.66s/it][WARNING|modeling_utils.py:388] 2022-03-03 04:06:50,352 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 30%|████████████████████████ | 272/892 [27:00<1:08:23, 6.62s/it][WARNING|modeling_utils.py:388] 2022-03-03 04:06:50,352 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 30%|████████████████████████ | 272/892 [27:00<1:08:23, 6.62s/it][WARNING|modeling_utils.py:388] 2022-03-03 04:06:50,352 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.9672, 'learning_rate': 0.00054, 'epoch': 0.3} +[WARNING|modeling_utils.py:388] 2022-03-03 04:07:00,018 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:06:50,352 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 31%|████████████████████████▏ | 273/892 [27:06<1:07:41, 6.56s/it]g-point operations will not be computed-03 04:06:50,352 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 31%|████████████████████████▏ | 273/892 [27:06<1:07:41, 6.56s/it]g-point operations will not be computed-03 04:06:50,352 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.1118, 'learning_rate': 0.0005420000000000001, 'epoch': 0.31} + 31%|████████████████████████▏ | 273/892 [27:06<1:07:41, 6.56s/it]g-point operations will not be computed-03 04:06:50,352 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:07:08,046 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:06:50,352 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:07:08,046 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:06:50,352 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.766, 'learning_rate': 0.0005440000000000001, 'epoch': 0.31} +[WARNING|modeling_utils.py:388] 2022-03-03 04:07:08,046 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:06:50,352 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:07:14,909 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:06:50,352 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:07:14,909 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:06:50,352 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.2889, 'learning_rate': 0.000546, 'epoch': 0.31} +[WARNING|modeling_utils.py:388] 2022-03-03 04:07:14,909 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:06:50,352 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:07:14,909 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:06:50,352 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:07:14,909 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:06:50,352 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 31%|████████████████████████▍ | 276/892 [27:26<1:07:15, 6.55s/it][WARNING|modeling_utils.py:388] 2022-03-03 04:07:22,958 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 31%|████████████████████████▍ | 276/892 [27:26<1:07:15, 6.55s/it][WARNING|modeling_utils.py:388] 2022-03-03 04:07:22,958 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 31%|████████████████████████▍ | 276/892 [27:26<1:07:15, 6.55s/it][WARNING|modeling_utils.py:388] 2022-03-03 04:07:22,958 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 31%|████████████████████████▍ | 276/892 [27:26<1:07:15, 6.55s/it][WARNING|modeling_utils.py:388] 2022-03-03 04:07:22,958 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 31%|████████████████████████▌ | 277/892 [27:32<1:06:20, 6.47s/it][WARNING|modeling_utils.py:388] 2022-03-03 04:07:29,208 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 31%|████████████████████████▌ | 277/892 [27:32<1:06:20, 6.47s/it][WARNING|modeling_utils.py:388] 2022-03-03 04:07:29,208 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 31%|████████████████████████▌ | 277/892 [27:32<1:06:20, 6.47s/it][WARNING|modeling_utils.py:388] 2022-03-03 04:07:29,208 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 31%|████████████████████████▌ | 277/892 [27:32<1:06:20, 6.47s/it][WARNING|modeling_utils.py:388] 2022-03-03 04:07:29,208 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 31%|████████████████████████▌ | 278/892 [27:38<1:05:25, 6.39s/it][WARNING|modeling_utils.py:388] 2022-03-03 04:07:35,376 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 31%|████████████████████████▌ | 278/892 [27:38<1:05:25, 6.39s/it][WARNING|modeling_utils.py:388] 2022-03-03 04:07:35,376 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 31%|███████���████████████████▌ | 278/892 [27:38<1:05:25, 6.39s/it][WARNING|modeling_utils.py:388] 2022-03-03 04:07:35,376 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 31%|████████████████████████▌ | 278/892 [27:38<1:05:25, 6.39s/it][WARNING|modeling_utils.py:388] 2022-03-03 04:07:35,376 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 31%|████████████████████████▋ | 279/892 [27:44<1:04:37, 6.32s/it][WARNING|modeling_utils.py:388] 2022-03-03 04:07:41,497 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 31%|████████████████████████▋ | 279/892 [27:44<1:04:37, 6.32s/it][WARNING|modeling_utils.py:388] 2022-03-03 04:07:41,497 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 31%|████████████████████████▋ | 279/892 [27:44<1:04:37, 6.32s/it][WARNING|modeling_utils.py:388] 2022-03-03 04:07:41,497 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 31%|████████████████████████▋ | 279/892 [27:44<1:04:37, 6.32s/it][WARNING|modeling_utils.py:388] 2022-03-03 04:07:41,497 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 31%|████████████████████████▊ | 280/892 [27:50<1:03:46, 6.25s/it][WARNING|modeling_utils.py:388] 2022-03-03 04:07:47,600 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 31%|████████████████████████▊ | 280/892 [27:50<1:03:46, 6.25s/it][WARNING|modeling_utils.py:388] 2022-03-03 04:07:47,600 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:07:52,059 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:07:47,600 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:07:52,059 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:07:47,600 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.7573, 'learning_rate': 0.000558, 'epoch': 0.32} +[WARNING|modeling_utils.py:388] 2022-03-03 04:07:52,059 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:07:47,600 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:07:58,084 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:07:47,600 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:07:58,084 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:07:47,600 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.7975, 'learning_rate': 0.0005600000000000001, 'epoch': 0.32} +[WARNING|modeling_utils.py:388] 2022-03-03 04:07:58,084 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:07:47,600 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:07:58,084 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:07:47,600 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:08:03,916 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:07:47,600 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:08:03,916 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:07:47,600 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:08:03,916 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:07:47,600 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:08:03,916 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:07:47,600 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:08:09,572 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:07:47,600 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:08:09,572 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:07:47,600 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:08:13,815 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:07:47,600 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:08:13,815 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:07:47,600 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 32%|█████████████████████████▉ | 285/892 [28:20<59:03, 5.84s/it]g-point operations will not be computed-03 04:07:47,600 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:08:18,011 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:07:47,600 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:08:18,011 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:07:47,600 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:08:18,011 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:07:47,600 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 32%|█████████████████████████▉ | 286/892 [28:25<57:58, 5.74s/it][WARNING|modeling_utils.py:388] 2022-03-03 04:08:22,135 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 32%|█████████████████████████▉ | 286/892 [28:25<57:58, 5.74s/it][WARNING|modeling_utils.py:388] 2022-03-03 04:08:22,135 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 32%|█████████████████████████▉ | 286/892 [28:25<57:58, 5.74s/it][WARNING|modeling_utils.py:388] 2022-03-03 04:08:22,135 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:08:26,057 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:08:22,135 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:08:28,768 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:08:22,135 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:08:28,768 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:08:22,135 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:08:28,768 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:08:22,135 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 32%|██████████████████████████▏ | 288/892 [28:36<55:26, 5.51s/it][WARNING|modeling_utils.py:388] 2022-03-03 04:08:32,634 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 32%|██████████████████████████▏ | 288/892 [28:36<55:26, 5.51s/it][WARNING|modeling_utils.py:388] 2022-03-03 04:08:32,634 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 32%|██████████████████████████▏ | 288/892 [28:36<55:26, 5.51s/it][WARNING|modeling_utils.py:388] 2022-03-03 04:08:32,634 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:08:36,319 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:08:32,634 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:08:38,857 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:08:32,634 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:08:41,189 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:08:32,634 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:08:41,189 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:08:32,634 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.1764, 'learning_rate': 0.000576, 'epoch': 0.33} +[WARNING|modeling_utils.py:388] 2022-03-03 04:08:44,711 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:08:32,634 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:08:44,711 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:08:32,634 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 33%|██████████████████████████▍ | 291/892 [28:50<50:31, 5.04s/it]g-point operations will not be computed-03 04:08:32,634 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:08:48,062 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:08:32,634 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:08:48,062 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:08:32,634 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:08:50,144 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:08:32,634 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:08:52,282 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:08:32,634 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:08:52,282 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:08:32,634 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:08:54,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:08:32,634 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:08:56,204 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:08:32,634 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:08:56,204 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:08:32,634 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:08:57,988 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:08:32,634 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:08:59,835 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:08:32,634 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:08:59,835 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:08:32,634 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:09:03,144 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:08:32,634 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:09:03,144 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:08:32,634 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:09:04,649 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:08:32,634 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:09:06,145 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:08:32,634 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:09:06,145 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:08:32,634 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:09:08,922 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:08:32,634 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:09:08,922 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:08:32,634 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:09:11,262 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:08:32,634 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:09:11,262 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:08:32,634 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:09:13,450 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:08:32,634 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:09:14,939 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:08:32,634 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:09:14,939 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:08:32,634 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.4224, 'learning_rate': 0.000596, 'epoch': 0.34} +[WARNING|modeling_utils.py:388] 2022-03-03 04:09:18,905 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:08:32,634 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:09:18,905 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:08:32,634 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:09:18,905 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:08:32,634 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:09:22,669 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:08:32,634 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:09:22,669 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:08:32,634 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:09:26,419 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:08:32,634 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:09:26,419 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:08:32,634 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:09:26,419 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:08:32,634 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:09:29,990 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:08:32,634 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:09:33,734 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:08:32,634 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:09:33,734 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:08:32,634 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 34%|███████████████████████████▌ | 303/892 [29:42<57:41, 5.88s/it]g-point operations will not be computed-03 04:08:32,634 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 34%|███████████████████████████▌ | 303/892 [29:42<57:41, 5.88s/it]g-point operations will not be computed-03 04:08:32,634 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.911, 'learning_rate': 0.000602, 'epoch': 0.34} + 34%|███████████████████████████▌ | 303/892 [29:42<57:41, 5.88s/it]g-point operations will not be computed-03 04:08:32,634 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 34%|███████████████████████████▌ | 303/892 [29:42<57:41, 5.88s/it]g-point operations will not be computed-03 04:08:32,634 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 34%|███████████████████████████▌ | 303/892 [29:42<57:41, 5.88s/it]g-point operations will not be computed-03 04:08:32,634 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 34%|██████████████████████████▉ | 304/892 [29:49<1:01:40, 6.29s/it]g-point operations will not be computed-03 04:08:32,634 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 34%|██████████████████████████▉ | 304/892 [29:49<1:01:40, 6.29s/it]g-point operations will not be computed-03 04:08:32,634 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:09:50,050 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:08:32,634 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 34%|███████████████████████████ | 305/892 [29:56<1:03:53, 6.53s/it]g-point operations will not be computed-03 04:08:32,634 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 34%|███████████████████████████ | 305/892 [29:56<1:03:53, 6.53s/it]g-point operations will not be computed-03 04:08:32,634 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.0028, 'learning_rate': 0.000606, 'epoch': 0.34} + 34%|███████████████████████████ | 305/892 [29:56<1:03:53, 6.53s/it]g-point operations will not be computed-03 04:08:32,634 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 34%|███████████████████████████ | 305/892 [29:56<1:03:53, 6.53s/it]g-point operations will not be computed-03 04:08:32,634 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 34%|███████████████████████████ | 305/892 [29:56<1:03:53, 6.53s/it]g-point operations will not be computed-03 04:08:32,634 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 34%|███████████████████████████ | 306/892 [30:03<1:05:17, 6.69s/it]g-point operations will not be computed-03 04:08:32,634 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 34%|███████████████████████████ | 306/892 [30:03<1:05:17, 6.69s/it]g-point operations will not be computed-03 04:08:32,634 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:10:04,144 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:08:32,634 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 34%|███████████████████████████▏ | 307/892 [30:10<1:06:21, 6.81s/it]g-point operations will not be computed-03 04:08:32,634 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 34%|███████████████████████████▏ | 307/892 [30:10<1:06:21, 6.81s/it]g-point operations will not be computed-03 04:08:32,634 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.8418, 'learning_rate': 0.00061, 'epoch': 0.34} + 34%|███████████████████████████▏ | 307/892 [30:10<1:06:21, 6.81s/it]g-point operations will not be computed-03 04:08:32,634 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:10:12,944 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:08:32,634 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:10:12,944 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:08:32,634 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.2496, 'learning_rate': 0.000612, 'epoch': 0.35} +[WARNING|modeling_utils.py:388] 2022-03-03 04:10:12,944 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:08:32,634 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:10:12,944 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:08:32,634 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:10:12,944 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:08:32,634 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 35%|███████████████████████████▎ | 309/892 [30:24<1:07:08, 6.91s/it]g-point operations will not be computed-03 04:08:32,634 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 35%|███████████████████████████▎ | 309/892 [30:24<1:07:08, 6.91s/it]g-point operations will not be computed-03 04:08:32,634 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:10:25,158 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:08:32,634 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 35%|███████████████████████████▍ | 310/892 [30:31<1:07:14, 6.93s/it]g-point operations will not be computed-03 04:08:32,634 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 35%|███████████████████████████▍ | 310/892 [30:31<1:07:14, 6.93s/it]g-point operations will not be computed-03 04:08:32,634 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.1208, 'learning_rate': 0.000616, 'epoch': 0.35} + 35%|███████████████████████████▍ | 310/892 [30:31<1:07:14, 6.93s/it]g-point operations will not be computed-03 04:08:32,634 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 35%|███████████████████████████▍ | 310/892 [30:31<1:07:14, 6.93s/it]g-point operations will not be computed-03 04:08:32,634 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 35%|███████████████████████████▍ | 310/892 [30:31<1:07:14, 6.93s/it]g-point operations will not be computed-03 04:08:32,634 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 35%|███████████████████████████▌ | 311/892 [30:38<1:07:11, 6.94s/it][WARNING|modeling_utils.py:388] 2022-03-03 04:10:35,636 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 35%|███████████████████████████▌ | 311/892 [30:38<1:07:11, 6.94s/it][WARNING|modeling_utils.py:388] 2022-03-03 04:10:35,636 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 35%|███████████████████████████▌ | 311/892 [30:38<1:07:11, 6.94s/it][WARNING|modeling_utils.py:388] 2022-03-03 04:10:35,636 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 35%|███████████████████████████▋ | 312/892 [30:45<1:06:40, 6.90s/it][WARNING|modeling_utils.py:388] 2022-03-03 04:10:35,636 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 35%|███████████████████████████▋ | 312/892 [30:45<1:06:40, 6.90s/it][WARNING|modeling_utils.py:388] 2022-03-03 04:10:35,636 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.9914, 'learning_rate': 0.00062, 'epoch': 0.35} +[WARNING|modeling_utils.py:388] 2022-03-03 04:10:45,862 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:10:35,636 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:10:45,862 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:10:35,636 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:10:45,862 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:10:35,636 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.042, 'learning_rate': 0.000622, 'epoch': 0.35} +[WARNING|modeling_utils.py:388] 2022-03-03 04:10:45,862 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:10:35,636 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:10:45,862 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:10:35,636 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:10:45,862 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:10:35,636 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 35%|███████████████████████████▊ | 314/892 [30:59<1:05:57, 6.85s/it]g-point operations will not be computed-03 04:10:35,636 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:10:57,702 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:10:35,636 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:10:57,702 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:10:35,636 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 35%|███████████████████████████▉ | 315/892 [31:06<1:05:42, 6.83s/it]g-point operations will not be computed-03 04:10:35,636 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 35%|███████████████████████████▉ | 315/892 [31:06<1:05:42, 6.83s/it]g-point operations will not be computed-03 04:10:35,636 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.8236, 'learning_rate': 0.000626, 'epoch': 0.35} + 35%|███████████████████████████▉ | 315/892 [31:06<1:05:42, 6.83s/it]g-point operations will not be computed-03 04:10:35,636 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:11:07,826 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:10:35,636 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:11:07,826 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:10:35,636 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.1062, 'learning_rate': 0.000628, 'epoch': 0.35} +[WARNING|modeling_utils.py:388] 2022-03-03 04:11:07,826 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:10:35,636 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:11:14,500 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:10:35,636 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:11:14,500 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:10:35,636 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.823, 'learning_rate': 0.00063, 'epoch': 0.36} +[WARNING|modeling_utils.py:388] 2022-03-03 04:11:14,500 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:10:35,636 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:11:14,500 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:10:35,636 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:11:14,500 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:10:35,636 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 36%|████████████████████████████▏ | 318/892 [31:26<1:04:20, 6.72s/it]g-point operations will not be computed-03 04:10:35,636 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 36%|████████████████████████████▏ | 318/892 [31:26<1:04:20, 6.72s/it]g-point operations will not be computed-03 04:10:35,636 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:11:26,146 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:10:35,636 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 36%|████████████████████████████▎ | 319/892 [31:32<1:04:00, 6.70s/it]g-point operations will not be computed-03 04:10:35,636 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 36%|████████████████████████████▎ | 319/892 [31:32<1:04:00, 6.70s/it]g-point operations will not be computed-03 04:10:35,636 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.8754, 'learning_rate': 0.000634, 'epoch': 0.36} + 36%|████████████████████████████▎ | 319/892 [31:32<1:04:00, 6.70s/it]g-point operations will not be computed-03 04:10:35,636 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:11:34,420 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:10:35,636 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:11:34,420 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:10:35,636 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.8727, 'learning_rate': 0.0006360000000000001, 'epoch': 0.36} +[WARNING|modeling_utils.py:388] 2022-03-03 04:11:34,420 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:10:35,636 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:11:40,961 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:10:35,636 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:11:40,961 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:10:35,636 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.2652, 'learning_rate': 0.000638, 'epoch': 0.36} +[WARNING|modeling_utils.py:388] 2022-03-03 04:11:40,961 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:10:35,636 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:11:40,961 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:10:35,636 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 36%|████████████████████████████▌ | 322/892 [31:52<1:02:47, 6.61s/it]g-point operations will not be computed-03 04:10:35,636 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 36%|████████████████████████████▌ | 322/892 [31:52<1:02:47, 6.61s/it]g-point operations will not be computed-03 04:10:35,636 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:11:50,790 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:10:35,636 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:11:50,790 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:10:35,636 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 36%|████████████████████████████▌ | 323/892 [31:58<1:02:16, 6.57s/it]g-point operations will not be computed-03 04:10:35,636 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 36%|████████████████████████████▌ | 323/892 [31:58<1:02:16, 6.57s/it]g-point operations will not be computed-03 04:10:35,636 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:11:57,247 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:10:35,636 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:11:57,247 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:10:35,636 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 36%|████████████████████████████▋ | 324/892 [32:05<1:01:48, 6.53s/it]g-point operations will not be computed-03 04:10:35,636 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 36%|████████████████████████████▋ | 324/892 [32:05<1:01:48, 6.53s/it]g-point operations will not be computed-03 04:10:35,636 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:12:03,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:10:35,636 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:12:03,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:10:35,636 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 36%|████████████████████████████▊ | 325/892 [32:12<1:02:28, 6.61s/it]g-point operations will not be computed-03 04:10:35,636 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 36%|████████████████████████████▊ | 325/892 [32:12<1:02:28, 6.61s/it]g-point operations will not be computed-03 04:10:35,636 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.1065, 'learning_rate': 0.000646, 'epoch': 0.36} + 36%|████████████████████████████▊ | 325/892 [32:12<1:02:28, 6.61s/it]g-point operations will not be computed-03 04:10:35,636 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:12:13,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:10:35,636 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:12:13,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:10:35,636 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.0236, 'learning_rate': 0.000648, 'epoch': 0.37} +[WARNING|modeling_utils.py:388] 2022-03-03 04:12:13,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:10:35,636 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:12:19,811 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:10:35,636 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:12:19,811 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:10:35,636 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.7007, 'learning_rate': 0.0006500000000000001, 'epoch': 0.37} +[WARNING|modeling_utils.py:388] 2022-03-03 04:12:19,811 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:10:35,636 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:12:25,993 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:10:35,636 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:12:25,993 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:10:35,636 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.9706, 'learning_rate': 0.000652, 'epoch': 0.37} +[WARNING|modeling_utils.py:388] 2022-03-03 04:12:25,993 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:10:35,636 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:12:25,993 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:10:35,636 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:12:25,993 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:10:35,636 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 37%|█████████████████████████████▉ | 329/892 [32:37<59:17, 6.32s/it][WARNING|modeling_utils.py:388] 2022-03-03 04:12:33,814 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 37%|█████████████████████████████▉ | 329/892 [32:37<59:17, 6.32s/it][WARNING|modeling_utils.py:388] 2022-03-03 04:12:33,814 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 37%|█████████████████████████████▉ | 329/892 [32:37<59:17, 6.32s/it][WARNING|modeling_utils.py:388] 2022-03-03 04:12:33,814 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.3813, 'learning_rate': 0.000656, 'epoch': 0.37} + 37%|█████████████████████████████▉ | 330/892 [32:43<58:35, 6.26s/it][WARNING|modeling_utils.py:388] 2022-03-03 04:12:39,883 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 37%|█████████████████████████████▉ | 330/892 [32:43<58:35, 6.26s/it][WARNING|modeling_utils.py:388] 2022-03-03 04:12:39,883 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 37%|█████████████████████████████▉ | 330/892 [32:43<58:35, 6.26s/it][WARNING|modeling_utils.py:388] 2022-03-03 04:12:39,883 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:12:44,275 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:12:39,883 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:12:44,275 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:12:39,883 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:12:44,275 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:12:39,883 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:12:50,226 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:12:39,883 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:12:50,226 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:12:39,883 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.8357, 'learning_rate': 0.00066, 'epoch': 0.37} +[WARNING|modeling_utils.py:388] 2022-03-03 04:12:50,226 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:12:39,883 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:12:50,226 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:12:39,883 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:12:56,158 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:12:39,883 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:12:56,158 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:12:39,883 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:13:00,534 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:12:39,883 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:13:00,534 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:12:39,883 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 37%|██████████████████████████████▎ | 334/892 [33:06<55:29, 5.97s/it]g-point operations will not be computed-03 04:12:39,883 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:13:04,795 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:12:39,883 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:13:04,795 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:12:39,883 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:13:04,795 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:12:39,883 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 38%|██████████████████████████████▍ | 335/892 [33:12<54:35, 5.88s/it]g-point operations will not be computed-03 04:12:39,883 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:13:10,469 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:12:39,883 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:13:10,469 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:12:39,883 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:13:10,469 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:12:39,883 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 38%|██████████████████████████████▌ | 336/892 [33:18<53:45, 5.80s/it][WARNING|modeling_utils.py:388] 2022-03-03 04:13:14,668 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 38%|██████████████████████████████▌ | 336/892 [33:18<53:45, 5.80s/it][WARNING|modeling_utils.py:388] 2022-03-03 04:13:14,668 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 38%|██████████████████████████████▌ | 336/892 [33:18<53:45, 5.80s/it][WARNING|modeling_utils.py:388] 2022-03-03 04:13:14,668 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:13:18,656 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:13:14,668 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:13:21,387 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:13:14,668 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:13:21,387 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:13:14,668 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:13:21,387 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:13:14,668 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 38%|██████████████████████████████▋ | 338/892 [33:28<51:27, 5.57s/it][WARNING|modeling_utils.py:388] 2022-03-03 04:13:25,342 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 38%|██████████████████████████████▋ | 338/892 [33:28<51:27, 5.57s/it][WARNING|modeling_utils.py:388] 2022-03-03 04:13:25,342 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:13:29,122 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:13:25,342 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:13:29,122 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:13:25,342 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:13:31,649 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:13:25,342 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:13:31,649 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:13:25,342 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:13:31,649 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:13:25,342 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 38%|██████████████████████████████▊ | 340/892 [33:39<48:43, 5.30s/it][WARNING|modeling_utils.py:388] 2022-03-03 04:13:35,401 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:13:37,697 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:13:35,401 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 38%|██████████████████████████████▉ | 341/892 [33:43<47:10, 5.14s/it]g-point operations will not be computed-03 04:13:35,401 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 38%|██████████████████████████████▉ | 341/892 [33:43<47:10, 5.14s/it]g-point operations will not be computed-03 04:13:35,401 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:13:41,110 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:13:35,401 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:13:41,110 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:13:35,401 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:13:43,250 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:13:35,401 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:13:45,377 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:13:35,401 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:13:47,330 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:13:35,401 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:13:47,330 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:13:35,401 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:13:49,344 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:13:35,401 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:13:51,165 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:13:35,401 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:13:51,165 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:13:35,401 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:13:53,005 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:13:35,401 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:13:53,005 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:13:35,401 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:13:54,673 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:13:35,401 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:13:57,897 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:13:35,401 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:13:57,897 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:13:35,401 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:13:59,460 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:13:35,401 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:13:59,460 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:13:35,401 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:14:02,203 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:13:35,401 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:14:03,410 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:13:35,401 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:14:03,410 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:13:35,401 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:14:05,733 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:13:35,401 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:14:05,733 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:13:35,401 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:14:08,343 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:13:35,401 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:14:08,343 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:13:35,401 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.1623, 'learning_rate': 0.000696, 'epoch': 0.39} +[WARNING|modeling_utils.py:388] 2022-03-03 04:14:12,316 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:13:35,401 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:14:12,316 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:13:35,401 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:14:15,987 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:13:35,401 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:14:15,987 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:13:35,401 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.7402, 'learning_rate': 0.0006979999999999999, 'epoch': 0.39} +[WARNING|modeling_utils.py:388] 2022-03-03 04:14:19,694 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:13:35,401 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:14:19,694 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:13:35,401 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:14:19,694 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:13:35,401 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:14:23,255 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:13:35,401 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:14:23,255 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:13:35,401 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:14:28,687 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:13:35,401 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 40%|████████████████████████████████ | 353/892 [34:35<52:06, 5.80s/it]g-point operations will not be computed-03 04:13:35,401 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 40%|████████████████████████████████ | 353/892 [34:35<52:06, 5.80s/it]g-point operations will not be computed-03 04:13:35,401 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.1392, 'learning_rate': 0.0007019999999999999, 'epoch': 0.4} + 40%|████████████████████████████████ | 353/892 [34:35<52:06, 5.80s/it]g-point operations will not be computed-03 04:13:35,401 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 40%|████████████████████████████████ | 353/892 [34:35<52:06, 5.80s/it]g-point operations will not be computed-03 04:13:35,401 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 40%|████████████████████████████████ | 353/892 [34:35<52:06, 5.80s/it]g-point operations will not be computed-03 04:13:35,401 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 40%|████████████████████████████████▏ | 354/892 [34:42<55:39, 6.21s/it]g-point operations will not be computed-03 04:13:35,401 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 40%|████████████████████████████████▏ | 354/892 [34:42<55:39, 6.21s/it]g-point operations will not be computed-03 04:13:35,401 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:14:42,939 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:13:35,401 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 40%|████████████████████████████████▏ | 355/892 [34:49<57:49, 6.46s/it]g-point operations will not be computed-03 04:13:35,401 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 40%|████████████████████████████████▏ | 355/892 [34:49<57:49, 6.46s/it]g-point operations will not be computed-03 04:13:35,401 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.0127, 'learning_rate': 0.0007059999999999999, 'epoch': 0.4} + 40%|████████████████████████████████▏ | 355/892 [34:49<57:49, 6.46s/it]g-point operations will not be computed-03 04:13:35,401 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 40%|████████████████████████████████▏ | 355/892 [34:49<57:49, 6.46s/it]g-point operations will not be computed-03 04:13:35,401 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 40%|████████████████████████████████▏ | 355/892 [34:49<57:49, 6.46s/it]g-point operations will not be computed-03 04:13:35,401 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 40%|████████████████████████████████▎ | 356/892 [34:56<59:16, 6.64s/it]g-point operations will not be computed-03 04:13:35,401 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 40%|████████████████████████████████▎ | 356/892 [34:56<59:16, 6.64s/it]g-point operations will not be computed-03 04:13:35,401 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:14:56,996 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:13:35,401 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 40%|███████████████████████████████▌ | 357/892 [35:03<1:00:02, 6.73s/it]g-point operations will not be computed-03 04:13:35,401 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 40%|███████████████████████████████▌ | 357/892 [35:03<1:00:02, 6.73s/it]g-point operations will not be computed-03 04:13:35,401 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.3195, 'learning_rate': 0.00071, 'epoch': 0.4} + 40%|███████████████████████████████▌ | 357/892 [35:03<1:00:02, 6.73s/it]g-point operations will not be computed-03 04:13:35,401 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:15:05,708 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:13:35,401 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:15:05,708 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:13:35,401 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.2799, 'learning_rate': 0.000712, 'epoch': 0.4} +[WARNING|modeling_utils.py:388] 2022-03-03 04:15:09,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:13:35,401 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:15:09,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:13:35,401 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 40%|███████████████████████████████▊ | 359/892 [35:17<1:01:03, 6.87s/it]g-point operations will not be computed-03 04:13:35,401 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 40%|███████████████████████████████▊ | 359/892 [35:17<1:01:03, 6.87s/it]g-point operations will not be computed-03 04:13:35,401 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.2069, 'learning_rate': 0.000714, 'epoch': 0.4} + 40%|███████████████████████████████▊ | 359/892 [35:17<1:01:03, 6.87s/it]g-point operations will not be computed-03 04:13:35,401 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:15:19,589 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:13:35,401 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:15:19,589 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:13:35,401 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.1036, 'learning_rate': 0.000716, 'epoch': 0.4} +[WARNING|modeling_utils.py:388] 2022-03-03 04:15:19,589 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:13:35,401 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:15:19,589 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:13:35,401 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:15:19,589 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:13:35,401 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 40%|███████████████████████████████▉ | 361/892 [35:31<1:00:36, 6.85s/it][WARNING|modeling_utils.py:388] 2022-03-03 04:15:28,155 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 40%|█████████████████████████████���█▉ | 361/892 [35:31<1:00:36, 6.85s/it][WARNING|modeling_utils.py:388] 2022-03-03 04:15:28,155 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 40%|███████████████████████████████▉ | 361/892 [35:31<1:00:36, 6.85s/it][WARNING|modeling_utils.py:388] 2022-03-03 04:15:28,155 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 41%|████████████████████████████████ | 362/892 [35:38<1:00:17, 6.83s/it][WARNING|modeling_utils.py:388] 2022-03-03 04:15:28,155 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 41%|████████████████████████████████ | 362/892 [35:38<1:00:17, 6.83s/it][WARNING|modeling_utils.py:388] 2022-03-03 04:15:28,155 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.0837, 'learning_rate': 0.0007199999999999999, 'epoch': 0.41} + 41%|████████████████████████████████ | 362/892 [35:38<1:00:17, 6.83s/it][WARNING|modeling_utils.py:388] 2022-03-03 04:15:28,155 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:15:39,930 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:15:28,155 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:15:39,930 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:15:28,155 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.8481, 'learning_rate': 0.000722, 'epoch': 0.41} +[WARNING|modeling_utils.py:388] 2022-03-03 04:15:39,930 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:15:28,155 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:15:39,930 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:15:28,155 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:15:39,930 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:15:28,155 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 41%|█████████████████████████████████ | 364/892 [35:51<59:54, 6.81s/it]g-point operations will not be computed-03 04:15:28,155 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:15:50,129 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:15:28,155 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:15:50,129 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:15:28,155 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 41%|█████████████████████████████████▏ | 365/892 [35:58<59:30, 6.78s/it]g-point operations will not be computed-03 04:15:28,155 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 41%|█████████████████████████████████▏ | 365/892 [35:58<59:30, 6.78s/it]g-point operations will not be computed-03 04:15:28,155 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:15:56,817 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:15:28,155 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:15:56,817 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:15:28,155 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 41%|█████████████████████████████████▏ | 366/892 [36:05<59:06, 6.74s/it]g-point operations will not be computed-03 04:15:28,155 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 41%|█████████████████████████████████▏ | 366/892 [36:05<59:06, 6.74s/it]g-point operations will not be computed-03 04:15:28,155 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.2159, 'learning_rate': 0.000728, 'epoch': 0.41} + 41%|█████████████████████████████████▏ | 366/892 [36:05<59:06, 6.74s/it]g-point operations will not be computed-03 04:15:28,155 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:16:06,633 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:15:28,155 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:16:06,633 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:15:28,155 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.0045, 'learning_rate': 0.00073, 'epoch': 0.41} +[WARNING|modeling_utils.py:388] 2022-03-03 04:16:06,633 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:15:28,155 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:16:13,237 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:15:28,155 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:16:13,237 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:15:28,155 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:16:13,237 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:15:28,155 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.1269, 'learning_rate': 0.000732, 'epoch': 0.41} +[WARNING|modeling_utils.py:388] 2022-03-03 04:16:13,237 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:15:28,155 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 41%|█████████████████████████████████▌ | 369/892 [36:24<57:53, 6.64s/it]g-point operations will not be computed-03 04:15:28,155 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 41%|█████████████████████████████████▌ | 369/892 [36:24<57:53, 6.64s/it]g-point operations will not be computed-03 04:15:28,155 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:16:23,166 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:15:28,155 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:16:23,166 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:15:28,155 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 41%|█████████████████████████████████▌ | 370/892 [36:31<57:34, 6.62s/it]g-point operations will not be computed-03 04:15:28,155 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 41%|███████████████████████████████���█▌ | 370/892 [36:31<57:34, 6.62s/it]g-point operations will not be computed-03 04:15:28,155 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.2436, 'learning_rate': 0.000736, 'epoch': 0.41} +[WARNING|modeling_utils.py:388] 2022-03-03 04:16:31,301 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:15:28,155 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 42%|█████████████████████████████████▋ | 371/892 [36:37<57:10, 6.58s/it]g-point operations will not be computed-03 04:15:28,155 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 42%|█████████████████████████████████▋ | 371/892 [36:37<57:10, 6.58s/it]g-point operations will not be computed-03 04:15:28,155 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.9266, 'learning_rate': 0.000738, 'epoch': 0.42} +[WARNING|modeling_utils.py:388] 2022-03-03 04:16:37,762 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:15:28,155 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 42%|█████████████████████████████████▊ | 372/892 [36:44<56:58, 6.57s/it]g-point operations will not be computed-03 04:15:28,155 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 42%|█████████████████████████████████▊ | 372/892 [36:44<56:58, 6.57s/it]g-point operations will not be computed-03 04:15:28,155 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.1939, 'learning_rate': 0.00074, 'epoch': 0.42} + 42%|█████████████████████████████████▊ | 372/892 [36:44<56:58, 6.57s/it]g-point operations will not be computed-03 04:15:28,155 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:16:45,914 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:15:28,155 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:16:45,914 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:15:28,155 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.1638, 'learning_rate': 0.000742, 'epoch': 0.42} +[WARNING|modeling_utils.py:388] 2022-03-03 04:16:45,914 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:15:28,155 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:16:45,914 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:15:28,155 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 42%|█████████████████████████████████▉ | 374/892 [36:57<55:50, 6.47s/it][WARNING|modeling_utils.py:388] 2022-03-03 04:16:53,962 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 42%|█████████████████████████████████▉ | 374/892 [36:57<55:50, 6.47s/it][WARNING|modeling_utils.py:388] 2022-03-03 04:16:53,962 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.5325, 'learning_rate': 0.000744, 'epoch': 0.42} + 42%|█████████████████████████████████▉ | 374/892 [36:57<55:50, 6.47s/it][WARNING|modeling_utils.py:388] 2022-03-03 04:16:53,962 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 42%|█████████████████████████████���████ | 375/892 [37:04<56:40, 6.58s/it][WARNING|modeling_utils.py:388] 2022-03-03 04:16:53,962 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 42%|██████████████████████████████████ | 375/892 [37:04<56:40, 6.58s/it][WARNING|modeling_utils.py:388] 2022-03-03 04:16:53,962 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.8427, 'learning_rate': 0.000746, 'epoch': 0.42} +[WARNING|modeling_utils.py:388] 2022-03-03 04:17:03,847 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:16:53,962 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 42%|██████████████████████████████████▏ | 376/892 [37:10<56:03, 6.52s/it]g-point operations will not be computed-03 04:16:53,962 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 42%|██████████████████████████████████▏ | 376/892 [37:10<56:03, 6.52s/it]g-point operations will not be computed-03 04:16:53,962 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.1271, 'learning_rate': 0.000748, 'epoch': 0.42} + 42%|██████████████████████████████████▏ | 376/892 [37:10<56:03, 6.52s/it]g-point operations will not be computed-03 04:16:53,962 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 42%|██████████████████████████████████▏ | 376/892 [37:10<56:03, 6.52s/it]g-point operations will not be computed-03 04:16:53,962 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:17:11,586 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:16:53,962 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:17:11,586 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:16:53,962 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:17:16,218 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:16:53,962 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:17:16,218 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:16:53,962 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 42%|██████████████████████████████████▎ | 378/892 [37:22<54:08, 6.32s/it]g-point operations will not be computed-03 04:16:53,962 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 42%|██████████████████████████████████▎ | 378/892 [37:22<54:08, 6.32s/it]g-point operations will not be computed-03 04:16:53,962 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:17:22,355 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:16:53,962 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:17:22,355 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:16:53,962 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 42%|██████████████████████████████████▍ | 379/892 [37:28<53:30, 6.26s/it]g-point operations will not be computed-03 04:16:53,962 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 42%|██████████████████████████████████▍ | 379/892 [37:28<53:30, 6.26s/it]g-point operations will not be computed-03 04:16:53,962 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:17:28,423 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:16:53,962 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:17:28,423 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:16:53,962 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 43%|██████████████████████████████████▌ | 380/892 [37:34<52:54, 6.20s/it]g-point operations will not be computed-03 04:16:53,962 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 43%|██████████████████████████████████▌ | 380/892 [37:34<52:54, 6.20s/it]g-point operations will not be computed-03 04:16:53,962 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:17:34,340 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:16:53,962 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:17:34,340 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:16:53,962 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 43%|██████████████████████████████████▌ | 381/892 [37:40<52:09, 6.13s/it]g-point operations will not be computed-03 04:16:53,962 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:17:38,842 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:16:53,962 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:17:38,842 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:16:53,962 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:17:38,842 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:16:53,962 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 43%|██████████████████████████████████▋ | 382/892 [37:46<51:34, 6.07s/it]g-point operations will not be computed-03 04:16:53,962 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:17:44,753 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:16:53,962 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:17:44,753 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:16:53,962 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:17:44,753 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:16:53,962 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 43%|██████████████████████████████████▊ | 383/892 [37:52<50:55, 6.00s/it][WARNING|modeling_utils.py:388] 2022-03-03 04:17:49,123 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 43%|██████████████████████████████████▊ | 383/892 [37:52<50:55, 6.00s/it][WARNING|modeling_utils.py:388] 2022-03-03 04:17:49,123 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:17:53,336 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:17:49,123 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:17:53,336 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:17:49,123 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.0459, 'learning_rate': 0.000764, 'epoch': 0.43} +[WARNING|modeling_utils.py:388] 2022-03-03 04:17:53,336 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:17:49,123 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:17:59,033 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:17:49,123 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:17:59,033 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:17:49,123 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.9586, 'learning_rate': 0.0007660000000000001, 'epoch': 0.43} +[WARNING|modeling_utils.py:388] 2022-03-03 04:18:03,220 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:17:49,123 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:18:03,220 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:17:49,123 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 43%|███████████████████████████████████ | 386/892 [38:09<48:27, 5.75s/it]g-point operations will not be computed-03 04:17:49,123 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:18:07,306 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:17:49,123 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:18:09,919 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:17:49,123 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:18:09,919 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:17:49,123 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.0477, 'learning_rate': 0.0007700000000000001, 'epoch': 0.43} +[WARNING|modeling_utils.py:388] 2022-03-03 04:18:13,909 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:17:49,123 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 43%|███████████████████████████████████▏ | 388/892 [38:20<46:26, 5.53s/it]g-point operations will not be computed-03 04:17:49,123 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 43%|███████████████████████████████████▏ | 388/892 [38:20<46:26, 5.53s/it]g-point operations will not be computed-03 04:17:49,123 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:18:17,824 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:17:49,123 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:18:17,824 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:17:49,123 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:18:17,824 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:17:49,123 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 44%|███████████████████████████████████▎ | 389/892 [38:25<45:35, 5.44s/it][WARNING|modeling_utils.py:388] 2022-03-03 04:18:21,778 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 44%|███████████████████████████████████▎ | 389/892 [38:25<45:35, 5.44s/it][WARNING|modeling_utils.py:388] 2022-03-03 04:18:21,778 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:18:25,433 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:18:21,778 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:18:25,433 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:18:21,778 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:18:27,878 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:18:21,778 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:18:30,182 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:18:21,778 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:18:30,182 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:18:21,778 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:18:32,556 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:18:21,778 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:18:32,556 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:18:21,778 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:18:32,556 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:18:21,778 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 44%|███████████████████████████████████▌ | 392/892 [38:39<41:17, 4.96s/it][WARNING|modeling_utils.py:388] 2022-03-03 04:18:35,860 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:18:37,905 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:18:35,860 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:18:37,905 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:18:35,860 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 44%|███████████████████████████████████▋ | 393/892 [38:43<39:29, 4.75s/it][WARNING|modeling_utils.py:388] 2022-03-03 04:18:40,078 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:18:42,015 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:18:40,078 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:18:42,015 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:18:40,078 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 44%|███████████████████████████████████▊ | 394/892 [38:47<37:33, 4.52s/it][WARNING|modeling_utils.py:388] 2022-03-03 04:18:44,008 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 44%|███████████████████████████████████▊ | 395/892 [38:51<35:25, 4.28s/it]g-point operations will not be computed-03 04:18:44,008 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 44%|███████████████████████████████████▊ | 395/892 [38:51<35:25, 4.28s/it]g-point operations will not be computed-03 04:18:44,008 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 44%|███████████████████████████████████▊ | 395/892 [38:51<35:25, 4.28s/it][WARNING|modeling_utils.py:388] 2022-03-03 04:18:47,630 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 44%|███████████████████████████████████▉ | 396/892 [38:54<32:59, 3.99s/it][WARNING|modeling_utils.py:388] 2022-03-03 04:18:50,821 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 44%|███████████████████████████████████▉ | 396/892 [38:54<32:59, 3.99s/it][WARNING|modeling_utils.py:388] 2022-03-03 04:18:50,821 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 45%|████████████████████████████████████ | 397/892 [38:57<30:16, 3.67s/it]g-point operations will not be computed-03 04:18:50,821 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 45%|████████████████████████████████████ | 397/892 [38:57<30:16, 3.67s/it]g-point operations will not be computed-03 04:18:50,821 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:18:54,901 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:18:53,659 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:18:54,901 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:18:53,659 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 45%|████████████████████████████████████▏ | 398/892 [39:00<27:30, 3.34s/it][WARNING|modeling_utils.py:388] 2022-03-03 04:18:56,152 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 45%|████████████████████████████████████▏ | 399/892 [39:02<24:51, 3.03s/it][WARNING|modeling_utils.py:388] 2022-03-03 04:18:58,389 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 45%|████████████████████████████████████▏ | 399/892 [39:02<24:51, 3.03s/it][WARNING|modeling_utils.py:388] 2022-03-03 04:18:58,389 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 45%|████████████████████████████████████▎ | 400/892 [39:05<23:47, 2.90s/it]g-point operations will not be computed-03 04:18:58,389 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 45%|████████████████████████████████████▎ | 400/892 [39:05<23:47, 2.90s/it]g-point operations will not be computed-03 04:18:58,389 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 45%|████████████���███████████████████████▎ | 400/892 [39:05<23:47, 2.90s/it][WARNING|modeling_utils.py:388] 2022-03-03 04:19:02,462 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 45%|████████████████████████████████████▎ | 400/892 [39:05<23:47, 2.90s/it][WARNING|modeling_utils.py:388] 2022-03-03 04:19:02,462 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:19:06,179 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:19:02,462 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 45%|████████████████████████████████████▍ | 401/892 [39:12<35:20, 4.32s/it]g-point operations will not be computed-03 04:19:02,462 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 45%|████████████████████████████████████▍ | 401/892 [39:12<35:20, 4.32s/it]g-point operations will not be computed-03 04:19:02,462 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 45%|████████████████████████████████████▍ | 401/892 [39:12<35:20, 4.32s/it][WARNING|modeling_utils.py:388] 2022-03-03 04:19:09,915 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 45%|████████████████████████████████████▍ | 401/892 [39:12<35:20, 4.32s/it][WARNING|modeling_utils.py:388] 2022-03-03 04:19:09,915 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:19:13,483 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:19:09,915 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:19:13,483 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:19:09,915 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 45%|████████████████████████████████████▌ | 402/892 [39:20<42:28, 5.20s/it]g-point operations will not be computed-03 04:19:09,915 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:19:18,952 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:19:09,915 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:19:18,952 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:19:09,915 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 45%|████████████████████████████████████▌ | 403/892 [39:27<47:20, 5.81s/it]g-point operations will not be computed-03 04:19:09,915 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 45%|████████████████████████████████████▌ | 403/892 [39:27<47:20, 5.81s/it]g-point operations will not be computed-03 04:19:09,915 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.4463, 'learning_rate': 0.0008020000000000001, 'epoch': 0.45} + 45%|████████████████████████████████████▌ | 403/892 [39:27<47:20, 5.81s/it]g-point operations will not be computed-03 04:19:09,915 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 45%|████████████████████████████████████▌ | 403/892 [39:27<47:20, 5.81s/it]g-point operations will not be computed-03 04:19:09,915 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 45%|████████████████████████████████████▋ | 404/892 [39:34<50:37, 6.22s/it][WARNING|modeling_utils.py:388] 2022-03-03 04:19:31,578 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 45%|████████████████████████████████████▋ | 404/892 [39:34<50:37, 6.22s/it][WARNING|modeling_utils.py:388] 2022-03-03 04:19:31,578 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.0944, 'learning_rate': 0.000804, 'epoch': 0.45} + 45%|████████████████████████████████████▋ | 404/892 [39:34<50:37, 6.22s/it][WARNING|modeling_utils.py:388] 2022-03-03 04:19:31,578 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 45%|████████████████████████████████████▊ | 405/892 [39:41<52:50, 6.51s/it][WARNING|modeling_utils.py:388] 2022-03-03 04:19:31,578 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 45%|████████████████████████████████████▊ | 405/892 [39:41<52:50, 6.51s/it][WARNING|modeling_utils.py:388] 2022-03-03 04:19:31,578 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.3147, 'learning_rate': 0.0008060000000000001, 'epoch': 0.45} + 45%|████████████████████████████████████▊ | 405/892 [39:41<52:50, 6.51s/it][WARNING|modeling_utils.py:388] 2022-03-03 04:19:31,578 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 45%|████████████████████████████████████▊ | 405/892 [39:41<52:50, 6.51s/it][WARNING|modeling_utils.py:388] 2022-03-03 04:19:31,578 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 45%|████████████████████████████████████▊ | 405/892 [39:41<52:50, 6.51s/it][WARNING|modeling_utils.py:388] 2022-03-03 04:19:31,578 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 46%|████████████████████████████████████▊ | 406/892 [39:48<54:04, 6.67s/it][WARNING|modeling_utils.py:388] 2022-03-03 04:19:31,578 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:19:47,481 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:19:31,578 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:19:47,481 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:19:31,578 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 46%|████████████████████████████████████▉ | 407/892 [39:55<54:39, 6.76s/it]g-point operations will not be computed-03 04:19:31,578 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 46%|████████████████████████████████████▉ | 407/892 [39:55<54:39, 6.76s/it]g-point operations will not be computed-03 04:19:31,578 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.163, 'learning_rate': 0.0008100000000000001, 'epoch': 0.46} + 46%|████████████████████████████████████▉ | 407/892 [39:55<54:39, 6.76s/it]g-point operations will not be computed-03 04:19:31,578 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:19:57,953 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:19:31,578 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:19:57,953 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:19:31,578 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.0185, 'learning_rate': 0.0008120000000000001, 'epoch': 0.46} +[WARNING|modeling_utils.py:388] 2022-03-03 04:19:57,953 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:19:31,578 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:19:57,953 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:19:31,578 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 46%|█████████████████████████████████████▏ | 409/892 [40:09<55:34, 6.90s/it]g-point operations will not be computed-03 04:19:31,578 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 46%|█████████████████████████████████████▏ | 409/892 [40:09<55:34, 6.90s/it]g-point operations will not be computed-03 04:19:31,578 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:20:08,517 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:19:31,578 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:20:08,517 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:19:31,578 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:20:08,517 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:19:31,578 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 46%|█████████████████████████████████████▏ | 410/892 [40:16<55:33, 6.92s/it]g-point operations will not be computed-03 04:19:31,578 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 46%|█████████████████████████████████████▏ | 410/892 [40:16<55:33, 6.92s/it]g-point operations will not be computed-03 04:19:31,578 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 46%|█████████████████████████████████████▏ | 410/892 [40:16<55:33, 6.92s/it]g-point operations will not be computed-03 04:19:31,578 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 46%|█████████████████████████████████████▏ | 410/892 [40:16<55:33, 6.92s/it]g-point operations will not be computed-03 04:19:31,578 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 46%|█████████████████████████████████████▏ | 410/892 [40:16<55:33, 6.92s/it]g-point operations will not be computed-03 04:19:31,578 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 46%|█████████████████████████████████████▎ | 411/892 [40:23<55:16, 6.89s/it]g-point operations will not be computed-03 04:19:31,578 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:20:22,134 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:19:31,578 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:20:22,134 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:19:31,578 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:20:22,134 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:19:31,578 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 46%|█████████████████████████████████████▍ | 412/892 [40:30<54:36, 6.83s/it]g-point operations will not be computed-03 04:19:31,578 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:20:28,921 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:19:31,578 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:20:28,921 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:19:31,578 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:20:28,921 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:19:31,578 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 46%|█████████████████████████████████████▌ | 413/892 [40:37<54:29, 6.82s/it]g-point operations will not be computed-03 04:19:31,578 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 46%|█████████████████████████████████████▌ | 413/892 [40:37<54:29, 6.82s/it]g-point operations will not be computed-03 04:19:31,578 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 46%|█████████████████████████████████████▌ | 413/892 [40:37<54:29, 6.82s/it]g-point operations will not be computed-03 04:19:31,578 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:20:38,970 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:19:31,578 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:20:38,970 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:19:31,578 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.8392, 'learning_rate': 0.000824, 'epoch': 0.46} +[WARNING|modeling_utils.py:388] 2022-03-03 04:20:38,970 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:19:31,578 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:20:38,970 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:19:31,578 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:20:38,970 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:19:31,578 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 47%|█████████████████████████████████████▋ | 415/892 [40:50<53:46, 6.76s/it]g-point operations will not be computed-03 04:19:31,578 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:20:49,063 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:19:31,578 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:20:49,063 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:19:31,578 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:20:49,063 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:19:31,578 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 47%|█████████████████████████████████████▊ | 416/892 [40:57<53:26, 6.74s/it]g-point operations will not be computed-03 04:19:31,578 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 47%|█████████████████████████████████████▊ | 416/892 [40:57<53:26, 6.74s/it]g-point operations will not be computed-03 04:19:31,578 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 47%|█████████████████████████████████████▊ | 416/892 [40:57<53:26, 6.74s/it]g-point operations will not be computed-03 04:19:31,578 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:20:59,011 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:19:31,578 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:20:59,011 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:19:31,578 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.9795, 'learning_rate': 0.00083, 'epoch': 0.47} +[WARNING|modeling_utils.py:388] 2022-03-03 04:20:59,011 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:19:31,578 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:21:05,741 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:19:31,578 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:21:05,741 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:19:31,578 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.216, 'learning_rate': 0.000832, 'epoch': 0.47} +[WARNING|modeling_utils.py:388] 2022-03-03 04:21:05,741 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:19:31,578 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:21:05,741 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:19:31,578 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:21:05,741 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:19:31,578 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 47%|██████████████████████████████████████ | 419/892 [41:17<52:39, 6.68s/it][WARNING|modeling_utils.py:388] 2022-03-03 04:21:14,060 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 47%|██████████████████████████████████████ | 419/892 [41:17<52:39, 6.68s/it][WARNING|modeling_utils.py:388] 2022-03-03 04:21:14,060 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 47%|██████████████████████████████████████ | 419/892 [41:17<52:39, 6.68s/it][WARNING|modeling_utils.py:388] 2022-03-03 04:21:14,060 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 47%|██████████████��███████████████████████ | 419/892 [41:17<52:39, 6.68s/it][WARNING|modeling_utils.py:388] 2022-03-03 04:21:14,060 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 47%|██████████████████████████████████████▏ | 420/892 [41:23<52:15, 6.64s/it][WARNING|modeling_utils.py:388] 2022-03-03 04:21:14,060 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 47%|██████████████████████████████████████▏ | 420/892 [41:23<52:15, 6.64s/it][WARNING|modeling_utils.py:388] 2022-03-03 04:21:14,060 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:21:23,759 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:21:14,060 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:21:23,759 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:21:14,060 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 47%|██████████████████████████████████████▏ | 421/892 [41:30<51:47, 6.60s/it]g-point operations will not be computed-03 04:21:14,060 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 47%|██████████████████████████████████████▏ | 421/892 [41:30<51:47, 6.60s/it]g-point operations will not be computed-03 04:21:14,060 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 47%|██████████████████████████████████████▏ | 421/892 [41:30<51:47, 6.60s/it]g-point operations will not be computed-03 04:21:14,060 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:21:31,843 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:21:14,060 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:21:31,843 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:21:14,060 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.2313, 'learning_rate': 0.00084, 'epoch': 0.47} +[WARNING|modeling_utils.py:388] 2022-03-03 04:21:31,843 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:21:14,060 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:21:38,217 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:21:14,060 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:21:38,217 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:21:14,060 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.1135, 'learning_rate': 0.000842, 'epoch': 0.47} +[WARNING|modeling_utils.py:388] 2022-03-03 04:21:38,217 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:21:14,060 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:21:44,711 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:21:14,060 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:21:44,711 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:21:14,060 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.0778, 'learning_rate': 0.000844, 'epoch': 0.48} +[WARNING|modeling_utils.py:388] 2022-03-03 04:21:44,711 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:21:14,060 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:21:44,711 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:21:14,060 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:21:44,711 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:21:14,060 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 48%|██████████████████████████████████████▌ | 425/892 [41:56<51:27, 6.61s/it]g-point operations will not be computed-03 04:21:14,060 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:21:54,827 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:21:14,060 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:21:54,827 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:21:14,060 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:21:54,827 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:21:14,060 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 48%|██████████████████████████████████████▋ | 426/892 [42:02<50:41, 6.53s/it]g-point operations will not be computed-03 04:21:14,060 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:22:01,089 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:21:14,060 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:22:01,089 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:21:14,060 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:22:01,089 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:21:14,060 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 48%|██████████████████████████████████████▊ | 427/892 [42:09<49:56, 6.44s/it]g-point operations will not be computed-03 04:21:14,060 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:22:07,283 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:21:14,060 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:22:07,283 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:21:14,060 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:22:07,283 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:21:14,060 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 48%|██████████████████████████████████████▊ | 428/892 [42:15<49:17, 6.37s/it]g-point operations will not be computed-03 04:21:14,060 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 48%|██████████████████████████████████████▊ | 428/892 [42:15<49:17, 6.37s/it]g-point operations will not be computed-03 04:21:14,060 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:22:15,132 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:21:14,060 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:22:15,132 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:21:14,060 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 48%|██████████████████████████████████████▉ | 429/892 [42:21<48:54, 6.34s/it]g-point operations will not be computed-03 04:21:14,060 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 48%|██████████████████████████████████████▉ | 429/892 [42:21<48:54, 6.34s/it]g-point operations will not be computed-03 04:21:14,060 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:22:21,292 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:21:14,060 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:22:21,292 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:21:14,060 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 48%|███████████████████████████████████████ | 430/892 [42:27<48:25, 6.29s/it]g-point operations will not be computed-03 04:21:14,060 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 48%|███████████████████████████████████████ | 430/892 [42:27<48:25, 6.29s/it]g-point operations will not be computed-03 04:21:14,060 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:22:27,397 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:21:14,060 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 48%|███████████████████████████████████████▏ | 431/892 [42:33<47:50, 6.23s/it]g-point operations will not be computed-03 04:21:14,060 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 48%|███████████████████████████████████████▏ | 431/892 [42:33<47:50, 6.23s/it]g-point operations will not be computed-03 04:21:14,060 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.4418, 'learning_rate': 0.000858, 'epoch': 0.48} +[WARNING|modeling_utils.py:388] 2022-03-03 04:22:33,429 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:21:14,060 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 48%|███████████████████████████████████████▏ | 432/892 [42:39<47:17, 6.17s/it]g-point operations will not be computed-03 04:21:14,060 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 48%|███████████████████████████████████████▏ | 432/892 [42:39<47:17, 6.17s/it]g-point operations will not be computed-03 04:21:14,060 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.1764, 'learning_rate': 0.00086, 'epoch': 0.48} +[WARNING|modeling_utils.py:388] 2022-03-03 04:22:39,465 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:21:14,060 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:22:39,465 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:21:14,060 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 49%|███████████████████████████████████████▎ | 433/892 [42:45<46:52, 6.13s/it]g-point operations will not be computed-03 04:21:14,060 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:22:43,946 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:21:14,060 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:22:43,946 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:21:14,060 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:22:43,946 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:21:14,060 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 49%|███████████████████████████████████████▍ | 434/892 [42:51<46:16, 6.06s/it]g-point operations will not be computed-03 04:21:14,060 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:22:49,749 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:21:14,060 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:22:49,749 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:21:14,060 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:22:49,749 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:21:14,060 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 49%|███████████████████████████████████████▌ | 435/892 [42:57<45:23, 5.96s/it][WARNING|modeling_utils.py:388] 2022-03-03 04:22:54,078 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 49%|███████████████████████████████████████▌ | 435/892 [42:57<45:23, 5.96s/it][WARNING|modeling_utils.py:388] 2022-03-03 04:22:54,078 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:22:58,238 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:22:54,078 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:22:58,238 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:22:54,078 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.2176, 'learning_rate': 0.0008680000000000001, 'epoch': 0.49} +[WARNING|modeling_utils.py:388] 2022-03-03 04:23:02,456 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:22:54,078 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 49%|███████████████████████████████████████▋ | 437/892 [43:08<43:47, 5.78s/it]g-point operations will not be computed-03 04:22:54,078 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 49%|███████████████████████████████████████▋ | 437/892 [43:08<43:47, 5.78s/it]g-point operations will not be computed-03 04:22:54,078 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:23:06,552 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:22:54,078 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:23:06,552 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:22:54,078 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:23:06,552 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:22:54,078 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 49%|███████████████████████████████████████▊ | 438/892 [43:14<42:53, 5.67s/it][WARNING|modeling_utils.py:388] 2022-03-03 04:23:10,634 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 49%|███████████████████████████████████████▊ | 438/892 [43:14<42:53, 5.67s/it][WARNING|modeling_utils.py:388] 2022-03-03 04:23:10,634 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:23:14,481 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:23:10,634 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:23:14,481 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:23:10,634 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.1533, 'learning_rate': 0.000874, 'epoch': 0.49} +[WARNING|modeling_utils.py:388] 2022-03-03 04:23:18,277 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:23:10,634 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:23:18,277 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:23:10,634 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 49%|███████████████████████████████████████▉ | 440/892 [43:24<40:37, 5.39s/it]g-point operations will not be computed-03 04:23:10,634 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:23:22,015 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:23:10,634 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:23:24,350 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:23:10,634 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:23:24,350 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:23:10,634 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:23:26,736 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:23:10,634 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:23:28,928 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:23:10,634 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:23:28,928 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:23:10,634 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.9092, 'learning_rate': 0.00088, 'epoch': 0.5} + 50%|████████████████████████████████████████▏ | 443/892 [43:38<35:52, 4.79s/it]g-point operations will not be computed-03 04:23:10,634 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 50%|██████████████████████████████████��█████▏ | 443/892 [43:38<35:52, 4.79s/it]g-point operations will not be computed-03 04:23:10,634 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 50%|████████████████████████████████████████▏ | 443/892 [43:38<35:52, 4.79s/it][WARNING|modeling_utils.py:388] 2022-03-03 04:23:34,281 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 50%|████████████████████████████████████████▎ | 444/892 [43:42<34:01, 4.56s/it]g-point operations will not be computed-03 04:23:34,281 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 50%|████████████████████████████████████████▎ | 444/892 [43:42<34:01, 4.56s/it]g-point operations will not be computed-03 04:23:34,281 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 50%|████████████████████████████████████████▎ | 444/892 [43:42<34:01, 4.56s/it][WARNING|modeling_utils.py:388] 2022-03-03 04:23:38,239 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 50%|████████████████████████████████████████▍ | 445/892 [43:45<32:08, 4.32s/it]g-point operations will not be computed-03 04:23:38,239 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 50%|████████████████████████████████████████▍ | 445/892 [43:45<32:08, 4.32s/it]g-point operations will not be computed-03 04:23:38,239 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 50%|████████████████████████████████████████▍ | 445/892 [43:45<32:08, 4.32s/it][WARNING|modeling_utils.py:388] 2022-03-03 04:23:41,898 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 50%|████████████████████████████████████████▌ | 446/892 [43:49<29:55, 4.03s/it][WARNING|modeling_utils.py:388] 2022-03-03 04:23:45,122 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 50%|████████████████████████████████████████▌ | 446/892 [43:49<29:55, 4.03s/it][WARNING|modeling_utils.py:388] 2022-03-03 04:23:45,122 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:23:46,566 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:23:45,122 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:23:46,566 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:23:45,122 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 50%|████████████████████████████████████████▌ | 447/892 [43:52<27:30, 3.71s/it][WARNING|modeling_utils.py:388] 2022-03-03 04:23:48,148 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 50%|████████████████████████████████████████▋ | 448/892 [43:55<27:09, 3.67s/it]g-point operations will not be computed-03 04:23:48,148 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 50%|████████████████████████████████████████▋ | 448/892 [43:55<27:09, 3.67s/it]g-point operations will not be computed-03 04:23:48,148 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 50%|████████████████████████████████████████▋ | 448/892 [43:55<27:09, 3.67s/it][WARNING|modeling_utils.py:388] 2022-03-03 04:23:51,788 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 50%|████████████████████████████████████████▊ | 449/892 [43:59<26:29, 3.59s/it][WARNING|modeling_utils.py:388] 2022-03-03 04:23:55,026 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 50%|████████████████████████████████████████▊ | 449/892 [43:59<26:29, 3.59s/it][WARNING|modeling_utils.py:388] 2022-03-03 04:23:55,026 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 50%|████████████████████████████████████████▊ | 450/892 [44:02<24:40, 3.35s/it]g-point operations will not be computed-03 04:23:55,026 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 50%|████████████████████████████████████████▊ | 450/892 [44:02<24:40, 3.35s/it]g-point operations will not be computed-03 04:23:55,026 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 50%|████████████████████████████████████████▊ | 450/892 [44:02<24:40, 3.35s/it][WARNING|modeling_utils.py:388] 2022-03-03 04:23:59,117 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 50%|████████████████████████████████████████▊ | 450/892 [44:02<24:40, 3.35s/it][WARNING|modeling_utils.py:388] 2022-03-03 04:23:59,117 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:24:02,865 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:23:59,117 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 51%|████████████████████████████████████████▉ | 451/892 [44:09<34:13, 4.66s/it]g-point operations will not be computed-03 04:23:59,117 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 51%|████████████████████████████████████████▉ | 451/892 [44:09<34:13, 4.66s/it]g-point operations will not be computed-03 04:23:59,117 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 51%|████████████████████████████████████████▉ | 451/892 [44:09<34:13, 4.66s/it][WARNING|modeling_utils.py:388] 2022-03-03 04:24:06,642 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 51%|████████████████████████████████████████▉ | 451/892 [44:09<34:13, 4.66s/it][WARNING|modeling_utils.py:388] 2022-03-03 04:24:06,642 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 51%|████████████████████████████████████████▉ | 451/892 [44:09<34:13, 4.66s/it][WARNING|modeling_utils.py:388] 2022-03-03 04:24:06,642 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 51%|█████████████████████████████████████████ | 452/892 [44:16<40:00, 5.45s/it][WARNING|modeling_utils.py:388] 2022-03-03 04:24:13,915 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 51%|█████████████████████████████████████████ | 452/892 [44:16<40:00, 5.45s/it][WARNING|modeling_utils.py:388] 2022-03-03 04:24:13,915 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.48, 'learning_rate': 0.0009000000000000001, 'epoch': 0.51} + 51%|█████████████████████████████████████████ | 452/892 [44:16<40:00, 5.45s/it][WARNING|modeling_utils.py:388] 2022-03-03 04:24:13,915 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 51%|█████████████████████████████████████████▏ | 453/892 [44:24<43:55, 6.00s/it][WARNING|modeling_utils.py:388] 2022-03-03 04:24:13,915 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 51%|█████████████████████████████████████████▏ | 453/892 [44:24<43:55, 6.00s/it][WARNING|modeling_utils.py:388] 2022-03-03 04:24:13,915 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.4334, 'learning_rate': 0.000902, 'epoch': 0.51} + 51%|█████████████████████████████████████████▏ | 453/892 [44:24<43:55, 6.00s/it][WARNING|modeling_utils.py:388] 2022-03-03 04:24:13,915 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 51%|█████████████████████████████████████████▏ | 453/892 [44:24<43:55, 6.00s/it][WARNING|modeling_utils.py:388] 2022-03-03 04:24:13,915 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 51%|█████████████████████████████████████████▏ | 453/892 [44:24<43:55, 6.00s/it][WARNING|modeling_utils.py:388] 2022-03-03 04:24:13,915 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 51%|█████████████████████████████████████████▏ | 454/892 [44:31<46:19, 6.35s/it][WARNING|modeling_utils.py:388] 2022-03-03 04:24:13,915 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 51%|█████████████████████████████████████████▏ | 454/892 [44:31<46:19, 6.35s/it][WARNING|modeling_utils.py:388] 2022-03-03 04:24:13,915 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:24:31,832 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:24:13,915 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 51%|█████████████████████████████████████████▎ | 455/892 [44:38<47:54, 6.58s/it]g-point operations will not be computed-03 04:24:13,915 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 51%|█████████████████████████████████████████▎ | 455/892 [44:38<47:54, 6.58s/it]g-point operations will not be computed-03 04:24:13,915 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.4256, 'learning_rate': 0.000906, 'epoch': 0.51} + 51%|█████████████████████████████████████████▎ | 455/892 [44:38<47:54, 6.58s/it]g-point operations will not be computed-03 04:24:13,915 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 51%|█████████████████████████████████████████▎ | 455/892 [44:38<47:54, 6.58s/it]g-point operations will not be computed-03 04:24:13,915 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 51%|█████████████████████████████████████████▍ | 456/892 [44:45<48:50, 6.72s/it][WARNING|modeling_utils.py:388] 2022-03-03 04:24:42,464 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 51%|█████████████████████████████████████████▍ | 456/892 [44:45<48:50, 6.72s/it][WARNING|modeling_utils.py:388] 2022-03-03 04:24:42,464 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.3247, 'learning_rate': 0.0009080000000000001, 'epoch': 0.51} + 51%|█████████████████████████████████████████▍ | 456/892 [44:45<48:50, 6.72s/it][WARNING|modeling_utils.py:388] 2022-03-03 04:24:42,464 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 51%|█████████████████████████████████████████▍ | 457/892 [44:52<49:18, 6.80s/it][WARNING|modeling_utils.py:388] 2022-03-03 04:24:42,464 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 51%|█████████████████████████████████████████▍ | 457/892 [44:52<49:18, 6.80s/it][WARNING|modeling_utils.py:388] 2022-03-03 04:24:42,464 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.2336, 'learning_rate': 0.00091, 'epoch': 0.51} + 51%|█████████████████████████████████████████▍ | 457/892 [44:52<49:18, 6.80s/it][WARNING|modeling_utils.py:388] 2022-03-03 04:24:42,464 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 51%|█████████████████████████████████████████▍ | 457/892 [44:52<49:18, 6.80s/it][WARNING|modeling_utils.py:388] 2022-03-03 04:24:42,464 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 51%|█████████████████████████████████████████▍ | 457/892 [44:52<49:18, 6.80s/it][WARNING|modeling_utils.py:388] 2022-03-03 04:24:42,464 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 51%|█████████████████████████████████████████▌ | 458/892 [44:59<49:43, 6.87s/it][WARNING|modeling_utils.py:388] 2022-03-03 04:24:42,464 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:24:58,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:24:42,464 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:24:58,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:24:42,464 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 51%|█████████████████████████████████████████▋ | 459/892 [45:06<49:53, 6.91s/it]g-point operations will not be computed-03 04:24:42,464 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 51%|█████████████████████████████████████████▋ | 459/892 [45:06<49:53, 6.91s/it]g-point operations will not be computed-03 04:24:42,464 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.2095, 'learning_rate': 0.0009140000000000001, 'epoch': 0.51} + 51%|█████████████████████████████████████████▋ | 459/892 [45:06<49:53, 6.91s/it]g-point operations will not be computed-03 04:24:42,464 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:25:08,562 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:24:42,464 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:25:08,562 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:24:42,464 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.3384, 'learning_rate': 0.000916, 'epoch': 0.52} +[WARNING|modeling_utils.py:388] 2022-03-03 04:25:08,562 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:24:42,464 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:25:08,562 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:24:42,464 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 52%|█████████████████████████████████████████▊ | 461/892 [45:20<49:21, 6.87s/it]g-point operations will not be computed-03 04:24:42,464 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 52%|█████████████████████████████████████████▊ | 461/892 [45:20<49:21, 6.87s/it]g-point operations will not be computed-03 04:24:42,464 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:25:18,786 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:24:42,464 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:25:18,786 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:24:42,464 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 52%|█████████████████████████████████████████▉ | 462/892 [45:27<49:08, 6.86s/it]g-point operations will not be computed-03 04:24:42,464 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 52%|█████████████████████████████████████████▉ | 462/892 [45:27<49:08, 6.86s/it]g-point operations will not be computed-03 04:24:42,464 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.3328, 'learning_rate': 0.00092, 'epoch': 0.52} +[WARNING|modeling_utils.py:388] 2022-03-03 04:25:27,261 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:24:42,464 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 52%|██████████████████████████████████████████ | 463/892 [45:33<48:43, 6.82s/it]g-point operations will not be computed-03 04:24:42,464 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 52%|██████████████████████████████████████████ | 463/892 [45:33<48:43, 6.82s/it]g-point operations will not be computed-03 04:24:42,464 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.5567, 'learning_rate': 0.0009220000000000001, 'epoch': 0.52} + 52%|██████████████████████████████████████████ | 463/892 [45:33<48:43, 6.82s/it]g-point operations will not be computed-03 04:24:42,464 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:25:35,582 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:24:42,464 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:25:35,582 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:24:42,464 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:25:38,969 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:24:42,464 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:25:38,969 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:24:42,464 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 52%|██████████████████████████████████████████▏ | 465/892 [45:47<47:53, 6.73s/it]g-point operations will not be computed-03 04:24:42,464 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 52%|██████████████████████████████████████████▏ | 465/892 [45:47<47:53, 6.73s/it]g-point operations will not be computed-03 04:24:42,464 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:25:45,590 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:24:42,464 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:25:45,590 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:24:42,464 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 52%|██████████████████████████████████████████▎ | 466/892 [45:53<47:46, 6.73s/it]g-point operations will not be computed-03 04:24:42,464 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 52%|██████████████████████████████████████████▎ | 466/892 [45:53<47:46, 6.73s/it]g-point operations will not be computed-03 04:24:42,464 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.3116, 'learning_rate': 0.0009280000000000001, 'epoch': 0.52} + 52%|██████████████████████████████████████████▎ | 466/892 [45:53<47:46, 6.73s/it]g-point operations will not be computed-03 04:24:42,464 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:25:55,439 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:24:42,464 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:25:55,439 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:24:42,464 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.0797, 'learning_rate': 0.00093, 'epoch': 0.52} +[WARNING|modeling_utils.py:388] 2022-03-03 04:25:55,439 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:24:42,464 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:26:01,973 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:24:42,464 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:26:01,973 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:24:42,464 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.1186, 'learning_rate': 0.0009320000000000001, 'epoch': 0.52} +[WARNING|modeling_utils.py:388] 2022-03-03 04:26:01,973 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:24:42,464 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:26:01,973 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:24:42,464 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:26:01,973 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:24:42,464 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 53%|██████████████████████████████████████████▌ | 469/892 [46:13<46:44, 6.63s/it]g-point operations will not be computed-03 04:24:42,464 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:26:11,915 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:24:42,464 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:26:11,915 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:24:42,464 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:26:11,915 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:24:42,464 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 53%|██████████████████████████████████████████▋ | 470/892 [46:20<46:21, 6.59s/it]g-point operations will not be computed-03 04:24:42,464 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:26:18,353 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:24:42,464 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:26:18,353 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:24:42,464 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:26:18,353 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:24:42,464 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 53%|██████████████████████████████████████████▊ | 471/892 [46:26<45:48, 6.53s/it]g-point operations will not be computed-03 04:24:42,464 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:26:24,765 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:24:42,464 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:26:24,765 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:24:42,464 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:26:24,765 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:24:42,464 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 53%|██████████████████████████████████████████▊ | 472/892 [46:32<45:29, 6.50s/it]g-point operations will not be computed-03 04:24:42,464 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 53%|██████████████████████████████████████████▊ | 472/892 [46:32<45:29, 6.50s/it]g-point operations will not be computed-03 04:24:42,464 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 53%|██████████████████████████████████████████▊ | 472/892 [46:32<45:29, 6.50s/it]g-point operations will not be computed-03 04:24:42,464 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 53%|██████████████████████████████████████████▊ | 472/892 [46:32<45:29, 6.50s/it]g-point operations will not be computed-03 04:24:42,464 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:26:34,256 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:24:42,464 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:26:34,256 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:24:42,464 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:26:34,256 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:24:42,464 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:26:34,256 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:24:42,464 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:26:40,513 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:24:42,464 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:26:40,513 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:24:42,464 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:26:40,513 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:24:42,464 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:26:40,513 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:24:42,464 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:26:40,513 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:24:42,464 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 53%|███████████████████████████████████████████▏ | 475/892 [46:52<45:08, 6.49s/it][WARNING|modeling_utils.py:388] 2022-03-03 04:26:48,965 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 53%|███████████████████████████████████████████▏ | 475/892 [46:52<45:08, 6.49s/it][WARNING|modeling_utils.py:388] 2022-03-03 04:26:48,965 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:26:53,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:26:48,965 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:26:53,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:26:48,965 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.418, 'learning_rate': 0.000948, 'epoch': 0.53} +[WARNING|modeling_utils.py:388] 2022-03-03 04:26:53,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:26:48,965 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:26:59,670 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:26:48,965 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:26:59,670 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:26:48,965 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.5494, 'learning_rate': 0.00095, 'epoch': 0.53} +[WARNING|modeling_utils.py:388] 2022-03-03 04:26:59,670 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:26:48,965 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:27:05,755 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:26:48,965 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:27:05,755 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:26:48,965 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.0258, 'learning_rate': 0.0009519999999999999, 'epoch': 0.54} +[WARNING|modeling_utils.py:388] 2022-03-03 04:27:05,755 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:26:48,965 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:27:11,827 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:26:48,965 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:27:11,827 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:26:48,965 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.0919, 'learning_rate': 0.000954, 'epoch': 0.54} +[WARNING|modeling_utils.py:388] 2022-03-03 04:27:11,827 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:26:48,965 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:27:17,895 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:26:48,965 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:27:17,895 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:26:48,965 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.0294, 'learning_rate': 0.0009559999999999999, 'epoch': 0.54} +[WARNING|modeling_utils.py:388] 2022-03-03 04:27:17,895 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:26:48,965 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:27:17,895 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:26:48,965 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:27:17,895 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:26:48,965 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 54%|███████████████████████████████████████████▋ | 481/892 [47:28<41:47, 6.10s/it][WARNING|modeling_utils.py:388] 2022-03-03 04:27:25,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:27:28,314 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:27:25,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 54%|███████████████████████████████████████████▊ | 482/892 [47:34<41:21, 6.05s/it]g-point operations will not be computed-03 04:27:25,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 54%|███████████████████████████████████████████▊ | 482/892 [47:34<41:21, 6.05s/it]g-point operations will not be computed-03 04:27:25,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.3622, 'learning_rate': 0.00096, 'epoch': 0.54} +[WARNING|modeling_utils.py:388] 2022-03-03 04:27:34,128 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:27:25,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:27:34,128 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:27:25,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 54%|███████████████████████████████████████████▊ | 483/892 [47:40<40:39, 5.96s/it]g-point operations will not be computed-03 04:27:25,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 54%|███████████████████████████████████████████▊ | 483/892 [47:40<40:39, 5.96s/it]g-point operations will not be computed-03 04:27:25,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:27:39,836 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:27:25,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:27:39,836 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:27:25,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 54%|███████████████████████████████████████████▉ | 484/892 [47:46<39:58, 5.88s/it]g-point operations will not be computed-03 04:27:25,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:27:44,069 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:27:25,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:27:44,069 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:27:25,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:27:44,069 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:27:25,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 54%|████████████████████████████████████████████ | 485/892 [47:51<39:18, 5.79s/it][WARNING|modeling_utils.py:388] 2022-03-03 04:27:48,269 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 54%|████████████████████████████████████████████ | 485/892 [47:51<39:18, 5.79s/it][WARNING|modeling_utils.py:388] 2022-03-03 04:27:48,269 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:27:52,365 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:27:48,269 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:27:52,365 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:27:48,269 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 4.9877, 'learning_rate': 0.000968, 'epoch': 0.54} +[WARNING|modeling_utils.py:388] 2022-03-03 04:27:56,503 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:27:48,269 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:27:56,503 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:27:48,269 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 55%|████████████████████████████████████████████▏ | 487/892 [48:02<38:08, 5.65s/it]g-point operations will not be computed-03 04:27:48,269 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:28:00,551 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:27:48,269 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:28:00,551 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:27:48,269 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:28:00,551 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:27:48,269 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 55%|████████████████████████████████████████████▎ | 488/892 [48:08<37:18, 5.54s/it][WARNING|modeling_utils.py:388] 2022-03-03 04:28:04,495 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:28:06,998 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:28:04,495 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 55%|████████████████████████████████████████████▍ | 489/892 [48:13<36:18, 5.41s/it]g-point operations will not be computed-03 04:28:04,495 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 55%|████████████████████████████████████████████▍ | 489/892 [48:13<36:18, 5.41s/it]g-point operations will not be computed-03 04:28:04,495 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:28:10,793 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:28:04,495 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:28:10,793 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:28:04,495 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:28:10,793 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:28:04,495 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 55%|████████████████████████████████████████████▍ | 490/892 [48:18<35:17, 5.27s/it][WARNING|modeling_utils.py:388] 2022-03-03 04:28:14,459 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:28:16,739 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:28:14,459 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:28:16,739 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:28:14,459 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 55%|████████████████████████████████████████████▌ | 491/892 [48:22<34:00, 5.09s/it][WARNING|modeling_utils.py:388] 2022-03-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 55%|████████████████████████████████████████████▌ | 491/892 [48:22<34:00, 5.09s/it][WARNING|modeling_utils.py:388] 2022-03-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:28:22,252 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:28:22,252 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:28:24,341 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:28:26,265 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:28:26,265 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:28:28,150 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:28:28,150 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:28:29,894 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:28:33,229 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:28:33,229 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:28:34,846 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:28:34,846 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:28:36,309 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:28:39,101 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:28:39,101 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:28:40,418 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:28:40,418 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:28:42,751 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:28:42,751 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:28:44,932 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-03 04:28:44,932 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[INFO|trainer.py:2369] 2022-03-03 04:28:46,559 >> Batch size = 8aluation *****e number of tokens of the input, floating-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%| | 0/331 [00:00> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 2/331 [00:02<06:42, 1.22s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▊ | 3/331 [00:04<08:53, 1.63s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█ | 4/331 [00:06<10:05, 1.85s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 5/331 [00:09<11:40, 2.15s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 6/331 [00:12<12:45, 2.35s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 7/331 [00:14<12:49, 2.38s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|██ | 8/331 [00:17<13:07, 2.44s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 9/331 [00:20<13:39, 2.55s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 10/331 [00:23<14:37, 2.73s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▋ | 11/331 [00:25<14:08, 2.65s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 12/331 [00:28<13:56, 2.62s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 13/331 [00:30<13:46, 2.60s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▍ | 14/331 [00:33<13:33, 2.57s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 15/331 [00:36<14:55, 2.83s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 16/331 [00:40<15:48, 3.01s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|████▏ | 17/331 [00:43<15:54, 3.04s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|████▍ | 18/331 [00:45<14:36, 2.80s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 19/331 [00:48<14:16, 2.74s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▉ | 20/331 [00:50<13:24, 2.59s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|█████▏ | 21/331 [00:53<13:48, 2.67s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▍ | 22/331 [00:56<14:59, 2.91s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▋ | 23/331 [01:00<16:26, 3.20s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▉ | 24/331 [01:04<17:22, 3.40s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████▏ | 25/331 [01:07<16:42, 3.28s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████▍ | 26/331 [01:09<15:30, 3.05s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████▋ | 27/331 [01:13<15:34, 3.08s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████▉ | 28/331 [01:15<15:05, 2.99s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|███████▏ | 29/331 [01:18<14:36, 2.90s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|███████▍ | 30/331 [01:21<14:00, 2.79s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 9%|███████▋ | 31/331 [01:23<13:25, 2.69s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|███████▉ | 32/331 [01:26<13:07, 2.63s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|████████▏ | 33/331 [01:28<13:08, 2.64s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 10%|████████▍ | 34/331 [01:31<12:59, 2.63s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▋ | 35/331 [01:34<13:10, 2.67s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|████████▉ | 36/331 [01:37<13:48, 2.81s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|█████████▏ | 37/331 [01:40<14:35, 2.98s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 11%|█████████▍ | 38/331 [01:43<14:48, 3.03s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|█████████▋ | 39/331 [01:46<14:50, 3.05s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|█████████▉ | 40/331 [01:49<13:33, 2.79s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 12%|██████████▏ | 41/331 [01:51<12:53, 2.67s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|██████████▍ | 42/331 [01:54<13:45, 2.86s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|██████████▋ | 43/331 [01:58<14:32, 3.03s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 13%|██████████▉ | 44/331 [02:01<14:55, 3.12s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|███████████▏ | 45/331 [02:04<14:02, 2.95s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|███████████▍ | 46/331 [02:06<12:56, 2.73s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 14%|███████████▋ | 47/331 [02:08<12:06, 2.56s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 15%|███████████▉ | 48/331 [02:11<12:24, 2.63s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 15%|████████████▏ | 49/331 [02:14<13:02, 2.78s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 15%|████████████▍ | 50/331 [02:17<12:53, 2.75s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 15%|████████████▋ | 51/331 [02:20<13:13, 2.84s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 16%|████████████▉ | 52/331 [02:22<12:39, 2.72s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 16%|█████████████▏ | 53/331 [02:25<12:39, 2.73s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 16%|█████████████▍ | 54/331 [02:27<12:06, 2.62s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 17%|█████████████▋ | 55/331 [02:31<13:06, 2.85s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 17%|█████████████▊ | 56/331 [02:33<12:52, 2.81s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 17%|██████████████ | 57/331 [02:36<12:27, 2.73s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 18%|██████████████▎ | 58/331 [02:39<12:57, 2.85s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 18%|██████████████▌ | 59/331 [02:41<12:15, 2.71s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 18%|██████████████▊ | 60/331 [02:44<11:54, 2.64s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 18%|███████████████ | 61/331 [02:47<12:18, 2.73s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 19%|███████████████▎ | 62/331 [02:49<12:19, 2.75s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 19%|███████████████▌ | 63/331 [02:53<13:29, 3.02s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 19%|███████████████▊ | 64/331 [02:56<13:06, 2.95s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 20%|████████████████ | 65/331 [02:59<12:53, 2.91s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 20%|████████████████▎ | 66/331 [03:03<14:12, 3.22s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 20%|████████████████▌ | 67/331 [03:06<14:46, 3.36s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 21%|████████████████▊ | 68/331 [03:10<14:51, 3.39s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 21%|█████████████████ | 69/331 [03:13<14:26, 3.31s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 21%|█████████████████▎ | 70/331 [03:16<14:10, 3.26s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 21%|█████████████████▌ | 71/331 [03:20<14:20, 3.31s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 22%|█████████████████▊ | 72/331 [03:23<14:17, 3.31s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 22%|██████████████████ | 73/331 [03:26<13:45, 3.20s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 22%|██████████████████▎ | 74/331 [03:29<13:23, 3.13s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 23%|██████████████████▌ | 75/331 [03:32<13:30, 3.16s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 23%|██████████████████▊ | 76/331 [03:35<12:48, 3.02s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 23%|███████████████████ | 77/331 [03:37<12:27, 2.94s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 24%|███████████████████▎ | 78/331 [03:40<11:51, 2.81s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 24%|███████████████████▌ | 79/331 [03:42<11:22, 2.71s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 24%|███████████████████▊ | 80/331 [03:45<11:13, 2.68s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 24%|████████████████████ | 81/331 [03:48<11:39, 2.80s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 25%|████████████████████▎ | 82/331 [03:51<11:25, 2.75s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 25%|████████████████████▌ | 83/331 [03:54<11:49, 2.86s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 25%|████████████████████▊ | 84/331 [03:57<12:36, 3.06s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 26%|█████████████████████ | 85/331 [04:00<11:41, 2.85s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 26%|█████████████████████▎ | 86/331 [04:03<12:18, 3.01s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 26%|█████████████████████▌ | 87/331 [04:06<11:55, 2.93s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 27%|█████████████████████▊ | 88/331 [04:09<11:38, 2.87s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 27%|██████████████████████ | 89/331 [04:11<10:48, 2.68s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 27%|██████████████████████▎ | 90/331 [04:13<10:19, 2.57s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 27%|██████████████████████▌ | 91/331 [04:16<10:49, 2.71s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 28%|██████████████████████▊ | 92/331 [04:18<10:09, 2.55s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 28%|███████████████████████ | 93/331 [04:21<10:17, 2.59s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 28%|███████████████████████▎ | 94/331 [04:24<10:32, 2.67s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 29%|███████████████████████▌ | 95/331 [04:27<10:39, 2.71s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 29%|███████████████████████▊ | 96/331 [04:29<10:41, 2.73s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 29%|████████████████████████ | 97/331 [04:32<10:17, 2.64s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 30%|███████████��████████████▎ | 98/331 [04:35<10:37, 2.74s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 30%|████████████████████████▌ | 99/331 [04:38<10:30, 2.72s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 30%|████████████████████████▍ | 100/331 [04:40<10:04, 2.62s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 31%|████████████████████████▋ | 101/331 [04:43<09:58, 2.60s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 31%|████████████████████████▉ | 102/331 [04:46<10:49, 2.83s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 31%|█████████████████████████▏ | 103/331 [04:48<10:16, 2.71s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 31%|█████████████████████████▍ | 104/331 [04:51<10:15, 2.71s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 32%|█████████████████████████▋ | 105/331 [04:54<10:16, 2.73s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 32%|█████████████████████████▉ | 106/331 [04:57<10:15, 2.74s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 32%|██████████████████████████▏ | 107/331 [04:59<09:30, 2.55s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 33%|██████████████████████████▍ | 108/331 [05:01<09:16, 2.50s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 33%|██████████████████████████▋ | 109/331 [05:04<09:16, 2.51s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 33%|██████████████████████████▉ | 110/331 [05:07<09:46, 2.65s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 34%|███████████████████████████▏ | 111/331 [05:09<09:48, 2.68s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 34%|███████████████████████████▍ | 112/331 [05:12<09:49, 2.69s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 34%|███████████████████████████▋ | 113/331 [05:14<09:19, 2.57s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 34%|███████████████████████████▉ | 114/331 [05:17<09:24, 2.60s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 35%|████████████████████████████▏ | 115/331 [05:20<09:21, 2.60s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 35%|████████████████████████████▍ | 116/331 [05:22<09:40, 2.70s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 35%|████████████████████████████▋ | 117/331 [05:25<09:39, 2.71s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 36%|████████████████████████████▉ | 118/331 [05:28<09:21, 2.64s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 36%|█████████████████████████████ | 119/331 [05:30<09:25, 2.67s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 36%|█████████████████████████████▎ | 120/331 [05:33<09:25, 2.68s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 37%|█████████████████████████████▌ | 121/331 [05:36<09:56, 2.84s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 37%|█████████████████████████████▊ | 122/331 [05:39<09:44, 2.80s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 37%|██████████████████████████████ | 123/331 [05:42<10:21, 2.99s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 37%|██████████████████████████████▎ | 124/331 [05:45<10:08, 2.94s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 38%|██████████████████████████████▌ | 125/331 [05:49<10:43, 3.13s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 38%|██████████████████████████████▊ | 126/331 [05:52<10:46, 3.15s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 38%|███████████████████████████████ | 127/331 [05:56<11:09, 3.28s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 39%|███████████████████████████████▎ | 128/331 [05:59<11:07, 3.29s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 39%|███████████████████████████████▌ | 129/331 [06:02<10:53, 3.24s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 39%|███████████████████████████████▌ | 129/331 [06:02<10:53, 3.24s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 39%|███████████████████████████████▌ | 129/331 [06:02<10:53, 3.24s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 40%|████████████████████████████████ | 131/331 [06:09<11:12, 3.36s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 40%|████████████████████████████████▎ | 132/331 [06:12<10:38, 3.21s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 40%|████████████████████████████████▌ | 133/331 [06:14<10:00, 3.03s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 40%|████████████████████████████████▊ | 134/331 [06:17<09:36, 2.93s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 41%|█████████████████████████████████ | 135/331 [06:20<09:41, 2.97s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 41%|█████████████████████████████████▎ | 136/331 [06:24<09:57, 3.06s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 41%|█████████████████████████████████▌ | 137/331 [06:27<10:21, 3.21s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 42%|█████████████████████████████████▊ | 138/331 [06:31<10:36, 3.30s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 42%|██████████████████████████████████ | 139/331 [06:33<09:23, 2.94s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 42%|██████████████████████████████████▎ | 140/331 [06:36<10:03, 3.16s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 43%|██████████████████████████████████▌ | 141/331 [06:39<09:31, 3.01s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 43%|██████████████████████████████████▌ | 141/331 [06:39<09:31, 3.01s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 43%|██████████████████████████████████▌ | 141/331 [06:39<09:31, 3.01s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 43%|██████████████████████████████████▉ | 143/331 [06:45<09:42, 3.10s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 44%|███████████████████████████████████▏ | 144/331 [06:48<09:16, 2.98s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 44%|███████████████████████████████████▍ | 145/331 [06:51<09:09, 2.95s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 44%|███████████████████████████████████▋ | 146/331 [06:54<09:31, 3.09s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 44%|███████████████████████████████████▉ | 147/331 [06:57<09:11, 3.00s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 45%|████████████████████████████████████▏ | 148/331 [06:59<08:33, 2.80s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 45%|████████████████████████████████████▍ | 149/331 [07:02<08:00, 2.64s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 45%|████████████████████████████████████▋ | 150/331 [07:05<08:19, 2.76s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 46%|████████████████████████████████████▉ | 151/331 [07:07<08:09, 2.72s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 46%|█████████████████████████████████████▏ | 152/331 [07:10<07:49, 2.62s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 46%|█████████████████████████████████████▍ | 153/331 [07:12<07:47, 2.63s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 47%|█████████████████████████████████████▋ | 154/331 [07:15<08:06, 2.75s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 47%|█████████████████████████████████████▉ | 155/331 [07:19<08:29, 2.90s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 47%|██████████████████████████████████████▏ | 156/331 [07:22<08:43, 2.99s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 47%|██████████████████████████████████████▍ | 157/331 [07:25<09:01, 3.11s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 48%|██████████████████████████████████████▋ | 158/331 [07:28<09:06, 3.16s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 48%|██████████████████████████████████████▉ | 159/331 [07:32<09:07, 3.18s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 48%|███████████████████████████████████████▏ | 160/331 [07:34<08:36, 3.02s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 49%|███████████████████████████████████████▍ | 161/331 [07:37<08:22, 2.96s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 49%|███████████████████████████████████████▋ | 162/331 [07:41<08:53, 3.16s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 49%|███████████████████████████████████████▉ | 163/331 [07:44<08:58, 3.20s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 50%|████████████████████████████████████████▏ | 164/331 [07:47<08:28, 3.04s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 50%|████████████████████████████████████████▍ | 165/331 [07:50<08:15, 2.98s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 50%|████████████████████████████████████████▌ | 166/331 [07:52<08:04, 2.94s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 50%|████████████████████████████████████████▊ | 167/331 [07:56<08:15, 3.02s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 51%|█████████████████████████████████████████ | 168/331 [07:58<07:47, 2.87s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 51%|█████████████████████████████████████████▎ | 169/331 [08:01<07:54, 2.93s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 51%|█████████████████████████████████████████▌ | 170/331 [08:04<07:30, 2.80s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 52%|█████████████████████████████████████████▊ | 171/331 [08:06<07:25, 2.78s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 52%|██████████████████████████████████████████ | 172/331 [08:09<07:08, 2.69s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 52%|██████████████████████████████████████████▎ | 173/331 [08:12<07:17, 2.77s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 53%|██████████████████████████████████████████▌ | 174/331 [08:14<06:56, 2.65s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 53%|██████████████████████████████████████████▊ | 175/331 [08:17<07:00, 2.70s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 53%|███████████████████████████████████████████ | 176/331 [08:20<06:46, 2.62s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 53%|███████████████████████████████████████████▎ | 177/331 [08:23<07:07, 2.78s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 54%|███████████████████████████████████████████▌ | 178/331 [08:26<07:34, 2.97s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 54%|███████████████████████████████████████████▊ | 179/331 [08:30<07:57, 3.14s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 54%|████████████████████████████████████████████ | 180/331 [08:33<07:50, 3.12s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 55%|████████████████████████████████████████████▎ | 181/331 [08:36<07:45, 3.10s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 55%|████████████████████████████████████████████▌ | 182/331 [08:38<07:09, 2.88s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 55%|████████████████████████████████████████████▊ | 183/331 [08:40<06:36, 2.68s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 56%|█████████████████████████████████████████████ | 184/331 [08:42<06:09, 2.52s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 56%|█████████████████████████████████████████████▎ | 185/331 [08:44<05:42, 2.35s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 56%|█████████████████████████████████████████████▌ | 186/331 [08:47<05:53, 2.43s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 56%|█████████████████████████████████████████████▊ | 187/331 [08:50<06:23, 2.66s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 57%|██████████████████████████████████████████████ | 188/331 [08:53<06:23, 2.68s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 57%|██████████████████████████████████████████████▎ | 189/331 [08:55<06:06, 2.58s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 57%|██████████████████████████████████████████████▍ | 190/331 [08:58<05:52, 2.50s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 58%|██████████████████████████████████████████████▋ | 191/331 [09:00<05:48, 2.49s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 58%|██████████████████████████████████████████████▉ | 192/331 [09:02<05:37, 2.43s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 58%|███████████████████████████████████████████████▏ | 193/331 [09:06<06:04, 2.64s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 59%|███████████████████████████████████████████████▍ | 194/331 [09:08<05:43, 2.51s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 59%|███████████████████████████████████████████████▋ | 195/331 [09:10<05:34, 2.46s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 59%|███████████████████████████████████████████████▉ | 196/331 [09:13<05:40, 2.52s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 60%|████████████████████████████████████████████████▏ | 197/331 [09:16<05:55, 2.65s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 60%|████████████████████████████████████████████████▍ | 198/331 [09:18<05:39, 2.55s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 60%|████████████████████████████████████████████████▋ | 199/331 [09:21<05:43, 2.60s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 60%|████████████████████████████████████████████████▉ | 200/331 [09:23<05:25, 2.48s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 61%|█████████████████████████████████████████████████▏ | 201/331 [09:25<05:22, 2.48s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 61%|█████████████████████████████████████████████████▍ | 202/331 [09:28<05:29, 2.55s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 61%|█████████████████████████████████████████████████▋ | 203/331 [09:31<05:27, 2.56s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 62%|█████████████████████████████████████████████████▉ | 204/331 [09:34<05:47, 2.73s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 62%|██████████████████████████████████████████████████▏ | 205/331 [09:37<05:49, 2.77s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 62%|██████████████████████████████████████████████████▍ | 206/331 [09:39<05:44, 2.75s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 63%|██████████████████████████████████████████████████▋ | 207/331 [09:43<05:58, 2.89s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 63%|██████████████████████████████████████████████████▉ | 208/331 [09:46<06:03, 2.96s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 63%|███████████████████████████████████████████████████▏ | 209/331 [09:48<05:33, 2.74s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 63%|███████████████████████████████████████████████████▍ | 210/331 [09:50<05:10, 2.57s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 64%|███████████████████████████████████████████████████▋ | 211/331 [09:53<05:12, 2.61s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 64%|███████████████████████████████████████████████████▉ | 212/331 [09:55<04:58, 2.51s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 64%|████████████████████████████████████████████████████ | 213/331 [09:58<04:57, 2.52s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 65%|████████████████████████████████████████████████████▎ | 214/331 [10:00<04:42, 2.41s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 65%|████████████████████████████████████████████████████▌ | 215/331 [10:02<04:29, 2.32s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 65%|████████████████████████████████████████████████████▊ | 216/331 [10:05<04:57, 2.59s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 66%|█████████████████████████████████████████████████████ | 217/331 [10:08<04:57, 2.61s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 66%|█████████████████████████████████████████████████████▎ | 218/331 [10:11<05:10, 2.75s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 66%|█████████████████████████████████████████████████████▌ | 219/331 [10:14<05:06, 2.73s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 66%|█████████████████████████████████████████████████████▊ | 220/331 [10:16<04:52, 2.64s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 67%|██████████████████████████████████████████████████████ | 221/331 [10:19<04:54, 2.68s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 67%|██████████████████████████████████████████████████████▎ | 222/331 [10:21<04:38, 2.55s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 67%|██████████████████████████████████████████████████████▌ | 223/331 [10:24<04:39, 2.59s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 68%|██████���███████████████████████████████████████████████▊ | 224/331 [10:26<04:40, 2.62s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 68%|███████████████████████████████████████████████████████ | 225/331 [10:29<04:39, 2.64s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 68%|███████████████████████████████████████████████████████▎ | 226/331 [10:32<04:54, 2.80s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 69%|███████████████████████████████████████████████████████▌ | 227/331 [10:35<04:47, 2.76s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 69%|███████████████████████████████████████████████████████▊ | 228/331 [10:38<04:39, 2.72s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 69%|████████████████████████████████████████████████████████ | 229/331 [10:40<04:38, 2.73s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 69%|████████████████████████████████████████████████████████▎ | 230/331 [10:43<04:30, 2.67s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 70%|████████████████████████████████████████████████████████▌ | 231/331 [10:46<04:36, 2.77s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 70%|████████████████████████████████████████████████████████▊ | 232/331 [10:48<04:30, 2.73s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 70%|█████████████████████████████████████████████████████████ | 233/331 [10:52<04:37, 2.83s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 71%|█████████████████████████████████████████████████████████▎ | 234/331 [10:54<04:22, 2.71s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 71%|█████████████████████████████████████████████████████████▌ | 235/331 [10:56<04:11, 2.62s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 71%|█████████████████████████████████████████████████████████▊ | 236/331 [11:00<04:37, 2.92s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 72%|████��████████████████████████████████████████████████████▉ | 237/331 [11:03<04:48, 3.07s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 72%|██████████████████████████████████████████████████████████▏ | 238/331 [11:06<04:45, 3.07s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 72%|██████████████████████████████████████████████████████████▍ | 239/331 [11:10<04:43, 3.09s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 73%|██████████████████████████████████████████████████████████▋ | 240/331 [11:13<04:45, 3.14s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 73%|██████████████████████████████████████████████████████████▉ | 241/331 [11:16<04:48, 3.20s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 73%|███████████████████████████████████████████████████████████▏ | 242/331 [11:19<04:45, 3.21s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 73%|███████████████████████████████████████████████████████████▍ | 243/331 [11:23<04:42, 3.21s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 74%|███████████████████████████████████████████████████████████▋ | 244/331 [11:26<04:47, 3.30s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 74%|███████████████████████████████████████████████████████████▉ | 245/331 [11:29<04:33, 3.18s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 74%|████████████████████████████████████████████████████████████▏ | 246/331 [11:33<04:44, 3.35s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 75%|████████████████████████████████████████████████████████████▍ | 247/331 [11:36<04:34, 3.26s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 75%|████████████████████████████████████████████████████████████▋ | 248/331 [11:38<04:14, 3.07s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 75%|████████████████████████████████████████████████████████████▉ | 249/331 [11:41<03:53, 2.84s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 76%|█████████████████████████████████████████████████████████████▏ | 250/331 [11:43<03:40, 2.72s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 76%|█████████████████████████████████████████████████████████████▍ | 251/331 [11:46<03:43, 2.79s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 76%|█████████████████████████████████████████████████████████████▋ | 252/331 [11:49<03:31, 2.67s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 76%|█████████████████████████████████████████████████████████████▉ | 253/331 [11:52<03:39, 2.81s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 77%|██████████████████████████████████████████████████████████████▏ | 254/331 [11:54<03:33, 2.77s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 77%|██████████████████████████████████████████████████████████████▍ | 255/331 [11:58<03:38, 2.87s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 77%|██████████████████████████████████████████████████████████████▋ | 256/331 [12:00<03:29, 2.79s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 78%|██████████████████████████████████████████████████████████████▉ | 257/331 [12:03<03:33, 2.88s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 78%|███████████████████████████████████████████████████████████████▏ | 258/331 [12:06<03:20, 2.74s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 78%|███████████████████████████████████████████████████████████████▍ | 259/331 [12:08<03:14, 2.71s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 79%|███████████████████████████████████████████████████████████████▋ | 260/331 [12:11<03:18, 2.80s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 79%|███████████████████████████████████████████████████████████████▊ | 261/331 [12:14<03:04, 2.64s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 79%|█████████████████████████████████████████████████████��██████████ | 262/331 [12:16<03:03, 2.66s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 79%|████████████████████████████████████████████████████████████████▎ | 263/331 [12:19<03:10, 2.80s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 80%|████████████████████████████████████████████████████████████████▌ | 264/331 [12:22<03:00, 2.69s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 80%|████████████████████████████████████████████████████████████████▊ | 265/331 [12:24<02:53, 2.63s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 80%|█████████████████████████████████████████████████████████████████ | 266/331 [12:27<02:47, 2.57s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 81%|█████████████████████████████████████████████████████████████████▎ | 267/331 [12:30<02:55, 2.74s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 81%|█████████████████████████████████████████████████████████████████▌ | 268/331 [12:33<02:52, 2.74s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 81%|█████████████████████████████████████████████████████████████████▊ | 269/331 [12:36<02:59, 2.90s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 82%|██████████████████████████████████████████████████████████████████ | 270/331 [12:39<02:56, 2.90s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 82%|██████████████████████████████████████████████████████████████████▎ | 271/331 [12:42<03:00, 3.01s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 82%|██████████████████████████████████████████████████████████████████▌ | 272/331 [12:45<02:51, 2.90s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 82%|██████████████████████████████████████████████████████████████████▊ | 273/331 [12:48<02:50, 2.95s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 83%|███████████████████████████████████████████████████████████████████ | 274/331 [12:51<02:55, 3.07s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 83%|███████████████████████████████████████████████████████████████████▎ | 275/331 [12:54<02:55, 3.14s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 83%|███████████████████████████████████████████████████████████████████▌ | 276/331 [12:57<02:42, 2.96s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 84%|███████████████████████████████████████████████████████████████████▊ | 277/331 [13:00<02:35, 2.88s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 84%|████████████████████████████████████████████████████████████████████ | 278/331 [13:02<02:30, 2.83s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 84%|████████████████████████████████████████████████████████████████████▎ | 279/331 [13:06<02:39, 3.06s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 85%|████████████████████████████████████████████████████████████████████▌ | 280/331 [13:09<02:33, 3.02s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 85%|████████████████████████████████████████████████████████████████████▊ | 281/331 [13:12<02:36, 3.13s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 85%|█████████████████████████████████████████████████████████████████████ | 282/331 [13:15<02:33, 3.14s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 85%|█████████████████████████████████████████████████████████████████████▎ | 283/331 [13:19<02:34, 3.22s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 86%|█████████████████████████████████████████████████████████████████████▍ | 284/331 [13:22<02:34, 3.29s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 86%|█████████████████████████████████████████████████████████████████████▋ | 285/331 [13:26<02:33, 3.33s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 86%|█████████████████████████████████████████████████████████████████████▉ | 286/331 [13:29<02:31, 3.36s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 87%|██��███████████████████████████████████████████████████████████████████▏ | 287/331 [13:33<02:31, 3.45s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 87%|██████████████████████████████████████████████████████████████████████▍ | 288/331 [13:36<02:27, 3.43s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 87%|██████████████████████████████████████████████████████████████████████▋ | 289/331 [13:39<02:15, 3.22s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 87%|██████████████████████████████████████████████████████████████████████▋ | 289/331 [13:39<02:15, 3.22s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 87%|██████████████████████████████████████████████████████████████████████▋ | 289/331 [13:39<02:15, 3.22s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 88%|███████████████████████████████████████████████████████████████████████▏ | 291/331 [13:44<01:55, 2.88s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 88%|███████████████████████████████████████████████████████████████████████▍ | 292/331 [13:47<01:49, 2.82s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 89%|███████████████████████████████████████████████████████████████████████▋ | 293/331 [13:50<01:47, 2.83s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 89%|███████████████████████████████████████████████████████████████████████▉ | 294/331 [13:52<01:39, 2.70s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 89%|████████████████████████████████████████████████████████████████████████▏ | 295/331 [13:54<01:35, 2.64s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 89%|████████████████████████████████████████████████████████████████████████▍ | 296/331 [13:57<01:29, 2.55s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 90%|████████████████████████████████████████████████████████████████████████▋ | 297/331 [14:00<01:36, 2.85s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 90%|██████████��█████████████████████████████████████████████████████████████▉ | 298/331 [14:04<01:41, 3.06s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 90%|█████████████████████████████████████████████████████████████████████████▏ | 299/331 [14:07<01:34, 2.95s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 91%|█████████████████████████████████████████████████████████████████████████▍ | 300/331 [14:10<01:30, 2.93s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 91%|█████████████████████████████████████████████████████████████████████████▋ | 301/331 [14:12<01:26, 2.88s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 91%|█████████████████████████████████████████████████████████████████████████▉ | 302/331 [14:15<01:21, 2.82s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 92%|██████████████████████████████████████████████████████████████████████████▏ | 303/331 [14:17<01:15, 2.71s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 92%|██████████████████████████████████████████████████████████████████████████▍ | 304/331 [14:20<01:15, 2.79s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 92%|██████████████████████████████████████████████████████████████████████████▋ | 305/331 [14:24<01:15, 2.92s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 92%|██████████████████████████████████████████████████████████████████████████▉ | 306/331 [14:27<01:17, 3.09s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 93%|███████████████████████████████████████████████████████████████████████████▏ | 307/331 [14:31<01:17, 3.23s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 93%|███████████████████████████████████████████████████████████████████████████▎ | 308/331 [14:35<01:18, 3.42s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 93%|███████████████████████████████████████████████████████████████████████████▌ | 309/331 [14:38<01:16, 3.46s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 94%|███████████████████████████████████████████████████████████████████████████▊ | 310/331 [14:41<01:07, 3.21s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 94%|████████████████████████████████████████████████████████████████████████████ | 311/331 [14:44<01:04, 3.21s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 94%|████████████████████████████████████████████████████████████████████████████▎ | 312/331 [14:46<00:57, 3.01s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 95%|████████████████████████████████████████████████████████████████████████████▌ | 313/331 [14:49<00:52, 2.94s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 95%|████████████████████████████████████████████████████████████████████████████▊ | 314/331 [14:52<00:50, 2.97s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 95%|█████████████████████████████████████████████████████████████████████████████ | 315/331 [14:56<00:48, 3.06s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 95%|█████████████████████████████████████████████████████████████████████████████▎ | 316/331 [14:59<00:46, 3.08s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 96%|█████████████████████████████████████████████████████████████████████████████▌ | 317/331 [15:02<00:45, 3.22s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 96%|█████████████████████████████████████████████████████████████████████████████▊ | 318/331 [15:05<00:39, 3.04s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 96%|██████████████████████████████████████████████████████████████████████████████ | 319/331 [15:07<00:34, 2.90s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 97%|██████████████████████████████████████████████████████████████████████████████▎ | 320/331 [15:10<00:32, 2.91s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 97%|██████████████████████████████████████████████████████████████████████████████▌ | 321/331 [15:13<00:28, 2.87s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 97%|██████████████████████████████████████████████████████████████████████████████▊ | 322/331 [15:16<00:27, 3.02s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 98%|███████████████████████████████████████████████████████████████████████████████ | 323/331 [15:19<00:23, 2.92s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 98%|███████████████████████████████████████████████████████████████████████████████▎ | 324/331 [15:22<00:21, 3.02s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 98%|███████████████████████████████████████████████████████████████████████████████▌ | 325/331 [15:26<00:18, 3.05s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 98%|███████████████████████████████████████████████████████████████████████████████▊ | 326/331 [15:29<00:15, 3.09s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 99%|████████████████████████████████████████████████████████████████████████████████ | 327/331 [15:32<00:12, 3.10s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 99%|████████████████████████████████████████████████████████████████████████████████▎| 328/331 [15:35<00:09, 3.14s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 99%|████████████████████████████████████████████████████████████████████████████████▌| 329/331 [15:38<00:06, 3.07s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +100%|████████████████████████████████████████████████████████████████████████████████▊| 330/331 [15:42<00:03, 3.24s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +100%|█████████████████████████████████████████████████████████████████████████████████| 331/331 [15:43<00:00, 2.81s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +100%|█████████████████████████████████████████████████████████████████████████████████| 331/331 [15:43<00:00, 2.81s/it]g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +03/03/2022 04:44:33 - INFO - datasets.metric - Removing /home/sanchit_huggingface_co/.cache/huggingface/metrics/wer/default/default_experiment-1-0.arrow +[INFO|configuration_utils.py:438] 2022-03-03 04:44:33,883 >> Configuration saved in ./checkpoint-500/config.json g-point operations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[INFO|feature_extraction_utils.py:324] 2022-03-03 04:44:38,919 >> Configuration saved in ./checkpoint-500/preprocessor_config.jsonerations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[INFO|feature_extraction_utils.py:324] 2022-03-03 04:44:38,919 >> Configuration saved in ./checkpoint-500/preprocessor_config.jsonerations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[INFO|feature_extraction_utils.py:324] 2022-03-03 04:44:38,919 >> Configuration saved in ./checkpoint-500/preprocessor_config.jsonerations will not be computed-03 04:28:19,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +03/03/2022 04:46:11 - WARNING - huggingface_hub.repository - Adding files tracked by Git LFS: ['wandb/run-20220303_033953-1eigbhyo/run-1eigbhyo.wandb']. This may take a bit of time if the files are large.