diff --git "a/wandb/run-20220310_212039-1nikmzrh/files/output.log" "b/wandb/run-20220310_212039-1nikmzrh/files/output.log" new file mode 100644--- /dev/null +++ "b/wandb/run-20220310_212039-1nikmzrh/files/output.log" @@ -0,0 +1,5728 @@ + + + 0%| | 0/17840 [00:00> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:20:44,520 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:20:46,281 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:20:48,029 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%| | 1/17840 [00:07<38:35:37, 7.79s/it] + + 0%| | 1/17840 [00:07<38:35:37, 7.79s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:20:49,937 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:20:51,608 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:20:53,264 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:20:54,936 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%| | 2/17840 [00:14<35:46:18, 7.22s/it] + 0%| | 2/17840 [00:14<35:46:18, 7.22s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:20:56,660 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:20:58,383 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:21:00,070 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 11.0856, 'learning_rate': 9e-08, 'epoch': 0.0} +[WARNING|modeling_utils.py:388] 2022-03-10 21:21:01,746 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + + 0%| | 3/17840 [00:21<34:50:31, 7.03s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:21:03,492 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:21:05,181 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:21:06,842 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:21:08,517 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%| | 4/17840 [00:28<34:19:47, 6.93s/it] + + 0%| | 4/17840 [00:28<34:19:47, 6.93s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:21:10,303 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:21:11,966 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:21:13,621 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 11.0751, 'learning_rate': 1.5000000000000002e-07, 'epoch': 0.01} +[WARNING|modeling_utils.py:388] 2022-03-10 21:21:15,245 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%| | 5/17840 [00:34<33:58:07, 6.86s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:21:17,005 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:21:18,644 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:21:20,295 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 11.0764, 'learning_rate': 1.8e-07, 'epoch': 0.01} +[WARNING|modeling_utils.py:388] 2022-03-10 21:21:21,926 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%| | 6/17840 [00:41<33:40:16, 6.80s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:21:23,669 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:21:25,276 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:21:26,930 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 11.0548, 'learning_rate': 2.1e-07, 'epoch': 0.01} +[WARNING|modeling_utils.py:388] 2022-03-10 21:21:28,543 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + + 0%| | 7/17840 [00:48<33:22:42, 6.74s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:21:30,292 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:21:31,883 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 11.0916, 'learning_rate': 2.4000000000000003e-07, 'epoch': 0.01} +[WARNING|modeling_utils.py:388] 2022-03-10 21:21:33,531 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:21:35,138 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + + 0%| | 8/17840 [00:54<33:09:03, 6.69s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:21:36,852 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:21:38,458 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:21:40,095 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:21:41,711 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%| | 9/17840 [01:01<32:57:52, 6.66s/it] + + 0%| | 9/17840 [01:01<32:57:52, 6.66s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:21:43,444 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:21:45,056 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:21:46,697 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 11.0499, 'learning_rate': 3.0000000000000004e-07, 'epoch': 0.01} +[WARNING|modeling_utils.py:388] 2022-03-10 21:21:48,297 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%| | 10/17840 [01:07<32:51:14, 6.63s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:21:50,010 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:21:51,557 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:21:53,145 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 11.0538, 'learning_rate': 3.2999999999999996e-07, 'epoch': 0.01} +[WARNING|modeling_utils.py:388] 2022-03-10 21:21:54,723 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%| | 11/17840 [01:14<32:32:14, 6.57s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:21:56,391 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:21:57,955 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:21:59,537 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 11.0245, 'learning_rate': 3.6e-07, 'epoch': 0.01} +[WARNING|modeling_utils.py:388] 2022-03-10 21:22:01,128 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%| | 12/17840 [01:20<32:17:19, 6.52s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:22:02,799 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:22:04,382 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:22:05,960 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:22:07,531 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%| | 13/17840 [01:27<32:06:34, 6.48s/it] + + 0%| | 13/17840 [01:27<32:06:34, 6.48s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:22:09,204 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:22:10,784 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:22:12,368 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:22:13,939 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%| | 14/17840 [01:33<31:59:49, 6.46s/it] + + 0%| | 14/17840 [01:33<31:59:49, 6.46s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:22:15,584 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:22:17,155 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:22:18,686 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:22:20,218 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%| | 15/17840 [01:39<31:43:10, 6.41s/it] + + 0%| | 15/17840 [01:39<31:43:10, 6.41s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:22:21,873 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:22:23,432 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:22:24,953 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:22:26,497 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%| | 16/17840 [01:46<31:31:42, 6.37s/it] + + 0%| | 16/17840 [01:46<31:31:42, 6.37s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:22:28,172 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:22:29,694 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:22:31,242 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:22:32,759 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%| | 17/17840 [01:52<31:22:14, 6.34s/it] + + 0%| | 17/17840 [01:52<31:22:14, 6.34s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:22:34,344 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:22:35,827 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:22:37,387 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:22:38,907 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%| | 18/17840 [01:58<31:05:25, 6.28s/it] + + 0%| | 18/17840 [01:58<31:05:25, 6.28s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:22:40,536 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:22:42,076 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:22:43,594 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:22:45,132 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%| | 19/17840 [02:04<31:00:11, 6.26s/it] + + 0%| | 19/17840 [02:04<31:00:11, 6.26s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:22:46,771 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:22:48,254 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:22:49,768 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:22:51,295 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%| | 20/17840 [02:10<30:51:08, 6.23s/it] + + 0%| | 20/17840 [02:10<30:51:08, 6.23s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:22:52,872 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:22:54,406 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:22:55,920 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:22:57,420 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%| | 21/17840 [02:17<30:41:25, 6.20s/it] + + 0%| | 21/17840 [02:17<30:41:25, 6.20s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:22:59,029 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:23:00,520 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:23:02,027 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:23:03,498 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%| | 22/17840 [02:23<30:30:30, 6.16s/it] + + 0%| | 22/17840 [02:23<30:30:30, 6.16s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:23:05,060 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:23:06,514 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:23:08,008 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:23:09,479 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%| | 23/17840 [02:29<30:13:59, 6.11s/it] + + 0%| | 23/17840 [02:29<30:13:59, 6.11s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:23:11,048 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:23:12,533 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:23:13,994 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:23:15,453 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%| | 24/17840 [02:35<30:01:57, 6.07s/it] + + 0%| | 24/17840 [02:35<30:01:57, 6.07s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:23:16,960 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:23:18,391 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:23:19,869 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:23:21,751 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%| | 25/17840 [02:41<30:22:16, 6.14s/it] + 0%| | 25/17840 [02:41<30:22:16, 6.14s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:23:23,314 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:23:26,199 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:23:23,314 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:23:26,199 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:23:23,314 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 10.829, 'learning_rate': 7.799999999999999e-07, 'epoch': 0.03} +[WARNING|modeling_utils.py:388] 2022-03-10 21:23:27,632 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%| | 26/17840 [02:47<29:59:26, 6.06s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:23:29,147 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:23:30,606 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:23:32,026 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:23:29,147 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%| | 27/17840 [02:53<29:37:05, 5.99s/it]g-point operations will not be computed-10 21:23:29,147 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%| | 27/17840 [02:53<29:37:05, 5.99s/it]g-point operations will not be computed-10 21:23:29,147 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%| | 27/17840 [02:53<29:37:05, 5.99s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:23:34,943 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:23:37,759 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:23:34,943 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:23:37,759 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:23:34,943 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%| | 28/17840 [02:58<29:13:06, 5.91s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:23:40,645 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%| | 28/17840 [02:58<29:13:06, 5.91s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:23:40,645 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 29/17840 [03:04<28:48:45, 5.82s/it]g-point operations will not be computed-10 21:23:40,645 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 29/17840 [03:04<28:48:45, 5.82s/it]g-point operations will not be computed-10 21:23:40,645 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 29/17840 [03:04<28:48:45, 5.82s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:23:46,267 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:23:49,007 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:23:46,267 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 30/17840 [03:10<28:25:50, 5.75s/it]g-point operations will not be computed-10 21:23:46,267 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 30/17840 [03:10<28:25:50, 5.75s/it]g-point operations will not be computed-10 21:23:46,267 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 30/17840 [03:10<28:25:50, 5.75s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:23:51,826 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:23:54,565 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:23:51,826 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:23:54,565 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:23:51,826 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 31/17840 [03:15<28:10:48, 5.70s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:23:57,376 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 31/17840 [03:15<28:10:48, 5.70s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:23:57,376 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 32/17840 [03:21<27:51:26, 5.63s/it]g-point operations will not be computed-10 21:23:57,376 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 32/17840 [03:21<27:51:26, 5.63s/it]g-point operations will not be computed-10 21:23:57,376 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 32/17840 [03:21<27:51:26, 5.63s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:24:02,854 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:24:05,488 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:24:02,854 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 33/17840 [03:26<27:32:00, 5.57s/it]g-point operations will not be computed-10 21:24:02,854 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 33/17840 [03:26<27:32:00, 5.57s/it]g-point operations will not be computed-10 21:24:02,854 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 33/17840 [03:26<27:32:00, 5.57s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:24:08,192 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:24:10,741 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:24:08,192 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:24:10,741 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:24:08,192 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 34/17840 [03:31<26:55:02, 5.44s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:24:13,325 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 34/17840 [03:31<26:55:02, 5.44s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:24:13,325 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 35/17840 [03:36<26:23:48, 5.34s/it]g-point operations will not be computed-10 21:24:13,325 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 35/17840 [03:36<26:23:48, 5.34s/it]g-point operations will not be computed-10 21:24:13,325 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 35/17840 [03:36<26:23:48, 5.34s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:24:18,405 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:24:20,940 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:24:18,405 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:24:20,940 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:24:18,405 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 36/17840 [03:41<26:01:48, 5.26s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:24:23,474 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:24:25,902 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:24:23,474 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 37/17840 [03:46<25:33:40, 5.17s/it]g-point operations will not be computed-10 21:24:23,474 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 37/17840 [03:46<25:33:40, 5.17s/it]g-point operations will not be computed-10 21:24:23,474 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 37/17840 [03:46<25:33:40, 5.17s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:24:28,410 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 38/17840 [03:51<25:05:39, 5.07s/it]g-point operations will not be computed-10 21:24:28,410 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 38/17840 [03:51<25:05:39, 5.07s/it]g-point operations will not be computed-10 21:24:28,410 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 38/17840 [03:51<25:05:39, 5.07s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:24:33,210 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:24:35,541 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:24:33,210 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 39/17840 [03:56<24:31:06, 4.96s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:24:37,875 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 39/17840 [03:56<24:31:06, 4.96s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:24:37,875 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:24:40,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:24:37,875 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 40/17840 [04:00<23:52:00, 4.83s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:24:42,370 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 40/17840 [04:00<23:52:00, 4.83s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:24:42,370 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:24:44,457 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:24:42,370 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 41/17840 [04:05<23:03:59, 4.67s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:24:46,566 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 41/17840 [04:05<23:03:59, 4.67s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:24:46,566 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:24:48,540 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:24:46,566 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 42/17840 [04:09<22:07:29, 4.48s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:24:50,548 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 42/17840 [04:09<22:07:29, 4.48s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:24:50,548 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:24:52,389 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:24:50,548 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 43/17840 [04:12<21:05:30, 4.27s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:24:54,285 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 43/17840 [04:12<21:05:30, 4.27s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:24:54,285 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:24:55,983 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:24:54,285 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:24:55,983 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:24:54,285 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 44/17840 [04:16<20:00:41, 4.05s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:24:57,689 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 44/17840 [04:16<20:00:41, 4.05s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:24:57,689 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 45/17840 [04:19<18:34:21, 3.76s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:25:00,716 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 45/17840 [04:19<18:34:21, 3.76s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:25:00,716 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 46/17840 [04:22<17:06:23, 3.46s/it]g-point operations will not be computed-10 21:25:00,716 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:25:04,615 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:25:03,416 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:25:06,900 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:25:05,820 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:25:06,900 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:25:05,820 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:25:08,873 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:25:07,940 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:25:08,873 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:25:07,940 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:25:10,705 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:25:09,882 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:25:10,705 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:25:09,882 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 50/17840 [04:31<12:16:06, 2.48s/it]g-point operations will not be computed-10 21:25:09,882 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 50/17840 [04:31<12:16:06, 2.48s/it]g-point operations will not be computed-10 21:25:09,882 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 50/17840 [04:31<12:16:06, 2.48s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:25:13,435 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 50/17840 [04:31<12:16:06, 2.48s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:25:13,435 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 50/17840 [04:31<12:16:06, 2.48s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:25:13,435 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 51/17840 [04:38<18:56:29, 3.83s/it]g-point operations will not be computed-10 21:25:13,435 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 51/17840 [04:38<18:56:29, 3.83s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:25:20,303 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 51/17840 [04:38<18:56:29, 3.83s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:25:20,303 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:25:23,670 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:25:20,303 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:25:23,670 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:25:20,303 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 52/17840 [04:45<23:20:27, 4.72s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:25:27,080 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 52/17840 [04:45<23:20:27, 4.72s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:25:27,080 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:25:30,428 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:25:27,080 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:25:30,428 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:25:27,080 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 53/17840 [04:51<26:24:04, 5.34s/it]g-point operations will not be computed-10 21:25:27,080 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 53/17840 [04:51<26:24:04, 5.34s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:25:33,884 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:25:37,213 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:25:33,884 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:25:37,213 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:25:33,884 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 54/17840 [04:58<28:27:03, 5.76s/it]g-point operations will not be computed-10 21:25:33,884 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 54/17840 [04:58<28:27:03, 5.76s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:25:40,549 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:25:43,811 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:25:40,549 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 55/17840 [05:05<29:38:10, 6.00s/it]g-point operations will not be computed-10 21:25:40,549 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 55/17840 [05:05<29:38:10, 6.00s/it]g-point operations will not be computed-10 21:25:40,549 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 55/17840 [05:05<29:38:10, 6.00s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:25:47,134 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 55/17840 [05:05<29:38:10, 6.00s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:25:47,134 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 56/17840 [05:11<30:26:11, 6.16s/it]g-point operations will not be computed-10 21:25:47,134 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 56/17840 [05:11<30:26:11, 6.16s/it]g-point operations will not be computed-10 21:25:47,134 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 56/17840 [05:11<30:26:11, 6.16s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:25:53,675 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 56/17840 [05:11<30:26:11, 6.16s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:25:53,675 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:25:56,815 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:25:53,675 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:25:56,815 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:25:53,675 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 57/17840 [05:18<30:56:15, 6.26s/it]g-point operations will not be computed-10 21:25:53,675 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▏ | 57/17840 [05:18<30:56:15, 6.26s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:26:00,109 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:26:03,361 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:26:00,109 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:26:03,361 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:26:00,109 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 58/17840 [05:24<31:16:47, 6.33s/it]g-point operations will not be computed-10 21:26:00,109 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 58/17840 [05:24<31:16:47, 6.33s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:26:06,581 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:26:09,727 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:26:06,581 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:26:09,727 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:26:06,581 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 59/17840 [05:31<31:21:34, 6.35s/it]g-point operations will not be computed-10 21:26:06,581 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 59/17840 [05:31<31:21:34, 6.35s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:26:13,017 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:26:16,232 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:26:13,017 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 60/17840 [05:37<31:32:12, 6.39s/it]g-point operations will not be computed-10 21:26:13,017 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 60/17840 [05:37<31:32:12, 6.39s/it]g-point operations will not be computed-10 21:26:13,017 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 60/17840 [05:37<31:32:12, 6.39s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:26:19,473 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:26:22,597 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:26:19,473 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 61/17840 [05:43<31:30:14, 6.38s/it]g-point operations will not be computed-10 21:26:19,473 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 61/17840 [05:43<31:30:14, 6.38s/it]g-point operations will not be computed-10 21:26:19,473 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 61/17840 [05:43<31:30:14, 6.38s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:26:25,802 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:26:28,898 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:26:25,802 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 62/17840 [05:50<31:23:33, 6.36s/it]g-point operations will not be computed-10 21:26:25,802 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 62/17840 [05:50<31:23:33, 6.36s/it]g-point operations will not be computed-10 21:26:25,802 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 62/17840 [05:50<31:23:33, 6.36s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:26:32,095 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:26:35,205 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:26:32,095 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 63/17840 [05:56<31:15:18, 6.33s/it]g-point operations will not be computed-10 21:26:32,095 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 63/17840 [05:56<31:15:18, 6.33s/it]g-point operations will not be computed-10 21:26:32,095 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 63/17840 [05:56<31:15:18, 6.33s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:26:38,352 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 63/17840 [05:56<31:15:18, 6.33s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:26:38,352 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 64/17840 [06:02<31:12:11, 6.32s/it]g-point operations will not be computed-10 21:26:38,352 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 64/17840 [06:02<31:12:11, 6.32s/it]g-point operations will not be computed-10 21:26:38,352 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 64/17840 [06:02<31:12:11, 6.32s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:26:44,696 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 64/17840 [06:02<31:12:11, 6.32s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:26:44,696 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 65/17840 [06:08<31:04:04, 6.29s/it]g-point operations will not be computed-10 21:26:44,696 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 65/17840 [06:08<31:04:04, 6.29s/it]g-point operations will not be computed-10 21:26:44,696 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 65/17840 [06:08<31:04:04, 6.29s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:26:50,854 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 65/17840 [06:08<31:04:04, 6.29s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:26:50,854 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 66/17840 [06:15<30:47:28, 6.24s/it]g-point operations will not be computed-10 21:26:50,854 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 66/17840 [06:15<30:47:28, 6.24s/it]g-point operations will not be computed-10 21:26:50,854 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 66/17840 [06:15<30:47:28, 6.24s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:26:56,933 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 66/17840 [06:15<30:47:28, 6.24s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:26:56,933 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 67/17840 [06:21<30:34:21, 6.19s/it]g-point operations will not be computed-10 21:26:56,933 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 67/17840 [06:21<30:34:21, 6.19s/it]g-point operations will not be computed-10 21:26:56,933 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 67/17840 [06:21<30:34:21, 6.19s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:27:03,017 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 67/17840 [06:21<30:34:21, 6.19s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:27:03,017 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 68/17840 [06:27<30:21:34, 6.15s/it]g-point operations will not be computed-10 21:27:03,017 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 68/17840 [06:27<30:21:34, 6.15s/it]g-point operations will not be computed-10 21:27:03,017 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 68/17840 [06:27<30:21:34, 6.15s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:27:09,066 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:27:12,081 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:27:09,066 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 69/17840 [06:33<30:19:42, 6.14s/it]g-point operations will not be computed-10 21:27:09,066 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 69/17840 [06:33<30:19:42, 6.14s/it]g-point operations will not be computed-10 21:27:09,066 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 69/17840 [06:33<30:19:42, 6.14s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:27:15,216 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:27:18,181 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:27:15,216 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 70/17840 [06:39<30:10:47, 6.11s/it]g-point operations will not be computed-10 21:27:15,216 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 70/17840 [06:39<30:10:47, 6.11s/it]g-point operations will not be computed-10 21:27:15,216 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 70/17840 [06:39<30:10:47, 6.11s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:27:21,242 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:27:24,174 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:27:21,242 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:27:24,174 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:27:21,242 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 71/17840 [06:45<29:55:23, 6.06s/it]g-point operations will not be computed-10 21:27:21,242 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 71/17840 [06:45<29:55:23, 6.06s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:27:27,196 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:27:30,133 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:27:27,196 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:27:30,133 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:27:27,196 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 72/17840 [06:51<29:47:11, 6.04s/it]g-point operations will not be computed-10 21:27:27,196 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 72/17840 [06:51<29:47:11, 6.04s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:27:33,140 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:27:36,005 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:27:33,140 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:27:36,005 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:27:33,140 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 73/17840 [06:57<29:27:53, 5.97s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:27:38,934 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 73/17840 [06:57<29:27:53, 5.97s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:27:38,934 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:27:41,847 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:27:38,934 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:27:41,847 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:27:38,934 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 74/17840 [07:02<29:20:36, 5.95s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:27:44,818 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 74/17840 [07:02<29:20:36, 5.95s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:27:44,818 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:27:47,651 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:27:44,818 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:27:47,651 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:27:44,818 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 75/17840 [07:09<29:42:19, 6.02s/it]g-point operations will not be computed-10 21:27:44,818 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 75/17840 [07:09<29:42:19, 6.02s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:27:51,022 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:27:53,822 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:27:51,022 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:27:53,822 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:27:51,022 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 76/17840 [07:14<29:15:42, 5.93s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:27:56,682 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 76/17840 [07:14<29:15:42, 5.93s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:27:56,682 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 77/17840 [07:20<28:56:32, 5.87s/it]g-point operations will not be computed-10 21:27:56,682 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 77/17840 [07:20<28:56:32, 5.87s/it]g-point operations will not be computed-10 21:27:56,682 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 77/17840 [07:20<28:56:32, 5.87s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:28:02,392 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:28:05,187 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:28:02,392 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:28:05,187 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:28:02,392 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 78/17840 [07:26<28:38:13, 5.80s/it]g-point operations will not be computed-10 21:28:02,392 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 78/17840 [07:26<28:38:13, 5.80s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:28:08,080 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:28:10,824 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:28:08,080 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:28:10,824 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:28:08,080 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 79/17840 [07:31<28:19:49, 5.74s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:28:13,646 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 79/17840 [07:31<28:19:49, 5.74s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:28:13,646 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 80/17840 [07:37<28:04:32, 5.69s/it]g-point operations will not be computed-10 21:28:13,646 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 80/17840 [07:37<28:04:32, 5.69s/it]g-point operations will not be computed-10 21:28:13,646 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 80/17840 [07:37<28:04:32, 5.69s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:28:19,193 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:28:21,870 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:28:19,193 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:28:21,870 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:28:19,193 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 81/17840 [07:42<27:42:54, 5.62s/it]g-point operations will not be computed-10 21:28:19,193 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 81/17840 [07:42<27:42:54, 5.62s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:28:24,618 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:28:27,288 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:28:24,618 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:28:27,288 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:28:24,618 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 82/17840 [07:48<27:24:15, 5.56s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:28:30,062 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 82/17840 [07:48<27:24:15, 5.56s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:28:30,062 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 83/17840 [07:53<27:09:48, 5.51s/it]g-point operations will not be computed-10 21:28:30,062 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 83/17840 [07:53<27:09:48, 5.51s/it]g-point operations will not be computed-10 21:28:30,062 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 83/17840 [07:53<27:09:48, 5.51s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:28:35,341 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:28:37,856 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:28:35,341 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:28:37,856 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:28:35,341 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 84/17840 [07:58<26:33:23, 5.38s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:28:40,444 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 84/17840 [07:58<26:33:23, 5.38s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:28:40,444 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 85/17840 [08:03<26:04:33, 5.29s/it]g-point operations will not be computed-10 21:28:40,444 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 85/17840 [08:03<26:04:33, 5.29s/it]g-point operations will not be computed-10 21:28:40,444 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 85/17840 [08:03<26:04:33, 5.29s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:28:45,479 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:28:47,953 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:28:45,479 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:28:47,953 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:28:45,479 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▎ | 86/17840 [08:08<25:41:37, 5.21s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:28:50,513 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:28:52,954 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:28:50,513 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▍ | 87/17840 [08:13<25:20:23, 5.14s/it]g-point operations will not be computed-10 21:28:50,513 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▍ | 87/17840 [08:13<25:20:23, 5.14s/it]g-point operations will not be computed-10 21:28:50,513 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▍ | 87/17840 [08:13<25:20:23, 5.14s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:28:55,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:28:57,800 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:28:55,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:28:57,800 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:28:55,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▍ | 88/17840 [08:18<24:50:04, 5.04s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:29:00,241 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:29:02,504 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:29:00,241 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:29:02,504 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:29:00,241 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▍ | 89/17840 [08:23<24:16:18, 4.92s/it]g-point operations will not be computed-10 21:29:00,241 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 0%|▍ | 89/17840 [08:23<24:16:18, 4.92s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:29:04,812 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 90/17840 [08:27<23:34:05, 4.78s/it]g-point operations will not be computed-10 21:29:04,812 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 90/17840 [08:27<23:34:05, 4.78s/it]g-point operations will not be computed-10 21:29:04,812 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:29:11,240 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:29:09,198 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 91/17840 [08:31<22:40:29, 4.60s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:29:13,324 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 91/17840 [08:31<22:40:29, 4.60s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:29:13,324 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:29:15,264 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:29:13,324 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 92/17840 [08:35<21:44:14, 4.41s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:29:17,222 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 92/17840 [08:35<21:44:14, 4.41s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:29:17,222 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:29:19,000 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:29:17,222 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:29:19,000 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:29:17,222 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 93/17840 [08:39<20:39:47, 4.19s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:29:20,852 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 94/17840 [08:43<19:36:53, 3.98s/it]g-point operations will not be computed-10 21:29:20,852 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 94/17840 [08:43<19:36:53, 3.98s/it]g-point operations will not be computed-10 21:29:20,852 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 94/17840 [08:43<19:36:53, 3.98s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:29:24,271 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 95/17840 [08:46<18:26:53, 3.74s/it]g-point operations will not be computed-10 21:29:24,271 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 95/17840 [08:46<18:26:53, 3.74s/it]g-point operations will not be computed-10 21:29:24,271 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:29:28,837 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:29:27,442 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:29:28,837 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:29:27,442 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:29:31,412 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:29:30,201 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 97/17840 [08:51<15:44:43, 3.19s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:29:32,662 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 97/17840 [08:51<15:44:43, 3.19s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:29:32,662 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 98/17840 [08:53<14:19:03, 2.91s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:29:34,784 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 98/17840 [08:53<14:19:03, 2.91s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:29:34,784 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:29:37,511 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:29:36,740 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:29:37,511 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:29:36,740 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 100/17840 [08:58<12:11:22, 2.47s/it]g-point operations will not be computed-10 21:29:36,740 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 100/17840 [08:58<12:11:22, 2.47s/it]g-point operations will not be computed-10 21:29:36,740 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 100/17840 [08:58<12:11:22, 2.47s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:29:40,201 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:29:43,625 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:29:40,201 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 101/17840 [09:04<18:48:56, 3.82s/it]g-point operations will not be computed-10 21:29:40,201 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 101/17840 [09:04<18:48:56, 3.82s/it]g-point operations will not be computed-10 21:29:40,201 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 101/17840 [09:04<18:48:56, 3.82s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:29:47,014 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 101/17840 [09:04<18:48:56, 3.82s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:29:47,014 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:29:50,385 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:29:47,014 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:29:50,385 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:29:47,014 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 102/17840 [09:11<23:12:26, 4.71s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:29:53,771 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 102/17840 [09:11<23:12:26, 4.71s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:29:53,771 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:29:57,002 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:29:53,771 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:29:57,002 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:29:53,771 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 103/17840 [09:18<25:57:29, 5.27s/it]g-point operations will not be computed-10 21:29:53,771 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 103/17840 [09:18<25:57:29, 5.27s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:30:00,419 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:30:03,709 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:30:00,419 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 104/17840 [09:24<28:02:40, 5.69s/it]g-point operations will not be computed-10 21:30:00,419 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 104/17840 [09:24<28:02:40, 5.69s/it]g-point operations will not be computed-10 21:30:00,419 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 104/17840 [09:24<28:02:40, 5.69s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:30:07,040 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:30:10,278 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:30:07,040 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 105/17840 [09:31<29:20:35, 5.96s/it]g-point operations will not be computed-10 21:30:07,040 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 105/17840 [09:31<29:20:35, 5.96s/it]g-point operations will not be computed-10 21:30:07,040 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 105/17840 [09:31<29:20:35, 5.96s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:30:13,574 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:30:16,761 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:30:13,574 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 106/17840 [09:38<30:06:57, 6.11s/it]g-point operations will not be computed-10 21:30:13,574 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 106/17840 [09:38<30:06:57, 6.11s/it]g-point operations will not be computed-10 21:30:13,574 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 106/17840 [09:38<30:06:57, 6.11s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:30:20,080 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 106/17840 [09:38<30:06:57, 6.11s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:30:20,080 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:30:23,247 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:30:20,080 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:30:23,247 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:30:20,080 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 107/17840 [09:44<30:37:44, 6.22s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:30:26,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 107/17840 [09:44<30:37:44, 6.22s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:30:26,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:30:29,644 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:30:26,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:30:29,644 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:30:26,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 108/17840 [09:50<30:54:27, 6.27s/it]g-point operations will not be computed-10 21:30:26,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 108/17840 [09:50<30:54:27, 6.27s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:30:32,924 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:30:36,077 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:30:32,924 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 109/17840 [09:57<31:06:03, 6.31s/it]g-point operations will not be computed-10 21:30:32,924 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 109/17840 [09:57<31:06:03, 6.31s/it]g-point operations will not be computed-10 21:30:32,924 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 109/17840 [09:57<31:06:03, 6.31s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:30:39,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:30:42,399 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:30:39,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 110/17840 [10:03<31:05:58, 6.31s/it]g-point operations will not be computed-10 21:30:39,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 110/17840 [10:03<31:05:58, 6.31s/it]g-point operations will not be computed-10 21:30:39,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 110/17840 [10:03<31:05:58, 6.31s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:30:45,569 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:30:48,640 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:30:45,569 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 111/17840 [10:09<30:57:23, 6.29s/it]g-point operations will not be computed-10 21:30:45,569 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 111/17840 [10:09<30:57:23, 6.29s/it]g-point operations will not be computed-10 21:30:45,569 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 111/17840 [10:09<30:57:23, 6.29s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:30:51,841 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:30:54,885 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:30:51,841 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 112/17840 [10:16<30:49:19, 6.26s/it]g-point operations will not be computed-10 21:30:51,841 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 112/17840 [10:16<30:49:19, 6.26s/it]g-point operations will not be computed-10 21:30:51,841 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 112/17840 [10:16<30:49:19, 6.26s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:30:57,997 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:31:01,040 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:30:57,997 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 113/17840 [10:22<30:40:07, 6.23s/it]g-point operations will not be computed-10 21:30:57,997 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 113/17840 [10:22<30:40:07, 6.23s/it]g-point operations will not be computed-10 21:30:57,997 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 113/17840 [10:22<30:40:07, 6.23s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:31:04,142 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:31:07,172 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:31:04,142 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 114/17840 [10:28<30:32:29, 6.20s/it]g-point operations will not be computed-10 21:31:04,142 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 114/17840 [10:28<30:32:29, 6.20s/it]g-point operations will not be computed-10 21:31:04,142 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 114/17840 [10:28<30:32:29, 6.20s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:31:10,287 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:31:13,331 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:31:10,287 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 115/17840 [10:34<30:29:32, 6.19s/it]g-point operations will not be computed-10 21:31:10,287 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 115/17840 [10:34<30:29:32, 6.19s/it]g-point operations will not be computed-10 21:31:10,287 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:31:17,930 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:31:10,287 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:31:17,930 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:31:10,287 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 116/17840 [10:40<30:19:10, 6.16s/it]g-point operations will not be computed-10 21:31:10,287 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 116/17840 [10:40<30:19:10, 6.16s/it]g-point operations will not be computed-10 21:31:10,287 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:31:24,002 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:31:10,287 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:31:24,002 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:31:10,287 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 117/17840 [10:46<30:10:53, 6.13s/it]g-point operations will not be computed-10 21:31:10,287 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▍ | 117/17840 [10:46<30:10:53, 6.13s/it]g-point operations will not be computed-10 21:31:10,287 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:31:30,050 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:31:10,287 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:31:30,050 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:31:10,287 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 118/17840 [10:52<30:04:08, 6.11s/it]g-point operations will not be computed-10 21:31:10,287 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 118/17840 [10:52<30:04:08, 6.11s/it]g-point operations will not be computed-10 21:31:10,287 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:31:36,078 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:31:10,287 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:31:36,078 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:31:10,287 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 119/17840 [10:58<29:52:11, 6.07s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:31:40,622 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 119/17840 [10:58<29:52:11, 6.07s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:31:40,622 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 9.2186, 'learning_rate': 3.57e-06, 'epoch': 0.13} + 1%|▌ | 119/17840 [10:58<29:52:11, 6.07s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:31:40,622 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 120/17840 [11:04<29:49:14, 6.06s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:31:46,585 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 120/17840 [11:04<29:49:14, 6.06s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:31:46,585 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 9.2858, 'learning_rate': 3.6e-06, 'epoch': 0.13} +[WARNING|modeling_utils.py:388] 2022-03-10 21:31:50,928 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:31:46,585 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:31:50,928 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:31:46,585 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 9.1868, 'learning_rate': 3.63e-06, 'epoch': 0.14} +[WARNING|modeling_utils.py:388] 2022-03-10 21:31:50,928 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:31:46,585 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:31:50,928 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:31:46,585 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:31:56,748 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:31:46,585 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:31:56,748 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:31:46,585 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:32:01,179 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:31:46,585 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:32:01,179 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:31:46,585 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 123/17840 [11:22<29:09:15, 5.92s/it]g-point operations will not be computed-10 21:31:46,585 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 123/17840 [11:22<29:09:15, 5.92s/it]g-point operations will not be computed-10 21:31:46,585 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:32:07,015 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:31:46,585 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:32:07,015 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:31:46,585 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 124/17840 [11:28<29:03:15, 5.90s/it]g-point operations will not be computed-10 21:31:46,585 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:32:11,387 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:31:46,585 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:32:11,387 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:31:46,585 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:32:11,387 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:31:46,585 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 125/17840 [11:34<29:28:37, 5.99s/it]g-point operations will not be computed-10 21:31:46,585 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:32:17,592 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:31:46,585 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:32:17,592 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:31:46,585 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:32:17,592 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:31:46,585 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 126/17840 [11:40<29:04:39, 5.91s/it]g-point operations will not be computed-10 21:31:46,585 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:32:23,284 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:31:46,585 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:32:23,284 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:31:46,585 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:32:23,284 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:31:46,585 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 127/17840 [11:45<28:46:53, 5.85s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:32:27,563 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 127/17840 [11:45<28:46:53, 5.85s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:32:27,563 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:32:31,680 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:32:27,563 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:32:31,680 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:32:27,563 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 9.2874, 'learning_rate': 3.8400000000000005e-06, 'epoch': 0.14} +[WARNING|modeling_utils.py:388] 2022-03-10 21:32:35,896 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:32:27,563 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:32:35,896 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:32:27,563 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 129/17840 [11:56<28:07:04, 5.72s/it]g-point operations will not be computed-10 21:32:27,563 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:32:40,064 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:32:27,563 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:32:40,064 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:32:27,563 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:32:40,064 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:32:27,563 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 130/17840 [12:02<27:55:45, 5.68s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:32:44,345 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 130/17840 [12:02<27:55:45, 5.68s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:32:44,345 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:32:48,409 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:32:44,345 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:32:48,409 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:32:44,345 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 9.1654, 'learning_rate': 3.9300000000000005e-06, 'epoch': 0.15} +[WARNING|modeling_utils.py:388] 2022-03-10 21:32:52,529 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:32:44,345 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:32:52,529 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:32:44,345 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 132/17840 [12:13<27:27:02, 5.58s/it]g-point operations will not be computed-10 21:32:44,345 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:32:56,531 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:32:44,345 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:32:56,531 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:32:44,345 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:32:56,531 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:32:44,345 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 133/17840 [12:18<27:06:18, 5.51s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:33:00,534 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 133/17840 [12:18<27:06:18, 5.51s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:33:00,534 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:33:04,321 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:33:00,534 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:33:04,321 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:33:00,534 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 9.1517, 'learning_rate': 4.0200000000000005e-06, 'epoch': 0.15} +[WARNING|modeling_utils.py:388] 2022-03-10 21:33:08,144 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:33:00,534 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:33:08,144 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:33:00,534 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 135/17840 [12:29<26:02:12, 5.29s/it]g-point operations will not be computed-10 21:33:00,534 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:33:11,949 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:33:00,534 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:33:11,949 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:33:00,534 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:33:14,427 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:33:00,534 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:33:14,427 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:33:00,534 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:33:18,194 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:33:00,534 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:33:18,194 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:33:00,534 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 137/17840 [12:39<25:16:31, 5.14s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:33:20,645 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:33:22,952 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:33:20,645 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:33:22,952 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:33:20,645 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▌ | 138/17840 [12:43<24:37:05, 5.01s/it]g-point operations will not be computed-10 21:33:20,645 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:33:26,413 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:33:20,645 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:33:28,609 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:33:20,645 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:33:28,609 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:33:20,645 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:33:30,812 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:33:20,645 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:33:32,875 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:33:20,645 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:33:32,875 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:33:20,645 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:33:34,918 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:33:20,645 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:33:36,793 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:33:20,645 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:33:36,793 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:33:20,645 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:33:38,665 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:33:20,645 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:33:38,665 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:33:20,645 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:33:40,412 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:33:20,645 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:33:42,216 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:33:20,645 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:33:42,216 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:33:20,645 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:33:45,517 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:33:20,645 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:33:47,015 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:33:20,645 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:33:47,015 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:33:20,645 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:33:48,574 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:33:20,645 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:33:48,574 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:33:20,645 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:33:51,362 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:33:20,645 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:33:51,362 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:33:20,645 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:33:52,587 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:33:20,645 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:33:52,587 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:33:20,645 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:33:54,998 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:33:20,645 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:33:57,116 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:33:20,645 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:33:57,116 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:33:20,645 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 8.5888, 'learning_rate': 4.44e-06, 'epoch': 0.17} +[WARNING|modeling_utils.py:388] 2022-03-10 21:33:59,927 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:33:20,645 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:34:01,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:33:20,645 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:34:01,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:33:20,645 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 8.5008, 'learning_rate': 4.5e-06, 'epoch': 0.17} +[WARNING|modeling_utils.py:388] 2022-03-10 21:34:04,616 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:33:20,645 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:34:04,616 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:33:20,645 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:34:04,616 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:33:20,645 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:34:07,974 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:33:20,645 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:34:11,403 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:33:20,645 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:34:11,403 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:33:20,645 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:34:11,403 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:33:20,645 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:34:14,682 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:33:20,645 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:34:14,682 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:33:20,645 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:34:18,005 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:33:20,645 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:34:18,005 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:33:20,645 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:34:21,207 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:33:20,645 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:34:21,207 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:33:20,645 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:34:24,542 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:33:20,645 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:34:27,789 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:33:20,645 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:34:27,789 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:33:20,645 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 9.1945, 'learning_rate': 4.62e-06, 'epoch': 0.17} +[WARNING|modeling_utils.py:388] 2022-03-10 21:34:31,056 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:33:20,645 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:34:31,056 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:33:20,645 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:34:31,056 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:33:20,645 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 155/17840 [13:53<28:47:21, 5.86s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:34:35,903 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 155/17840 [13:53<28:47:21, 5.86s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:34:35,903 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 155/17840 [13:53<28:47:21, 5.86s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:34:35,903 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 155/17840 [13:53<28:47:21, 5.86s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:34:35,903 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 156/17840 [14:00<29:34:42, 6.02s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:34:42,325 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 156/17840 [14:00<29:34:42, 6.02s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:34:42,325 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 156/17840 [14:00<29:34:42, 6.02s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:34:42,325 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 156/17840 [14:00<29:34:42, 6.02s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:34:42,325 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 157/17840 [14:06<30:05:53, 6.13s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:34:48,681 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 157/17840 [14:06<30:05:53, 6.13s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:34:48,681 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 157/17840 [14:06<30:05:53, 6.13s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:34:48,681 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 157/17840 [14:06<30:05:53, 6.13s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:34:48,681 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 158/17840 [14:13<30:35:30, 6.23s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:34:48,681 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 158/17840 [14:13<30:35:30, 6.23s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:34:48,681 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:34:58,277 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:34:48,681 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 159/17840 [14:19<30:48:15, 6.27s/it]g-point operations will not be computed-10 21:34:48,681 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 159/17840 [14:19<30:48:15, 6.27s/it]g-point operations will not be computed-10 21:34:48,681 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 9.0042, 'learning_rate': 4.77e-06, 'epoch': 0.18} +[WARNING|modeling_utils.py:388] 2022-03-10 21:35:04,619 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:34:48,681 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 160/17840 [14:25<30:55:09, 6.30s/it]g-point operations will not be computed-10 21:34:48,681 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 160/17840 [14:25<30:55:09, 6.30s/it]g-point operations will not be computed-10 21:34:48,681 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 9.0174, 'learning_rate': 4.800000000000001e-06, 'epoch': 0.18} +[WARNING|modeling_utils.py:388] 2022-03-10 21:35:10,877 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:34:48,681 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 161/17840 [14:32<30:45:39, 6.26s/it]g-point operations will not be computed-10 21:34:48,681 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 161/17840 [14:32<30:45:39, 6.26s/it]g-point operations will not be computed-10 21:34:48,681 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 8.93, 'learning_rate': 4.83e-06, 'epoch': 0.18} +[WARNING|modeling_utils.py:388] 2022-03-10 21:35:17,040 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:34:48,681 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 162/17840 [14:38<30:36:19, 6.23s/it]g-point operations will not be computed-10 21:34:48,681 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 162/17840 [14:38<30:36:19, 6.23s/it]g-point operations will not be computed-10 21:34:48,681 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 8.9949, 'learning_rate': 4.86e-06, 'epoch': 0.18} +[WARNING|modeling_utils.py:388] 2022-03-10 21:35:23,193 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:34:48,681 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 163/17840 [14:44<30:27:19, 6.20s/it]g-point operations will not be computed-10 21:34:48,681 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 163/17840 [14:44<30:27:19, 6.20s/it]g-point operations will not be computed-10 21:34:48,681 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 8.9755, 'learning_rate': 4.890000000000001e-06, 'epoch': 0.18} +[WARNING|modeling_utils.py:388] 2022-03-10 21:35:29,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:34:48,681 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 164/17840 [14:50<30:34:18, 6.23s/it]g-point operations will not be computed-10 21:34:48,681 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 164/17840 [14:50<30:34:18, 6.23s/it]g-point operations will not be computed-10 21:34:48,681 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 8.9916, 'learning_rate': 4.92e-06, 'epoch': 0.18} +[WARNING|modeling_utils.py:388] 2022-03-10 21:35:35,562 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:34:48,681 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 165/17840 [14:56<30:20:15, 6.18s/it]g-point operations will not be computed-10 21:34:48,681 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 165/17840 [14:56<30:20:15, 6.18s/it]g-point operations will not be computed-10 21:34:48,681 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 8.932, 'learning_rate': 4.95e-06, 'epoch': 0.18} +[WARNING|modeling_utils.py:388] 2022-03-10 21:35:41,613 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:34:48,681 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 166/17840 [15:02<30:11:41, 6.15s/it]g-point operations will not be computed-10 21:34:48,681 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 166/17840 [15:02<30:11:41, 6.15s/it]g-point operations will not be computed-10 21:34:48,681 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 8.9655, 'learning_rate': 4.980000000000001e-06, 'epoch': 0.19} +[WARNING|modeling_utils.py:388] 2022-03-10 21:35:47,682 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:34:48,681 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 167/17840 [15:08<30:01:20, 6.12s/it]g-point operations will not be computed-10 21:34:48,681 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 167/17840 [15:08<30:01:20, 6.12s/it]g-point operations will not be computed-10 21:34:48,681 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:35:52,178 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:34:48,681 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:35:52,178 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:34:48,681 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 168/17840 [15:14<29:49:10, 6.07s/it]g-point operations will not be computed-10 21:34:48,681 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 168/17840 [15:14<29:49:10, 6.07s/it]g-point operations will not be computed-10 21:34:48,681 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:35:58,173 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:34:48,681 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:35:58,173 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:34:48,681 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 169/17840 [15:20<29:36:07, 6.03s/it]g-point operations will not be computed-10 21:34:48,681 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 169/17840 [15:20<29:36:07, 6.03s/it]g-point operations will not be computed-10 21:34:48,681 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:36:04,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:34:48,681 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:36:04,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:34:48,681 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:36:04,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:34:48,681 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 170/17840 [15:26<29:28:30, 6.01s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:36:08,520 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 170/17840 [15:26<29:28:30, 6.01s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:36:08,520 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:36:12,895 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:36:08,520 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:36:12,895 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:36:08,520 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 8.9866, 'learning_rate': 5.130000000000001e-06, 'epoch': 0.19} +[WARNING|modeling_utils.py:388] 2022-03-10 21:36:12,895 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:36:08,520 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:36:18,780 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:36:08,520 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:36:18,780 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:36:08,520 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 8.922, 'learning_rate': 5.16e-06, 'epoch': 0.19} +[WARNING|modeling_utils.py:388] 2022-03-10 21:36:23,166 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:36:08,520 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 173/17840 [15:44<28:56:40, 5.90s/it]g-point operations will not be computed-10 21:36:08,520 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 173/17840 [15:44<28:56:40, 5.90s/it]g-point operations will not be computed-10 21:36:08,520 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 8.9504, 'learning_rate': 5.1899999999999994e-06, 'epoch': 0.19} +[WARNING|modeling_utils.py:388] 2022-03-10 21:36:28,906 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:36:08,520 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 174/17840 [15:50<28:48:03, 5.87s/it]g-point operations will not be computed-10 21:36:08,520 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 174/17840 [15:50<28:48:03, 5.87s/it]g-point operations will not be computed-10 21:36:08,520 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 8.8753, 'learning_rate': 5.22e-06, 'epoch': 0.2} +[WARNING|modeling_utils.py:388] 2022-03-10 21:36:34,694 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:36:08,520 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 175/17840 [15:56<29:13:49, 5.96s/it]g-point operations will not be computed-10 21:36:08,520 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 175/17840 [15:56<29:13:49, 5.96s/it]g-point operations will not be computed-10 21:36:08,520 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 8.8031, 'learning_rate': 5.25e-06, 'epoch': 0.2} +[WARNING|modeling_utils.py:388] 2022-03-10 21:36:40,929 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:36:08,520 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 176/17840 [16:02<29:01:59, 5.92s/it]g-point operations will not be computed-10 21:36:08,520 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▋ | 176/17840 [16:02<29:01:59, 5.92s/it]g-point operations will not be computed-10 21:36:08,520 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:36:45,207 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:36:08,520 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:36:45,207 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:36:08,520 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▊ | 177/17840 [16:07<28:32:19, 5.82s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:36:49,405 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▊ | 177/17840 [16:07<28:32:19, 5.82s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:36:49,405 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 8.8233, 'learning_rate': 5.31e-06, 'epoch': 0.2} +[WARNING|modeling_utils.py:388] 2022-03-10 21:36:53,493 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:36:49,405 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:36:53,493 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:36:49,405 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 8.848, 'learning_rate': 5.34e-06, 'epoch': 0.2} +[WARNING|modeling_utils.py:388] 2022-03-10 21:36:57,731 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:36:49,405 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▊ | 179/17840 [16:18<27:53:55, 5.69s/it]g-point operations will not be computed-10 21:36:49,405 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▊ | 179/17840 [16:18<27:53:55, 5.69s/it]g-point operations will not be computed-10 21:36:49,405 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:37:01,860 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:36:49,405 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:37:01,860 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:36:49,405 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:37:01,860 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:36:49,405 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▊ | 180/17840 [16:24<27:37:46, 5.63s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:37:06,000 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▊ | 180/17840 [16:24<27:37:46, 5.63s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:37:06,000 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:37:10,003 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:37:06,000 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:37:10,003 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:37:06,000 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 8.8931, 'learning_rate': 5.43e-06, 'epoch': 0.2} +[WARNING|modeling_utils.py:388] 2022-03-10 21:37:14,040 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:37:06,000 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▊ | 182/17840 [16:35<27:01:21, 5.51s/it]g-point operations will not be computed-10 21:37:06,000 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▊ | 182/17840 [16:35<27:01:21, 5.51s/it]g-point operations will not be computed-10 21:37:06,000 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:37:18,040 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:37:06,000 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:37:18,040 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:37:06,000 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▊ | 183/17840 [16:40<26:34:05, 5.42s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:37:21,917 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▊ | 183/17840 [16:40<26:34:05, 5.42s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:37:21,917 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:37:24,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:37:21,917 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:37:24,411 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:37:21,917 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▊ | 184/17840 [16:45<26:06:43, 5.32s/it]g-point operations will not be computed-10 21:37:21,917 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:37:28,261 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:37:21,917 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:37:28,261 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:37:21,917 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:37:28,261 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:37:21,917 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▊ | 185/17840 [16:50<25:42:24, 5.24s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:37:32,039 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▊ | 185/17840 [16:50<25:42:24, 5.24s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:37:32,039 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▊ | 185/17840 [16:50<25:42:24, 5.24s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:37:32,039 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:37:35,645 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:37:32,039 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:37:38,149 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:37:32,039 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:37:38,149 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:37:32,039 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:37:40,541 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:37:32,039 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:37:40,541 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:37:32,039 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:37:44,169 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:37:32,039 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:37:44,169 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:37:32,039 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▊ | 188/17840 [17:04<24:26:04, 4.98s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:37:46,566 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▊ | 188/17840 [17:04<24:26:04, 4.98s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:37:46,566 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▊ | 188/17840 [17:04<24:26:04, 4.98s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:37:46,566 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:37:49,914 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:37:46,566 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:37:52,186 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:37:46,566 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:37:52,186 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:37:46,566 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:37:54,356 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:37:46,566 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:37:56,558 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:37:46,566 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:37:56,558 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:37:46,566 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:37:58,612 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:37:46,566 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:38:00,725 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:37:46,566 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:38:00,725 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:37:46,566 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:38:02,659 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:37:46,566 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:38:04,607 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:37:46,566 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:38:04,607 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:37:46,566 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:38:06,383 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:37:46,566 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:38:08,211 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:37:46,566 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:38:08,211 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:37:46,566 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:38:09,835 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:37:46,566 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:38:09,835 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:37:46,566 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:38:13,005 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:37:46,566 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:38:14,499 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:37:46,566 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:38:14,499 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:37:46,566 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:38:17,142 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:37:46,566 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:38:17,142 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:37:46,566 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:38:19,390 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:37:46,566 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:38:19,390 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:37:46,566 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:38:21,346 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:37:46,566 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:38:21,346 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:37:46,566 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:38:23,152 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:37:46,566 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:38:23,152 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:37:46,566 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:38:24,368 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:37:46,566 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:38:24,368 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:37:46,566 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:38:27,996 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:37:46,566 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:38:27,996 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:37:46,566 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:38:31,334 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:37:46,566 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:38:31,334 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:37:46,566 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:38:34,727 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:37:46,566 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:38:34,727 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:37:46,566 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:38:38,048 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:37:46,566 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:38:38,048 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:37:46,566 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 9.0044, 'learning_rate': 6.0600000000000004e-06, 'epoch': 0.23} +[WARNING|modeling_utils.py:388] 2022-03-10 21:38:41,452 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:37:46,566 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:38:44,785 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:37:46,566 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:38:44,785 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:37:46,566 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 8.857, 'learning_rate': 6.090000000000001e-06, 'epoch': 0.23} +[WARNING|modeling_utils.py:388] 2022-03-10 21:38:48,122 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:37:46,566 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:38:48,122 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:37:46,566 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:38:51,396 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:37:46,566 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:38:51,396 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:37:46,566 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:38:51,396 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:37:46,566 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:38:51,396 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:37:46,566 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:38:57,874 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:37:46,566 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:38:57,874 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:37:46,566 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:38:57,874 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:37:46,566 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:38:57,874 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:37:46,566 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:38:57,874 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:37:46,566 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 206/17840 [18:23<29:45:16, 6.07s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:39:05,966 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 206/17840 [18:23<29:45:16, 6.07s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:39:05,966 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 206/17840 [18:23<29:45:16, 6.07s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:39:05,966 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 206/17840 [18:23<29:45:16, 6.07s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:39:05,966 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 207/17840 [18:30<30:15:09, 6.18s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:39:12,391 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 207/17840 [18:30<30:15:09, 6.18s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:39:12,391 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 207/17840 [18:30<30:15:09, 6.18s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:39:12,391 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 207/17840 [18:30<30:15:09, 6.18s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:39:12,391 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 208/17840 [18:36<30:37:36, 6.25s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:39:12,391 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:39:20,396 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:39:12,391 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:39:20,396 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:39:12,391 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:39:20,396 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:39:12,391 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 209/17840 [18:43<30:47:58, 6.29s/it]g-point operations will not be computed-10 21:39:12,391 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:39:26,728 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:39:12,391 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:39:26,728 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:39:12,391 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:39:26,728 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:39:12,391 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 210/17840 [18:49<30:50:53, 6.30s/it]g-point operations will not be computed-10 21:39:12,391 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:39:33,027 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:39:12,391 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:39:33,027 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:39:12,391 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:39:33,027 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:39:12,391 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 211/17840 [18:55<30:47:18, 6.29s/it]g-point operations will not be computed-10 21:39:12,391 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:39:39,266 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:39:12,391 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:39:39,266 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:39:12,391 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:39:39,266 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:39:12,391 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 212/17840 [19:02<30:45:39, 6.28s/it]g-point operations will not be computed-10 21:39:12,391 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:39:45,508 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:39:12,391 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:39:45,508 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:39:12,391 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:39:45,508 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:39:12,391 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 213/17840 [19:08<30:42:32, 6.27s/it]g-point operations will not be computed-10 21:39:12,391 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 213/17840 [19:08<30:42:32, 6.27s/it]g-point operations will not be computed-10 21:39:12,391 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:39:53,282 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:39:12,391 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:39:53,282 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:39:12,391 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 214/17840 [19:14<30:34:35, 6.25s/it]g-point operations will not be computed-10 21:39:12,391 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 214/17840 [19:14<30:34:35, 6.25s/it]g-point operations will not be computed-10 21:39:12,391 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:39:59,410 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:39:12,391 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:39:59,410 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:39:12,391 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 215/17840 [19:20<30:20:24, 6.20s/it]g-point operations will not be computed-10 21:39:12,391 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 215/17840 [19:20<30:20:24, 6.20s/it]g-point operations will not be computed-10 21:39:12,391 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:40:05,516 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:39:12,391 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:40:05,516 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:39:12,391 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 216/17840 [19:26<30:17:54, 6.19s/it]g-point operations will not be computed-10 21:39:12,391 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 216/17840 [19:26<30:17:54, 6.19s/it]g-point operations will not be computed-10 21:39:12,391 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:40:11,610 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:39:12,391 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:40:11,610 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:39:12,391 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 217/17840 [19:32<30:06:37, 6.15s/it]g-point operations will not be computed-10 21:39:12,391 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 217/17840 [19:32<30:06:37, 6.15s/it]g-point operations will not be computed-10 21:39:12,391 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:40:17,671 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:39:12,391 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:40:17,671 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:39:12,391 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 218/17840 [19:38<29:54:26, 6.11s/it]g-point operations will not be computed-10 21:39:12,391 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:40:22,162 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:39:12,391 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:40:22,162 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:39:12,391 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:40:22,162 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:39:12,391 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 219/17840 [19:44<29:38:34, 6.06s/it]g-point operations will not be computed-10 21:39:12,391 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:40:28,110 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:39:12,391 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:40:28,110 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:39:12,391 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:40:28,110 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:39:12,391 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 220/17840 [19:50<29:32:30, 6.04s/it]g-point operations will not be computed-10 21:39:12,391 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:40:34,100 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:39:12,391 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:40:34,100 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:39:12,391 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:40:34,100 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:39:12,391 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 221/17840 [19:56<29:24:16, 6.01s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:40:38,539 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 221/17840 [19:56<29:24:16, 6.01s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:40:38,539 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 221/17840 [19:56<29:24:16, 6.01s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:40:38,539 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 221/17840 [19:56<29:24:16, 6.01s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:40:38,539 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 222/17840 [20:02<29:15:29, 5.98s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:40:44,426 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 222/17840 [20:02<29:15:29, 5.98s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:40:44,426 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:40:48,784 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:40:44,426 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:40:48,784 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:40:44,426 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 8.6606, 'learning_rate': 6.69e-06, 'epoch': 0.25} +[WARNING|modeling_utils.py:388] 2022-03-10 21:40:48,784 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:40:44,426 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:40:54,510 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:40:44,426 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:40:54,510 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:40:44,426 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 8.6133, 'learning_rate': 6.72e-06, 'epoch': 0.25} +[WARNING|modeling_utils.py:388] 2022-03-10 21:40:58,793 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:40:44,426 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 225/17840 [20:20<29:06:23, 5.95s/it]g-point operations will not be computed-10 21:40:44,426 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 225/17840 [20:20<29:06:23, 5.95s/it]g-point operations will not be computed-10 21:40:44,426 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 8.4904, 'learning_rate': 6.750000000000001e-06, 'epoch': 0.25} +[WARNING|modeling_utils.py:388] 2022-03-10 21:41:05,010 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:40:44,426 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 226/17840 [20:26<28:53:45, 5.91s/it]g-point operations will not be computed-10 21:40:44,426 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 226/17840 [20:26<28:53:45, 5.91s/it]g-point operations will not be computed-10 21:40:44,426 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:41:09,324 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:40:44,426 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:41:12,027 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:40:44,426 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:41:12,027 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:40:44,426 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 8.4659, 'learning_rate': 6.81e-06, 'epoch': 0.25} +[WARNING|modeling_utils.py:388] 2022-03-10 21:41:12,027 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:40:44,426 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:41:17,657 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:40:44,426 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:41:17,657 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:40:44,426 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 8.4571, 'learning_rate': 6.840000000000001e-06, 'epoch': 0.26} +[WARNING|modeling_utils.py:388] 2022-03-10 21:41:21,795 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:40:44,426 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 229/17840 [20:42<27:45:42, 5.68s/it]g-point operations will not be computed-10 21:40:44,426 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 229/17840 [20:42<27:45:42, 5.68s/it]g-point operations will not be computed-10 21:40:44,426 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:41:25,905 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:40:44,426 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:41:25,905 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:40:44,426 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:41:25,905 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:40:44,426 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 230/17840 [20:48<27:31:37, 5.63s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:41:30,081 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 230/17840 [20:48<27:31:37, 5.63s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:41:30,081 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:41:34,140 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:41:30,081 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:41:34,140 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:41:30,081 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 8.4575, 'learning_rate': 6.9300000000000006e-06, 'epoch': 0.26} +[WARNING|modeling_utils.py:388] 2022-03-10 21:41:38,185 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:41:30,081 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 232/17840 [20:59<27:01:41, 5.53s/it]g-point operations will not be computed-10 21:41:30,081 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 232/17840 [20:59<27:01:41, 5.53s/it]g-point operations will not be computed-10 21:41:30,081 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:41:42,233 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:41:30,081 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:41:42,233 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:41:30,081 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 233/17840 [21:04<26:44:00, 5.47s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:41:46,267 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|▉ | 233/17840 [21:04<26:44:00, 5.47s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:41:46,267 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 8.4948, 'learning_rate': 6.990000000000001e-06, 'epoch': 0.26} +[WARNING|modeling_utils.py:388] 2022-03-10 21:41:50,091 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:41:46,267 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:41:50,091 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:41:46,267 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 8.4332, 'learning_rate': 7.0200000000000006e-06, 'epoch': 0.26} +[WARNING|modeling_utils.py:388] 2022-03-10 21:41:53,949 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:41:46,267 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█ | 235/17840 [21:14<25:57:46, 5.31s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:41:56,513 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█ | 235/17840 [21:14<25:57:46, 5.31s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:41:56,513 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 8.5111, 'learning_rate': 7.049999999999999e-06, 'epoch': 0.26} +[WARNING|modeling_utils.py:388] 2022-03-10 21:42:00,188 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:41:56,513 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:42:00,188 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:41:56,513 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:42:02,722 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:41:56,513 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:42:02,722 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:41:56,513 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█ | 237/17840 [21:24<25:02:42, 5.12s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:42:06,372 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█ | 237/17840 [21:24<25:02:42, 5.12s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:42:06,372 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:42:08,717 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:42:06,372 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█ | 238/17840 [21:29<24:31:33, 5.02s/it]g-point operations will not be computed-10 21:42:06,372 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█ | 238/17840 [21:29<24:31:33, 5.02s/it]g-point operations will not be computed-10 21:42:06,372 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:42:12,243 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:42:06,372 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:42:12,243 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:42:06,372 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:42:14,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:42:06,372 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:42:16,822 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:42:06,372 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:42:16,822 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:42:06,372 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:42:18,985 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:42:06,372 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:42:21,201 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:42:06,372 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:42:21,201 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:42:06,372 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:42:23,224 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:42:06,372 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:42:25,247 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:42:06,372 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:42:25,247 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:42:06,372 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:42:27,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:42:06,372 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:42:28,967 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:42:06,372 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:42:28,967 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:42:06,372 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:42:30,666 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:42:06,372 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:42:32,432 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:42:06,372 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:42:35,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:42:06,372 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:42:35,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:42:06,372 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:42:37,089 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:42:06,372 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:42:37,089 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:42:06,372 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:42:38,556 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:42:06,372 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:42:38,556 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:42:06,372 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:42:41,158 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:42:06,372 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:42:41,158 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:42:06,372 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:42:43,432 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:42:06,372 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:42:43,432 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:42:06,372 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:42:45,446 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:42:06,372 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:42:45,446 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:42:06,372 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:42:47,285 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:42:06,372 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:42:47,285 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:42:06,372 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:42:48,486 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:42:06,372 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:42:48,486 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:42:06,372 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:42:52,072 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:42:06,372 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:42:52,072 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:42:06,372 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:42:55,469 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:42:06,372 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:42:55,469 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:42:06,372 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:42:58,886 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:42:06,372 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:43:02,143 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:42:06,372 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:43:02,143 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:42:06,372 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 8.489, 'learning_rate': 7.5600000000000005e-06, 'epoch': 0.28} +[WARNING|modeling_utils.py:388] 2022-03-10 21:43:05,523 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:42:06,372 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:43:05,523 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:42:06,372 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:43:05,523 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:42:06,372 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:43:08,768 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:42:06,372 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:43:12,027 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:42:06,372 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:43:12,027 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:42:06,372 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:43:12,027 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:42:06,372 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:43:15,285 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:42:06,372 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:43:15,285 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:42:06,372 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:43:20,211 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:42:06,372 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:43:20,211 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:42:06,372 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█ | 255/17840 [22:41<28:48:05, 5.90s/it]g-point operations will not be computed-10 21:42:06,372 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█ | 255/17840 [22:41<28:48:05, 5.90s/it]g-point operations will not be computed-10 21:42:06,372 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:43:26,687 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:42:06,372 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█ | 256/17840 [22:47<29:39:41, 6.07s/it]g-point operations will not be computed-10 21:42:06,372 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█ | 256/17840 [22:47<29:39:41, 6.07s/it]g-point operations will not be computed-10 21:42:06,372 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 8.3869, 'learning_rate': 7.680000000000001e-06, 'epoch': 0.29} + 1%|█ | 256/17840 [22:47<29:39:41, 6.07s/it]g-point operations will not be computed-10 21:42:06,372 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:43:34,684 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:42:06,372 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:43:34,684 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:42:06,372 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 8.3575, 'learning_rate': 7.71e-06, 'epoch': 0.29} +[WARNING|modeling_utils.py:388] 2022-03-10 21:43:34,684 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:42:06,372 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:43:41,113 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:42:06,372 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:43:41,113 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:42:06,372 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 8.297, 'learning_rate': 7.74e-06, 'epoch': 0.29} +[WARNING|modeling_utils.py:388] 2022-03-10 21:43:41,113 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:42:06,372 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:43:41,113 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:42:06,372 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:43:41,113 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:42:06,372 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█ | 259/17840 [23:07<30:44:09, 6.29s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:43:49,169 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█ | 259/17840 [23:07<30:44:09, 6.29s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:43:49,169 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█ | 259/17840 [23:07<30:44:09, 6.29s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:43:49,169 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█ | 259/17840 [23:07<30:44:09, 6.29s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:43:49,169 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█ | 260/17840 [23:13<30:52:54, 6.32s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:43:49,169 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:43:57,059 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:43:49,169 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:43:57,059 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:43:49,169 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:43:57,059 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:43:49,169 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█ | 261/17840 [23:19<30:43:54, 6.29s/it]g-point operations will not be computed-10 21:43:49,169 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:44:03,231 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:43:49,169 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:44:03,231 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:43:49,169 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:44:03,231 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:43:49,169 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█ | 262/17840 [23:25<30:27:40, 6.24s/it]g-point operations will not be computed-10 21:43:49,169 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:44:09,354 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:43:49,169 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:44:09,354 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:43:49,169 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:44:09,354 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:43:49,169 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█ | 263/17840 [23:32<30:24:56, 6.23s/it]g-point operations will not be computed-10 21:43:49,169 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:44:15,586 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:43:49,169 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:44:15,586 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:43:49,169 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:44:15,586 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:43:49,169 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█ | 264/17840 [23:38<30:19:11, 6.21s/it]g-point operations will not be computed-10 21:43:49,169 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:44:21,750 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:43:49,169 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:44:21,750 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:43:49,169 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:44:21,750 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:43:49,169 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█▏ | 265/17840 [23:44<30:13:36, 6.19s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:44:26,372 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█▏ | 265/17840 [23:44<30:13:36, 6.19s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:44:26,372 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█▏ | 265/17840 [23:44<30:13:36, 6.19s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:44:26,372 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█▏ | 265/17840 [23:44<30:13:36, 6.19s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:44:26,372 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█▏ | 266/17840 [23:50<30:17:24, 6.20s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:44:32,563 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█▏ | 266/17840 [23:50<30:17:24, 6.20s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:44:32,563 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█▏ | 266/17840 [23:50<30:17:24, 6.20s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:44:32,563 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█▏ | 266/17840 [23:50<30:17:24, 6.20s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:44:32,563 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 1%|█▏ | 267/17840 [23:56<30:03:01, 6.16s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:44:32,563 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:44:40,096 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:44:32,563 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:44:40,096 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:44:32,563 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:44:40,096 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:44:32,563 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▏ | 268/17840 [24:02<29:51:23, 6.12s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:44:44,699 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▏ | 268/17840 [24:02<29:51:23, 6.12s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:44:44,699 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▏ | 268/17840 [24:02<29:51:23, 6.12s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:44:44,699 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▏ | 268/17840 [24:02<29:51:23, 6.12s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:44:44,699 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▏ | 269/17840 [24:08<29:46:56, 6.10s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:44:50,742 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▏ | 269/17840 [24:08<29:46:56, 6.10s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:44:50,742 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▏ | 269/17840 [24:08<29:46:56, 6.10s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:44:50,742 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▏ | 269/17840 [24:08<29:46:56, 6.10s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:44:50,742 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▏ | 270/17840 [24:14<29:46:46, 6.10s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:44:56,786 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▏ | 270/17840 [24:14<29:46:46, 6.10s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:44:56,786 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:45:01,203 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:44:56,786 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:45:01,203 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:44:56,786 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 8.1452, 'learning_rate': 8.13e-06, 'epoch': 0.3} +[WARNING|modeling_utils.py:388] 2022-03-10 21:45:01,203 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:44:56,786 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:45:07,166 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:44:56,786 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:45:07,166 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:44:56,786 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 8.1497, 'learning_rate': 8.160000000000001e-06, 'epoch': 0.3} +[WARNING|modeling_utils.py:388] 2022-03-10 21:45:07,166 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:44:56,786 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:45:12,996 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:44:56,786 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:45:12,996 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:44:56,786 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 8.059, 'learning_rate': 8.190000000000001e-06, 'epoch': 0.31} +[WARNING|modeling_utils.py:388] 2022-03-10 21:45:12,996 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:44:56,786 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:45:18,879 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:44:56,786 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:45:18,879 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:44:56,786 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:45:21,857 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:44:56,786 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:45:21,857 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:44:56,786 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▏ | 275/17840 [24:44<29:30:15, 6.05s/it]g-point operations will not be computed-10 21:44:56,786 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▏ | 275/17840 [24:44<29:30:15, 6.05s/it]g-point operations will not be computed-10 21:44:56,786 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 8.215, 'learning_rate': 8.25e-06, 'epoch': 0.31} +[WARNING|modeling_utils.py:388] 2022-03-10 21:45:29,558 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:44:56,786 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▏ | 276/17840 [24:50<29:08:17, 5.97s/it]g-point operations will not be computed-10 21:44:56,786 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▏ | 276/17840 [24:50<29:08:17, 5.97s/it]g-point operations will not be computed-10 21:44:56,786 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 8.0676, 'learning_rate': 8.28e-06, 'epoch': 0.31} +[WARNING|modeling_utils.py:388] 2022-03-10 21:45:35,259 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:44:56,786 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▏ | 277/17840 [24:56<28:43:16, 5.89s/it]g-point operations will not be computed-10 21:44:56,786 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▏ | 277/17840 [24:56<28:43:16, 5.89s/it]g-point operations will not be computed-10 21:44:56,786 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:45:39,526 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:44:56,786 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:45:39,526 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:44:56,786 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▏ | 278/17840 [25:01<28:24:11, 5.82s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:45:43,799 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▏ | 278/17840 [25:01<28:24:11, 5.82s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:45:43,799 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 8.0933, 'learning_rate': 8.340000000000001e-06, 'epoch': 0.31} +[WARNING|modeling_utils.py:388] 2022-03-10 21:45:47,922 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:45:43,799 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:45:47,922 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:45:43,799 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 8.1058, 'learning_rate': 8.370000000000001e-06, 'epoch': 0.31} +[WARNING|modeling_utils.py:388] 2022-03-10 21:45:52,131 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:45:43,799 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:45:52,131 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:45:43,799 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▏ | 280/17840 [25:13<27:48:16, 5.70s/it]g-point operations will not be computed-10 21:45:43,799 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:45:56,300 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:45:43,799 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:45:56,300 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:45:43,799 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:45:56,300 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:45:43,799 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▏ | 281/17840 [25:18<27:32:40, 5.65s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:46:00,412 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▏ | 281/17840 [25:18<27:32:40, 5.65s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:46:00,412 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▏ | 281/17840 [25:18<27:32:40, 5.65s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:46:00,412 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:46:04,414 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:46:00,412 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:46:04,414 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:46:00,412 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:46:08,377 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:46:00,412 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:46:08,377 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:46:00,412 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▏ | 283/17840 [25:29<26:40:33, 5.47s/it]g-point operations will not be computed-10 21:46:00,412 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:46:12,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:46:00,412 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:46:12,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:46:00,412 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:46:12,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:46:00,412 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▏ | 284/17840 [25:34<26:08:13, 5.36s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:46:16,074 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:46:18,579 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:46:16,074 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▏ | 285/17840 [25:39<25:42:20, 5.27s/it]g-point operations will not be computed-10 21:46:16,074 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▏ | 285/17840 [25:39<25:42:20, 5.27s/it]g-point operations will not be computed-10 21:46:16,074 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:46:22,342 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:46:16,074 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:46:24,774 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:46:16,074 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:46:24,774 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:46:16,074 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 7.9205, 'learning_rate': 8.58e-06, 'epoch': 0.32} +[WARNING|modeling_utils.py:388] 2022-03-10 21:46:28,429 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:46:16,074 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▏ | 287/17840 [25:49<24:44:06, 5.07s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:46:30,881 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▏ | 287/17840 [25:49<24:44:06, 5.07s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:46:30,881 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:46:33,205 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:46:30,881 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:46:33,205 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:46:30,881 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▏ | 288/17840 [25:54<24:15:41, 4.98s/it]g-point operations will not be computed-10 21:46:30,881 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:46:36,682 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:46:30,881 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:46:36,682 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:46:30,881 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:46:38,873 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:46:30,881 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:46:38,873 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:46:30,881 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:46:42,211 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:46:30,881 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:46:42,211 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:46:30,881 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▏ | 290/17840 [26:02<22:55:09, 4.70s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:46:44,399 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▏ | 290/17840 [26:02<22:55:09, 4.70s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:46:44,399 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:46:46,373 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:46:44,399 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▏ | 291/17840 [26:07<22:04:53, 4.53s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:46:48,436 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▏ | 291/17840 [26:07<22:04:53, 4.53s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:46:48,436 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▏ | 292/17840 [26:10<21:06:29, 4.33s/it]g-point operations will not be computed-10 21:46:48,436 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▏ | 292/17840 [26:10<21:06:29, 4.33s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:46:52,247 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▏ | 292/17840 [26:10<21:06:29, 4.33s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:46:52,247 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▏ | 293/17840 [26:14<20:07:28, 4.13s/it]g-point operations will not be computed-10 21:46:52,247 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▏ | 293/17840 [26:14<20:07:28, 4.13s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:46:55,848 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▏ | 293/17840 [26:14<20:07:28, 4.13s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:46:55,848 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 294/17840 [26:17<19:01:45, 3.90s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:46:59,142 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 294/17840 [26:17<19:01:45, 3.90s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:46:59,142 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 295/17840 [26:21<17:45:47, 3.64s/it]g-point operations will not be computed-10 21:46:59,142 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:47:03,385 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:47:02,095 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:47:03,385 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:47:02,095 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 296/17840 [26:23<16:21:02, 3.36s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:47:04,673 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 296/17840 [26:23<16:21:02, 3.36s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:47:04,673 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 297/17840 [26:26<14:52:48, 3.05s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:47:06,973 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 297/17840 [26:26<14:52:48, 3.05s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:47:06,973 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 298/17840 [26:28<13:28:41, 2.77s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:47:08,989 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 298/17840 [26:28<13:28:41, 2.77s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:47:08,989 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:47:11,576 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:47:10,806 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:47:11,576 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:47:10,806 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 300/17840 [26:32<11:33:42, 2.37s/it]g-point operations will not be computed-10 21:47:10,806 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 300/17840 [26:32<11:33:42, 2.37s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:47:14,296 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:47:17,796 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:47:14,296 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:47:17,796 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:47:14,296 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 301/17840 [26:39<18:28:30, 3.79s/it]g-point operations will not be computed-10 21:47:14,296 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 301/17840 [26:39<18:28:30, 3.79s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:47:21,252 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 301/17840 [26:39<18:28:30, 3.79s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:47:21,252 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:47:24,547 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:47:21,252 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:47:24,547 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:47:21,252 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 302/17840 [26:45<22:42:25, 4.66s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:47:27,955 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 302/17840 [26:45<22:42:25, 4.66s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:47:27,955 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:47:31,281 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:47:27,955 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:47:31,281 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:47:27,955 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 303/17840 [26:52<25:46:49, 5.29s/it]g-point operations will not be computed-10 21:47:27,955 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 303/17840 [26:52<25:46:49, 5.29s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:47:34,658 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:47:37,937 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:47:34,658 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:47:37,937 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:47:34,658 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 304/17840 [26:59<27:41:59, 5.69s/it]g-point operations will not be computed-10 21:47:34,658 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 304/17840 [26:59<27:41:59, 5.69s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:47:41,266 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:47:44,509 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:47:41,266 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 305/17840 [27:05<28:56:48, 5.94s/it]g-point operations will not be computed-10 21:47:41,266 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 305/17840 [27:05<28:56:48, 5.94s/it]g-point operations will not be computed-10 21:47:41,266 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 8.0586, 'learning_rate': 9.15e-06, 'epoch': 0.34} + 2%|█▎ | 305/17840 [27:05<28:56:48, 5.94s/it]g-point operations will not be computed-10 21:47:41,266 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:47:52,613 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:47:41,266 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:47:52,613 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:47:41,266 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 8.0814, 'learning_rate': 9.18e-06, 'epoch': 0.34} +[WARNING|modeling_utils.py:388] 2022-03-10 21:47:52,613 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:47:41,266 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:47:59,096 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:47:41,266 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:47:59,096 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:47:41,266 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 8.0176, 'learning_rate': 9.21e-06, 'epoch': 0.34} +[WARNING|modeling_utils.py:388] 2022-03-10 21:47:59,096 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:47:41,266 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:47:59,096 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:47:41,266 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:47:59,096 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:47:41,266 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 308/17840 [27:25<30:45:44, 6.32s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:48:07,288 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 308/17840 [27:25<30:45:44, 6.32s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:48:07,288 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 308/17840 [27:25<30:45:44, 6.32s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:48:07,288 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 308/17840 [27:25<30:45:44, 6.32s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:48:07,288 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 309/17840 [27:31<30:53:29, 6.34s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:48:07,288 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:48:15,307 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:48:07,288 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:48:15,307 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:48:07,288 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 310/17840 [27:38<30:59:24, 6.36s/it]g-point operations will not be computed-10 21:48:07,288 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 310/17840 [27:38<30:59:24, 6.36s/it]g-point operations will not be computed-10 21:48:07,288 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 7.879, 'learning_rate': 9.3e-06, 'epoch': 0.35} +[WARNING|modeling_utils.py:388] 2022-03-10 21:48:23,177 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:48:07,288 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 311/17840 [27:44<30:52:44, 6.34s/it]g-point operations will not be computed-10 21:48:07,288 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 311/17840 [27:44<30:52:44, 6.34s/it]g-point operations will not be computed-10 21:48:07,288 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 7.9173, 'learning_rate': 9.33e-06, 'epoch': 0.35} +[WARNING|modeling_utils.py:388] 2022-03-10 21:48:29,467 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:48:07,288 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 312/17840 [27:50<30:43:40, 6.31s/it]g-point operations will not be computed-10 21:48:07,288 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 312/17840 [27:50<30:43:40, 6.31s/it]g-point operations will not be computed-10 21:48:07,288 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 7.9007, 'learning_rate': 9.36e-06, 'epoch': 0.35} +[WARNING|modeling_utils.py:388] 2022-03-10 21:48:35,712 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:48:07,288 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 313/17840 [27:56<30:38:48, 6.29s/it]g-point operations will not be computed-10 21:48:07,288 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 313/17840 [27:56<30:38:48, 6.29s/it]g-point operations will not be computed-10 21:48:07,288 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 7.8522, 'learning_rate': 9.39e-06, 'epoch': 0.35} +[WARNING|modeling_utils.py:388] 2022-03-10 21:48:41,956 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:48:07,288 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 314/17840 [28:03<30:32:24, 6.27s/it]g-point operations will not be computed-10 21:48:07,288 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 314/17840 [28:03<30:32:24, 6.27s/it]g-point operations will not be computed-10 21:48:07,288 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 7.8594, 'learning_rate': 9.42e-06, 'epoch': 0.35} +[WARNING|modeling_utils.py:388] 2022-03-10 21:48:48,181 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:48:07,288 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 315/17840 [28:09<30:31:05, 6.27s/it]g-point operations will not be computed-10 21:48:07,288 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 315/17840 [28:09<30:31:05, 6.27s/it]g-point operations will not be computed-10 21:48:07,288 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 7.779, 'learning_rate': 9.450000000000001e-06, 'epoch': 0.35} +[WARNING|modeling_utils.py:388] 2022-03-10 21:48:54,322 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:48:07,288 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 316/17840 [28:15<30:19:11, 6.23s/it]g-point operations will not be computed-10 21:48:07,288 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 316/17840 [28:15<30:19:11, 6.23s/it]g-point operations will not be computed-10 21:48:07,288 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 7.8403, 'learning_rate': 9.48e-06, 'epoch': 0.35} +[WARNING|modeling_utils.py:388] 2022-03-10 21:49:00,458 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:48:07,288 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 317/17840 [28:21<30:07:07, 6.19s/it]g-point operations will not be computed-10 21:48:07,288 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 317/17840 [28:21<30:07:07, 6.19s/it]g-point operations will not be computed-10 21:48:07,288 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 7.7905, 'learning_rate': 9.51e-06, 'epoch': 0.36} +[WARNING|modeling_utils.py:388] 2022-03-10 21:49:06,497 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:48:07,288 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 318/17840 [28:27<29:53:26, 6.14s/it]g-point operations will not be computed-10 21:48:07,288 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 318/17840 [28:27<29:53:26, 6.14s/it]g-point operations will not be computed-10 21:48:07,288 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 7.8223, 'learning_rate': 9.54e-06, 'epoch': 0.36} +[WARNING|modeling_utils.py:388] 2022-03-10 21:49:12,553 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:48:07,288 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 319/17840 [28:33<29:47:52, 6.12s/it]g-point operations will not be computed-10 21:48:07,288 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 319/17840 [28:33<29:47:52, 6.12s/it]g-point operations will not be computed-10 21:48:07,288 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 7.7035, 'learning_rate': 9.57e-06, 'epoch': 0.36} +[WARNING|modeling_utils.py:388] 2022-03-10 21:49:18,638 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:48:07,288 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 320/17840 [28:39<29:42:48, 6.11s/it]g-point operations will not be computed-10 21:48:07,288 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 320/17840 [28:39<29:42:48, 6.11s/it]g-point operations will not be computed-10 21:48:07,288 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 7.8657, 'learning_rate': 9.600000000000001e-06, 'epoch': 0.36} +[WARNING|modeling_utils.py:388] 2022-03-10 21:49:24,629 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:48:07,288 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 321/17840 [28:45<29:31:16, 6.07s/it]g-point operations will not be computed-10 21:48:07,288 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 321/17840 [28:45<29:31:16, 6.07s/it]g-point operations will not be computed-10 21:48:07,288 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:49:29,117 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:48:07,288 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:49:29,117 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:48:07,288 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:49:29,117 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:48:07,288 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▎ | 322/17840 [28:51<29:20:59, 6.03s/it]g-point operations will not be computed-10 21:48:07,288 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:49:35,097 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:48:07,288 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:49:35,097 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:48:07,288 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:49:35,097 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:48:07,288 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▍ | 323/17840 [28:57<29:14:43, 6.01s/it]g-point operations will not be computed-10 21:48:07,288 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:49:41,027 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:48:07,288 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:49:41,027 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:48:07,288 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:49:41,027 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:48:07,288 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▍ | 324/17840 [29:03<29:04:51, 5.98s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:49:45,415 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▍ | 324/17840 [29:03<29:04:51, 5.98s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:49:45,415 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▍ | 324/17840 [29:03<29:04:51, 5.98s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:49:45,415 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▍ | 324/17840 [29:03<29:04:51, 5.98s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:49:45,415 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▍ | 325/17840 [29:09<29:24:39, 6.05s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:49:51,659 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▍ | 325/17840 [29:09<29:24:39, 6.05s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:49:51,659 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:49:55,901 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:49:51,659 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:49:55,901 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:49:51,659 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 7.7159, 'learning_rate': 9.780000000000001e-06, 'epoch': 0.37} +[WARNING|modeling_utils.py:388] 2022-03-10 21:50:00,190 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:49:51,659 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▍ | 327/17840 [29:21<28:38:11, 5.89s/it]g-point operations will not be computed-10 21:49:51,659 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▍ | 327/17840 [29:21<28:38:11, 5.89s/it]g-point operations will not be computed-10 21:49:51,659 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 7.6492, 'learning_rate': 9.810000000000001e-06, 'epoch': 0.37} +[WARNING|modeling_utils.py:388] 2022-03-10 21:50:05,887 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:49:51,659 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▍ | 328/17840 [29:26<28:22:09, 5.83s/it]g-point operations will not be computed-10 21:49:51,659 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▍ | 328/17840 [29:26<28:22:09, 5.83s/it]g-point operations will not be computed-10 21:49:51,659 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:50:10,112 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:49:51,659 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:50:10,112 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:49:51,659 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▍ | 329/17840 [29:32<28:09:21, 5.79s/it]g-point operations will not be computed-10 21:49:51,659 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▍ | 329/17840 [29:32<28:09:21, 5.79s/it]g-point operations will not be computed-10 21:49:51,659 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:50:15,818 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:49:51,659 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:50:18,523 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:49:51,659 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:50:18,523 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:49:51,659 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 7.7348, 'learning_rate': 9.9e-06, 'epoch': 0.37} +[WARNING|modeling_utils.py:388] 2022-03-10 21:50:22,606 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:49:51,659 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▍ | 331/17840 [29:43<27:22:23, 5.63s/it]g-point operations will not be computed-10 21:49:51,659 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▍ | 331/17840 [29:43<27:22:23, 5.63s/it]g-point operations will not be computed-10 21:49:51,659 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:50:26,672 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:49:51,659 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:50:26,672 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:49:51,659 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▍ | 332/17840 [29:49<27:03:32, 5.56s/it]g-point operations will not be computed-10 21:49:51,659 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▍ | 332/17840 [29:49<27:03:32, 5.56s/it]g-point operations will not be computed-10 21:49:51,659 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:50:32,110 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:49:51,659 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:50:32,110 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:49:51,659 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:50:34,722 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:49:51,659 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:50:34,722 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:49:51,659 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:50:38,660 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:49:51,659 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:50:38,660 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:49:51,659 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▍ | 334/17840 [29:59<26:17:55, 5.41s/it]g-point operations will not be computed-10 21:49:51,659 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:50:42,525 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:49:51,659 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:50:44,979 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:49:51,659 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:50:44,979 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:49:51,659 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 7.7568, 'learning_rate': 1.005e-05, 'epoch': 0.38} +[WARNING|modeling_utils.py:388] 2022-03-10 21:50:48,850 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:49:51,659 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▍ | 336/17840 [30:09<25:30:44, 5.25s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:50:51,390 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▍ | 336/17840 [30:09<25:30:44, 5.25s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:50:51,390 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 7.5586, 'learning_rate': 1.008e-05, 'epoch': 0.38} +[WARNING|modeling_utils.py:388] 2022-03-10 21:50:54,983 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:50:51,390 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:50:54,983 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:50:51,390 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:50:57,467 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:50:51,390 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:50:59,799 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:50:51,390 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:50:59,799 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:50:51,390 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:50:59,799 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:50:51,390 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:51:03,315 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:50:51,390 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▍ | 339/17840 [30:24<23:55:20, 4.92s/it]g-point operations will not be computed-10 21:50:51,390 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▍ | 339/17840 [30:24<23:55:20, 4.92s/it]g-point operations will not be computed-10 21:50:51,390 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:51:06,715 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:50:51,390 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:51:08,849 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:50:51,390 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:51:08,849 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:50:51,390 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:51:10,988 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:50:51,390 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:51:13,008 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:50:51,390 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:51:13,008 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:50:51,390 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:51:15,043 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:50:51,390 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:51:16,910 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:50:51,390 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:51:16,910 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:50:51,390 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:51:18,803 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:50:51,390 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:51:20,570 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:50:51,390 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:51:20,570 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:50:51,390 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:51:22,396 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:50:51,390 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:51:25,607 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:50:51,390 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:51:25,607 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:50:51,390 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:51:27,083 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:50:51,390 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:51:27,083 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:50:51,390 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:51:29,819 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:50:51,390 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:51:29,819 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:50:51,390 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:51:31,137 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:50:51,390 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:51:33,407 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:50:51,390 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:51:33,407 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:50:51,390 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:51:35,428 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:50:51,390 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:51:35,428 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:50:51,390 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:51:37,221 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:50:51,390 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:51:37,221 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:50:51,390 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:51:38,415 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:50:51,390 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:51:38,415 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:50:51,390 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 7.2378, 'learning_rate': 1.05e-05, 'epoch': 0.39} +[WARNING|modeling_utils.py:388] 2022-03-10 21:51:42,059 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:50:51,390 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:51:45,468 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:50:51,390 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:51:45,468 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:50:51,390 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 7.7271, 'learning_rate': 1.0529999999999999e-05, 'epoch': 0.39} +[WARNING|modeling_utils.py:388] 2022-03-10 21:51:48,871 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:50:51,390 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:51:48,871 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:50:51,390 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:51:48,871 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:50:51,390 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:51:52,189 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:50:51,390 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:51:55,544 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:50:51,390 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:51:55,544 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:50:51,390 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:51:55,544 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:50:51,390 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:51:58,816 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:50:51,390 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:52:02,137 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:50:51,390 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:52:02,137 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:50:51,390 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:52:05,374 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:50:51,390 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:52:05,374 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:50:51,390 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:52:08,639 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:50:51,390 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:52:11,846 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:50:51,390 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:52:11,846 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:50:51,390 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 7.7332, 'learning_rate': 1.065e-05, 'epoch': 0.4} +[WARNING|modeling_utils.py:388] 2022-03-10 21:52:11,846 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:50:51,390 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:52:18,322 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:50:51,390 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:52:18,322 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:50:51,390 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 7.5851, 'learning_rate': 1.068e-05, 'epoch': 0.4} +[WARNING|modeling_utils.py:388] 2022-03-10 21:52:18,322 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:50:51,390 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:52:24,789 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:50:51,390 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:52:24,789 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:50:51,390 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 7.7198, 'learning_rate': 1.0709999999999999e-05, 'epoch': 0.4} +[WARNING|modeling_utils.py:388] 2022-03-10 21:52:24,789 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:50:51,390 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:52:24,789 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:50:51,390 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 358/17840 [31:50<30:32:17, 6.29s/it]g-point operations will not be computed-10 21:50:51,390 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 358/17840 [31:50<30:32:17, 6.29s/it]g-point operations will not be computed-10 21:50:51,390 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:52:34,596 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:50:51,390 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:52:34,596 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:50:51,390 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 359/17840 [31:57<30:42:55, 6.33s/it]g-point operations will not be computed-10 21:50:51,390 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 359/17840 [31:57<30:42:55, 6.33s/it]g-point operations will not be computed-10 21:50:51,390 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 7.4263, 'learning_rate': 1.077e-05, 'epoch': 0.4} +[WARNING|modeling_utils.py:388] 2022-03-10 21:52:42,508 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:50:51,390 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 360/17840 [32:03<30:42:33, 6.32s/it]g-point operations will not be computed-10 21:50:51,390 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 360/17840 [32:03<30:42:33, 6.32s/it]g-point operations will not be computed-10 21:50:51,390 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:52:47,214 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:50:51,390 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:52:47,214 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:50:51,390 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 361/17840 [32:09<30:33:17, 6.29s/it]g-point operations will not be computed-10 21:50:51,390 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 361/17840 [32:09<30:33:17, 6.29s/it]g-point operations will not be computed-10 21:50:51,390 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 7.4441, 'learning_rate': 1.083e-05, 'epoch': 0.4} +[WARNING|modeling_utils.py:388] 2022-03-10 21:52:54,928 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:50:51,390 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 362/17840 [32:16<30:22:25, 6.26s/it]g-point operations will not be computed-10 21:50:51,390 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 362/17840 [32:16<30:22:25, 6.26s/it]g-point operations will not be computed-10 21:50:51,390 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 7.4888, 'learning_rate': 1.086e-05, 'epoch': 0.41} +[WARNING|modeling_utils.py:388] 2022-03-10 21:53:01,075 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:50:51,390 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 363/17840 [32:22<30:12:08, 6.22s/it]g-point operations will not be computed-10 21:50:51,390 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 363/17840 [32:22<30:12:08, 6.22s/it]g-point operations will not be computed-10 21:50:51,390 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 7.4343, 'learning_rate': 1.089e-05, 'epoch': 0.41} +[WARNING|modeling_utils.py:388] 2022-03-10 21:53:07,262 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:50:51,390 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 364/17840 [32:28<30:12:23, 6.22s/it]g-point operations will not be computed-10 21:50:51,390 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 364/17840 [32:28<30:12:23, 6.22s/it]g-point operations will not be computed-10 21:50:51,390 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 7.4771, 'learning_rate': 1.092e-05, 'epoch': 0.41} +[WARNING|modeling_utils.py:388] 2022-03-10 21:53:13,431 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:50:51,390 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 365/17840 [32:34<30:05:30, 6.20s/it]g-point operations will not be computed-10 21:50:51,390 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 365/17840 [32:34<30:05:30, 6.20s/it]g-point operations will not be computed-10 21:50:51,390 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 7.4433, 'learning_rate': 1.095e-05, 'epoch': 0.41} +[WARNING|modeling_utils.py:388] 2022-03-10 21:53:19,472 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:50:51,390 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 366/17840 [32:40<29:50:05, 6.15s/it]g-point operations will not be computed-10 21:50:51,390 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 366/17840 [32:40<29:50:05, 6.15s/it]g-point operations will not be computed-10 21:50:51,390 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 7.3479, 'learning_rate': 1.098e-05, 'epoch': 0.41} +[WARNING|modeling_utils.py:388] 2022-03-10 21:53:25,487 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:50:51,390 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 367/17840 [32:46<29:36:32, 6.10s/it]g-point operations will not be computed-10 21:50:51,390 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 367/17840 [32:46<29:36:32, 6.10s/it]g-point operations will not be computed-10 21:50:51,390 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:53:30,006 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:50:51,390 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:53:30,006 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:50:51,390 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 368/17840 [32:52<29:27:31, 6.07s/it]g-point operations will not be computed-10 21:50:51,390 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 368/17840 [32:52<29:27:31, 6.07s/it]g-point operations will not be computed-10 21:50:51,390 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:53:36,036 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:50:51,390 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:53:36,036 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:50:51,390 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 369/17840 [32:58<29:25:27, 6.06s/it]g-point operations will not be computed-10 21:50:51,390 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 369/17840 [32:58<29:25:27, 6.06s/it]g-point operations will not be computed-10 21:50:51,390 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:53:42,024 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:50:51,390 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:53:42,024 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:50:51,390 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 370/17840 [33:04<29:17:51, 6.04s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:53:46,540 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 370/17840 [33:04<29:17:51, 6.04s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:53:46,540 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 7.5116, 'learning_rate': 1.11e-05, 'epoch': 0.41} + 2%|█▌ | 370/17840 [33:04<29:17:51, 6.04s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:53:46,540 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 370/17840 [33:04<29:17:51, 6.04s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:53:46,540 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 371/17840 [33:10<29:05:36, 6.00s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:53:52,446 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 371/17840 [33:10<29:05:36, 6.00s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:53:52,446 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:53:56,753 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:53:52,446 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:53:56,753 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:53:52,446 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 7.5289, 'learning_rate': 1.116e-05, 'epoch': 0.42} +[WARNING|modeling_utils.py:388] 2022-03-10 21:53:56,753 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:53:52,446 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:54:02,597 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:53:52,446 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:54:02,597 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:53:52,446 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 7.3819, 'learning_rate': 1.119e-05, 'epoch': 0.42} +[WARNING|modeling_utils.py:388] 2022-03-10 21:54:06,963 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:53:52,446 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 374/17840 [33:28<28:31:36, 5.88s/it]g-point operations will not be computed-10 21:53:52,446 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 374/17840 [33:28<28:31:36, 5.88s/it]g-point operations will not be computed-10 21:53:52,446 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:54:11,312 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:53:52,446 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:54:11,312 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:53:52,446 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:54:11,312 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:53:52,446 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 375/17840 [33:34<29:01:37, 5.98s/it]g-point operations will not be computed-10 21:53:52,446 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:54:17,564 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:53:52,446 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:54:17,564 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:53:52,446 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:54:17,564 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:53:52,446 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 376/17840 [33:40<28:39:58, 5.91s/it]g-point operations will not be computed-10 21:53:52,446 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:54:23,204 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:53:52,446 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:54:23,204 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:53:52,446 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:54:23,204 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:53:52,446 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 377/17840 [33:45<28:19:50, 5.84s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:54:27,503 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 377/17840 [33:45<28:19:50, 5.84s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:54:27,503 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:54:31,664 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:54:27,503 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:54:31,664 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:54:27,503 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 7.2827, 'learning_rate': 1.134e-05, 'epoch': 0.42} +[WARNING|modeling_utils.py:388] 2022-03-10 21:54:35,925 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:54:27,503 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:54:35,925 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:54:27,503 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 379/17840 [33:56<27:48:55, 5.73s/it]g-point operations will not be computed-10 21:54:27,503 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:54:40,065 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:54:27,503 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:54:40,065 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:54:27,503 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:54:40,065 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:54:27,503 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 380/17840 [34:02<27:29:49, 5.67s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:54:44,218 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▌ | 380/17840 [34:02<27:29:49, 5.67s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:54:44,218 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:54:48,288 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:54:44,218 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:54:48,288 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:54:44,218 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 7.3259, 'learning_rate': 1.143e-05, 'epoch': 0.43} +[WARNING|modeling_utils.py:388] 2022-03-10 21:54:52,363 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:54:44,218 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:54:52,363 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:54:44,218 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 382/17840 [34:13<26:52:11, 5.54s/it]g-point operations will not be computed-10 21:54:44,218 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:54:56,366 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:54:44,218 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:54:56,366 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:54:44,218 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:54:56,366 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:54:44,218 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 383/17840 [34:18<26:32:17, 5.47s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:55:00,309 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 383/17840 [34:18<26:32:17, 5.47s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:55:00,309 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:55:04,123 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:55:00,309 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:55:04,123 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:55:00,309 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 7.3634, 'learning_rate': 1.152e-05, 'epoch': 0.43} +[WARNING|modeling_utils.py:388] 2022-03-10 21:55:08,029 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:55:00,309 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:55:08,029 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:55:00,309 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 385/17840 [34:28<25:46:05, 5.31s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:55:10,642 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 385/17840 [34:28<25:46:05, 5.31s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:55:10,642 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:55:14,409 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:55:10,642 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:55:14,409 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:55:10,642 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 7.2729, 'learning_rate': 1.1580000000000001e-05, 'epoch': 0.43} +[WARNING|modeling_utils.py:388] 2022-03-10 21:55:18,267 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:55:10,642 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:55:18,267 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:55:10,642 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 387/17840 [34:39<25:07:47, 5.18s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:55:20,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:55:23,038 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:55:20,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:55:23,038 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:55:20,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 388/17840 [34:43<24:30:33, 5.06s/it]g-point operations will not be computed-10 21:55:20,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:55:26,550 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:55:20,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:55:28,783 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:55:20,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:55:28,783 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:55:20,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:55:31,051 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:55:20,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:55:33,181 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:55:20,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:55:33,181 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:55:20,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:55:35,348 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:55:20,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:55:37,355 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:55:20,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:55:37,355 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:55:20,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:55:39,476 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:55:20,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:55:41,423 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:55:20,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:55:41,423 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:55:20,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:55:43,342 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:55:20,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:55:45,167 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:55:20,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:55:45,167 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:55:20,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:55:47,021 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:55:20,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:55:47,021 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:55:20,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:55:48,704 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:55:20,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:55:50,390 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:55:20,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:55:50,390 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:55:20,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:55:53,428 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:55:20,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:55:53,428 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:55:20,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:55:54,723 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:55:20,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:55:57,184 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:55:20,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:55:57,184 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:55:20,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:55:59,275 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:55:20,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:55:59,275 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:55:20,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:56:01,150 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:55:20,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:56:01,150 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:55:20,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:56:03,310 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:55:20,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:56:03,310 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:55:20,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.9241, 'learning_rate': 1.2e-05, 'epoch': 0.45} +[WARNING|modeling_utils.py:388] 2022-03-10 21:56:06,902 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:55:20,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:56:06,902 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:55:20,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:56:06,902 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:55:20,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:56:10,318 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:55:20,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:56:13,707 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:55:20,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:56:13,707 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:55:20,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:56:17,003 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:55:20,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:56:17,003 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:55:20,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 7.7378, 'learning_rate': 1.2060000000000001e-05, 'epoch': 0.45} +[WARNING|modeling_utils.py:388] 2022-03-10 21:56:20,389 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:55:20,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:56:23,654 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:55:20,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:56:23,654 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:55:20,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 7.6943, 'learning_rate': 1.2090000000000001e-05, 'epoch': 0.45} +[WARNING|modeling_utils.py:388] 2022-03-10 21:56:26,977 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:55:20,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:56:30,202 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:55:20,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:56:30,202 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:55:20,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 7.5747, 'learning_rate': 1.2120000000000001e-05, 'epoch': 0.45} +[WARNING|modeling_utils.py:388] 2022-03-10 21:56:30,202 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:55:20,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:56:36,726 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:55:20,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:56:36,726 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:55:20,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 7.6423, 'learning_rate': 1.215e-05, 'epoch': 0.45} +[WARNING|modeling_utils.py:388] 2022-03-10 21:56:36,726 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:55:20,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:56:36,726 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:55:20,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:56:36,726 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:55:20,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 406/17840 [36:02<29:24:48, 6.07s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:56:44,936 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 406/17840 [36:02<29:24:48, 6.07s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:56:44,936 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 406/17840 [36:02<29:24:48, 6.07s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:56:44,936 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 407/17840 [36:09<30:22:35, 6.27s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:56:44,936 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 407/17840 [36:09<30:22:35, 6.27s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:56:44,936 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 7.3452, 'learning_rate': 1.221e-05, 'epoch': 0.46} +[WARNING|modeling_utils.py:388] 2022-03-10 21:56:54,964 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:56:44,936 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 408/17840 [36:16<31:00:56, 6.41s/it]g-point operations will not be computed-10 21:56:44,936 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 408/17840 [36:16<31:00:56, 6.41s/it]g-point operations will not be computed-10 21:56:44,936 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 7.2704, 'learning_rate': 1.224e-05, 'epoch': 0.46} + 2%|█▋ | 408/17840 [36:16<31:00:56, 6.41s/it]g-point operations will not be computed-10 21:56:44,936 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:57:03,254 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:56:44,936 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:57:03,254 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:56:44,936 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 7.3917, 'learning_rate': 1.227e-05, 'epoch': 0.46} +[WARNING|modeling_utils.py:388] 2022-03-10 21:57:03,254 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:56:44,936 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:57:03,254 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:56:44,936 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:57:03,254 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:56:44,936 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 410/17840 [36:29<31:17:34, 6.46s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:57:11,363 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 410/17840 [36:29<31:17:34, 6.46s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:57:11,363 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 410/17840 [36:29<31:17:34, 6.46s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:57:11,363 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▋ | 410/17840 [36:29<31:17:34, 6.46s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:57:11,363 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 411/17840 [36:35<31:01:30, 6.41s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:57:17,593 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 411/17840 [36:35<31:01:30, 6.41s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:57:17,593 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 411/17840 [36:35<31:01:30, 6.41s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:57:17,593 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 411/17840 [36:35<31:01:30, 6.41s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:57:17,593 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 412/17840 [36:41<30:43:57, 6.35s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:57:23,816 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 412/17840 [36:41<30:43:57, 6.35s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:57:23,816 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 412/17840 [36:41<30:43:57, 6.35s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:57:23,816 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 412/17840 [36:41<30:43:57, 6.35s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:57:23,816 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 413/17840 [36:48<30:31:54, 6.31s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:57:29,997 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 413/17840 [36:48<30:31:54, 6.31s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:57:29,997 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 413/17840 [36:48<30:31:54, 6.31s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:57:29,997 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 414/17840 [36:54<30:18:05, 6.26s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:57:36,167 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 414/17840 [36:54<30:18:05, 6.26s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:57:36,167 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 7.0928, 'learning_rate': 1.242e-05, 'epoch': 0.46} + 2%|█▊ | 414/17840 [36:54<30:18:05, 6.26s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:57:36,167 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 415/17840 [37:00<30:09:00, 6.23s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:57:42,319 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 415/17840 [37:00<30:09:00, 6.23s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:57:42,319 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 7.1117, 'learning_rate': 1.245e-05, 'epoch': 0.47} + 2%|█▊ | 415/17840 [37:00<30:09:00, 6.23s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:57:42,319 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 416/17840 [37:06<30:02:21, 6.21s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:57:48,469 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 416/17840 [37:06<30:02:21, 6.21s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:57:48,469 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 7.2426, 'learning_rate': 1.2479999999999999e-05, 'epoch': 0.47} + 2%|█▊ | 416/17840 [37:06<30:02:21, 6.21s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:57:48,469 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 417/17840 [37:12<29:53:59, 6.18s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:57:54,553 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 417/17840 [37:12<29:53:59, 6.18s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:57:54,553 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 7.1098, 'learning_rate': 1.251e-05, 'epoch': 0.47} + 2%|█▊ | 417/17840 [37:12<29:53:59, 6.18s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:57:54,553 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 418/17840 [37:18<29:45:10, 6.15s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:58:00,628 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 418/17840 [37:18<29:45:10, 6.15s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:58:00,628 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 7.1828, 'learning_rate': 1.254e-05, 'epoch': 0.47} + 2%|█▊ | 418/17840 [37:18<29:45:10, 6.15s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:58:00,628 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 418/17840 [37:18<29:45:10, 6.15s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:58:00,628 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 419/17840 [37:24<29:36:29, 6.12s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:58:06,659 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 419/17840 [37:24<29:36:29, 6.12s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:58:06,659 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 419/17840 [37:24<29:36:29, 6.12s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:58:06,659 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 420/17840 [37:30<29:21:01, 6.07s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:58:12,577 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|��▊ | 420/17840 [37:30<29:21:01, 6.07s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:58:12,577 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 7.2, 'learning_rate': 1.26e-05, 'epoch': 0.47} +[WARNING|modeling_utils.py:388] 2022-03-10 21:58:17,010 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:58:12,577 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:58:17,010 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:58:12,577 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 7.1794, 'learning_rate': 1.263e-05, 'epoch': 0.47} +[WARNING|modeling_utils.py:388] 2022-03-10 21:58:17,010 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:58:12,577 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:58:17,010 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:58:12,577 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:58:22,900 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:58:12,577 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:58:22,900 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:58:12,577 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:58:27,284 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:58:12,577 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:58:27,284 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:58:12,577 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 423/17840 [37:48<28:46:11, 5.95s/it]g-point operations will not be computed-10 21:58:12,577 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 423/17840 [37:48<28:46:11, 5.95s/it]g-point operations will not be computed-10 21:58:12,577 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:58:33,148 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:58:12,577 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:58:33,148 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:58:12,577 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 424/17840 [37:54<28:37:45, 5.92s/it]g-point operations will not be computed-10 21:58:12,577 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:58:37,562 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:58:12,577 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:58:37,562 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:58:12,577 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:58:37,562 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:58:12,577 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 425/17840 [38:00<29:08:58, 6.03s/it]g-point operations will not be computed-10 21:58:12,577 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:58:43,832 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:58:12,577 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:58:43,832 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:58:12,577 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:58:43,832 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:58:12,577 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 426/17840 [38:06<28:49:17, 5.96s/it]g-point operations will not be computed-10 21:58:12,577 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:58:49,554 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:58:12,577 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:58:52,328 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:58:12,577 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:58:52,328 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:58:12,577 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.9913, 'learning_rate': 1.281e-05, 'epoch': 0.48} +[WARNING|modeling_utils.py:388] 2022-03-10 21:58:52,328 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:58:12,577 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:58:57,977 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:58:12,577 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:58:57,977 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:58:12,577 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 7.3628, 'learning_rate': 1.284e-05, 'epoch': 0.48} +[WARNING|modeling_utils.py:388] 2022-03-10 21:58:57,977 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:58:12,577 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:58:57,977 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:58:12,577 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:59:03,595 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:58:12,577 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:59:03,595 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:58:12,577 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:59:07,781 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:58:12,577 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:59:07,781 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:58:12,577 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 430/17840 [38:28<27:31:24, 5.69s/it]g-point operations will not be computed-10 21:58:12,577 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:59:11,966 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:58:12,577 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:59:11,966 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:58:12,577 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:59:11,966 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:58:12,577 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 431/17840 [38:34<27:15:23, 5.64s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:59:16,060 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 431/17840 [38:34<27:15:23, 5.64s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:59:16,060 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 431/17840 [38:34<27:15:23, 5.64s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:59:16,060 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:59:20,061 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:59:16,060 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:59:22,797 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:59:16,060 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:59:22,797 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:59:16,060 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:59:22,797 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:59:16,060 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 433/17840 [38:45<26:40:08, 5.52s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:59:26,879 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 433/17840 [38:45<26:40:08, 5.52s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:59:26,879 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:59:30,843 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:59:26,879 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:59:30,843 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:59:26,879 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 7.0073, 'learning_rate': 1.302e-05, 'epoch': 0.49} +[WARNING|modeling_utils.py:388] 2022-03-10 21:59:34,783 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:59:26,879 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:59:34,783 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:59:26,879 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 435/17840 [38:55<26:07:47, 5.40s/it]g-point operations will not be computed-10 21:59:26,879 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:59:38,714 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:59:26,879 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:59:41,206 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:59:26,879 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:59:41,206 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:59:26,879 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 7.1171, 'learning_rate': 1.308e-05, 'epoch': 0.49} +[WARNING|modeling_utils.py:388] 2022-03-10 21:59:45,031 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:59:26,879 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:59:45,031 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:59:26,879 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 437/17840 [39:05<25:17:46, 5.23s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:59:47,512 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 437/17840 [39:05<25:17:46, 5.23s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:59:47,512 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:59:51,090 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:59:47,512 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:59:51,090 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:59:47,512 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 7.1039, 'learning_rate': 1.314e-05, 'epoch': 0.49} +[WARNING|modeling_utils.py:388] 2022-03-10 21:59:54,662 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:59:47,512 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:59:54,662 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:59:47,512 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 439/17840 [39:15<24:07:23, 4.99s/it][WARNING|modeling_utils.py:388] 2022-03-10 21:59:56,989 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:59:59,176 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:59:56,989 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 21:59:59,176 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 21:59:56,989 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▊ | 440/17840 [39:19<23:24:54, 4.84s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:00:01,439 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:00:03,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:00:01,439 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:00:03,620 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:00:01,439 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▉ | 441/17840 [39:24<22:42:37, 4.70s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:00:05,760 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 2%|█▉ | 441/17840 [39:24<22:42:37, 4.70s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:00:05,760 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:00:08,756 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:00:05,760 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:00:08,756 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:00:05,760 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:00:10,725 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:00:05,760 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:00:10,725 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:00:05,760 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:00:12,538 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:00:05,760 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:00:14,373 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:00:05,760 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:00:14,373 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:00:05,760 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:00:17,803 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:00:05,760 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:00:19,330 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:00:05,760 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:00:19,330 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:00:05,760 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:00:20,900 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:00:05,760 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:00:20,900 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:00:05,760 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:00:23,592 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:00:05,760 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:00:23,592 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:00:05,760 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:00:25,917 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:00:05,760 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:00:25,917 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:00:05,760 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:00:27,966 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:00:05,760 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:00:27,966 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:00:05,760 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:00:29,701 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:00:05,760 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:00:29,701 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:00:05,760 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:00:30,861 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:00:05,760 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:00:30,861 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:00:05,760 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:00:34,492 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:00:05,760 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:00:37,867 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:00:05,760 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:00:37,867 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:00:05,760 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 7.4465, 'learning_rate': 1.3530000000000001e-05, 'epoch': 0.51} +[WARNING|modeling_utils.py:388] 2022-03-10 22:00:41,284 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:00:05,760 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:00:44,561 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:00:05,760 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:00:44,561 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:00:05,760 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 7.5743, 'learning_rate': 1.356e-05, 'epoch': 0.51} +[WARNING|modeling_utils.py:388] 2022-03-10 22:00:47,931 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:00:05,760 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:00:47,931 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:00:05,760 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:00:47,931 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:00:05,760 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:00:51,234 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:00:05,760 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:00:51,234 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:00:05,760 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:00:54,568 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:00:05,760 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:00:57,814 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:00:05,760 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:00:57,814 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:00:05,760 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 7.3032, 'learning_rate': 1.362e-05, 'epoch': 0.51} +[WARNING|modeling_utils.py:388] 2022-03-10 22:01:02,680 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:00:05,760 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|█▉ | 455/17840 [40:23<28:31:31, 5.91s/it]g-point operations will not be computed-10 22:00:05,760 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|█▉ | 455/17840 [40:23<28:31:31, 5.91s/it]g-point operations will not be computed-10 22:00:05,760 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 7.3564, 'learning_rate': 1.3650000000000001e-05, 'epoch': 0.51} + 3%|█▉ | 455/17840 [40:23<28:31:31, 5.91s/it]g-point operations will not be computed-10 22:00:05,760 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|█▉ | 455/17840 [40:23<28:31:31, 5.91s/it]g-point operations will not be computed-10 22:00:05,760 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|█▉ | 455/17840 [40:23<28:31:31, 5.91s/it]g-point operations will not be computed-10 22:00:05,760 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|█▉ | 456/17840 [40:30<29:16:43, 6.06s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:01:12,389 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|█▉ | 456/17840 [40:30<29:16:43, 6.06s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:01:12,389 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|█▉ | 456/17840 [40:30<29:16:43, 6.06s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:01:12,389 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|█▉ | 456/17840 [40:30<29:16:43, 6.06s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:01:12,389 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|█▉ | 457/17840 [40:36<29:51:30, 6.18s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:01:12,389 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:01:20,444 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:01:12,389 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:01:20,444 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:01:12,389 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:01:20,444 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:01:12,389 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|█▉ | 458/17840 [40:43<30:10:20, 6.25s/it]g-point operations will not be computed-10 22:01:12,389 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:01:26,792 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:01:12,389 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:01:26,792 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:01:12,389 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:01:26,792 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:01:12,389 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|█▉ | 459/17840 [40:49<30:22:36, 6.29s/it]g-point operations will not be computed-10 22:01:12,389 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:01:33,186 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:01:12,389 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:01:33,186 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:01:12,389 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|█▉ | 460/17840 [40:55<30:24:12, 6.30s/it]g-point operations will not be computed-10 22:01:12,389 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|█▉ | 460/17840 [40:55<30:24:12, 6.30s/it]g-point operations will not be computed-10 22:01:12,389 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:01:39,449 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:01:12,389 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:01:39,449 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:01:12,389 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|█▉ | 461/17840 [41:02<30:20:16, 6.28s/it]g-point operations will not be computed-10 22:01:12,389 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|█▉ | 461/17840 [41:02<30:20:16, 6.28s/it]g-point operations will not be computed-10 22:01:12,389 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:01:45,696 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:01:12,389 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:01:45,696 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:01:12,389 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|█▉ | 462/17840 [41:08<30:19:15, 6.28s/it]g-point operations will not be computed-10 22:01:12,389 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|█▉ | 462/17840 [41:08<30:19:15, 6.28s/it]g-point operations will not be computed-10 22:01:12,389 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 7.1116, 'learning_rate': 1.3860000000000001e-05, 'epoch': 0.52} +[WARNING|modeling_utils.py:388] 2022-03-10 22:01:53,545 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:01:12,389 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|█▉ | 463/17840 [41:14<30:18:06, 6.28s/it]g-point operations will not be computed-10 22:01:12,389 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|█▉ | 463/17840 [41:14<30:18:06, 6.28s/it]g-point operations will not be computed-10 22:01:12,389 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.9562, 'learning_rate': 1.389e-05, 'epoch': 0.52} +[WARNING|modeling_utils.py:388] 2022-03-10 22:01:59,727 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:01:12,389 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|█▉ | 464/17840 [41:20<30:09:01, 6.25s/it]g-point operations will not be computed-10 22:01:12,389 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|█▉ | 464/17840 [41:20<30:09:01, 6.25s/it]g-point operations will not be computed-10 22:01:12,389 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.9394, 'learning_rate': 1.392e-05, 'epoch': 0.52} +[WARNING|modeling_utils.py:388] 2022-03-10 22:02:05,889 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:01:12,389 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|█▉ | 465/17840 [41:27<29:58:36, 6.21s/it]g-point operations will not be computed-10 22:01:12,389 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|█▉ | 465/17840 [41:27<29:58:36, 6.21s/it]g-point operations will not be computed-10 22:01:12,389 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 7.047, 'learning_rate': 1.395e-05, 'epoch': 0.52} +[WARNING|modeling_utils.py:388] 2022-03-10 22:02:12,065 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:01:12,389 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|█▉ | 466/17840 [41:33<29:58:18, 6.21s/it]g-point operations will not be computed-10 22:01:12,389 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|█▉ | 466/17840 [41:33<29:58:18, 6.21s/it]g-point operations will not be computed-10 22:01:12,389 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.9534, 'learning_rate': 1.3980000000000002e-05, 'epoch': 0.52} +[WARNING|modeling_utils.py:388] 2022-03-10 22:02:18,166 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:01:12,389 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|█▉ | 467/17840 [41:39<29:45:10, 6.17s/it]g-point operations will not be computed-10 22:01:12,389 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|█▉ | 467/17840 [41:39<29:45:10, 6.17s/it]g-point operations will not be computed-10 22:01:12,389 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.9702, 'learning_rate': 1.4010000000000001e-05, 'epoch': 0.52} +[WARNING|modeling_utils.py:388] 2022-03-10 22:02:24,234 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:01:12,389 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|█▉ | 468/17840 [41:45<29:36:07, 6.13s/it]g-point operations will not be computed-10 22:01:12,389 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|█▉ | 468/17840 [41:45<29:36:07, 6.13s/it]g-point operations will not be computed-10 22:01:12,389 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 7.023, 'learning_rate': 1.4040000000000001e-05, 'epoch': 0.52} +[WARNING|modeling_utils.py:388] 2022-03-10 22:02:30,285 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:01:12,389 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|█▉ | 469/17840 [41:51<29:29:56, 6.11s/it]g-point operations will not be computed-10 22:01:12,389 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|█▉ | 469/17840 [41:51<29:29:56, 6.11s/it]g-point operations will not be computed-10 22:01:12,389 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.9083, 'learning_rate': 1.4069999999999999e-05, 'epoch': 0.53} +[WARNING|modeling_utils.py:388] 2022-03-10 22:02:36,276 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:01:12,389 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 470/17840 [41:57<29:17:07, 6.07s/it]g-point operations will not be computed-10 22:01:12,389 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 470/17840 [41:57<29:17:07, 6.07s/it]g-point operations will not be computed-10 22:01:12,389 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:02:40,753 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:01:12,389 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:02:40,753 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:01:12,389 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 471/17840 [42:03<29:05:37, 6.03s/it]g-point operations will not be computed-10 22:01:12,389 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 471/17840 [42:03<29:05:37, 6.03s/it]g-point operations will not be computed-10 22:01:12,389 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:02:46,688 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:01:12,389 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:02:46,688 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:01:12,389 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 472/17840 [42:09<28:58:28, 6.01s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:02:51,145 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 472/17840 [42:09<28:58:28, 6.01s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:02:51,145 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.9025, 'learning_rate': 1.416e-05, 'epoch': 0.53} + 3%|██ | 472/17840 [42:09<28:58:28, 6.01s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:02:51,145 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 472/17840 [42:09<28:58:28, 6.01s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:02:51,145 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 473/17840 [42:15<28:49:21, 5.97s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:02:51,145 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:02:58,490 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:02:51,145 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:02:58,490 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:02:51,145 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:02:58,490 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:02:51,145 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 474/17840 [42:20<28:31:01, 5.91s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:03:02,872 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 474/17840 [42:20<28:31:01, 5.91s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:03:02,872 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 474/17840 [42:20<28:31:01, 5.91s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:03:02,872 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 474/17840 [42:20<28:31:01, 5.91s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:03:02,872 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 475/17840 [42:27<28:56:42, 6.00s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:03:09,033 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 475/17840 [42:27<28:56:42, 6.00s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:03:09,033 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 475/17840 [42:27<28:56:42, 6.00s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:03:09,033 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 475/17840 [42:27<28:56:42, 6.00s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:03:09,033 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 476/17840 [42:32<28:39:34, 5.94s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:03:14,803 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:03:17,561 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:03:14,803 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 477/17840 [42:38<28:13:15, 5.85s/it]g-point operations will not be computed-10 22:03:14,803 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 477/17840 [42:38<28:13:15, 5.85s/it]g-point operations will not be computed-10 22:03:14,803 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:03:21,790 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:03:14,803 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:03:21,790 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:03:14,803 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 478/17840 [42:44<27:52:30, 5.78s/it]g-point operations will not be computed-10 22:03:14,803 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 478/17840 [42:44<27:52:30, 5.78s/it]g-point operations will not be computed-10 22:03:14,803 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:03:27,401 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:03:14,803 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:03:30,104 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:03:14,803 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:03:30,104 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:03:14,803 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.7785, 'learning_rate': 1.437e-05, 'epoch': 0.54} +[WARNING|modeling_utils.py:388] 2022-03-10 22:03:30,104 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:03:14,803 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:03:35,698 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:03:14,803 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:03:35,698 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:03:14,803 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.8459, 'learning_rate': 1.44e-05, 'epoch': 0.54} +[WARNING|modeling_utils.py:388] 2022-03-10 22:03:39,829 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:03:14,803 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 481/17840 [43:00<27:01:59, 5.61s/it]g-point operations will not be computed-10 22:03:14,803 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 481/17840 [43:00<27:01:59, 5.61s/it]g-point operations will not be computed-10 22:03:14,803 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:03:43,945 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:03:14,803 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:03:43,945 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:03:14,803 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 482/17840 [43:06<26:49:13, 5.56s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:03:48,027 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 482/17840 [43:06<26:49:13, 5.56s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:03:48,027 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.8468, 'learning_rate': 1.446e-05, 'epoch': 0.54} + 3%|██ | 482/17840 [43:06<26:49:13, 5.56s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:03:48,027 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:03:51,889 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:03:48,027 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:03:54,514 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:03:48,027 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:03:54,514 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:03:48,027 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:03:54,514 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:03:48,027 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 484/17840 [43:16<25:57:37, 5.38s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:03:58,363 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 484/17840 [43:16<25:57:37, 5.38s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:03:58,363 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 484/17840 [43:16<25:57:37, 5.38s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:03:58,363 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:04:02,133 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:03:58,363 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:04:02,133 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:03:58,363 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:04:05,913 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:03:58,363 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:04:05,913 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:03:58,363 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 486/17840 [43:26<25:05:11, 5.20s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:04:08,420 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:04:10,854 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:04:08,420 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:04:10,854 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:04:08,420 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 487/17840 [43:31<24:45:31, 5.14s/it]g-point operations will not be computed-10 22:04:08,420 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:04:14,564 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:04:08,420 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:04:16,932 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:04:08,420 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:04:16,932 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:04:08,420 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.8018, 'learning_rate': 1.464e-05, 'epoch': 0.55} +[WARNING|modeling_utils.py:388] 2022-03-10 22:04:20,464 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:04:08,420 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:04:20,464 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:04:08,420 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 489/17840 [43:41<23:45:58, 4.93s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:04:22,786 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 489/17840 [43:41<23:45:58, 4.93s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:04:22,786 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██ | 489/17840 [43:41<23:45:58, 4.93s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:04:22,786 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:04:25,993 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:04:22,786 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:04:28,107 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:04:22,786 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:04:28,107 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:04:22,786 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:04:30,094 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:04:22,786 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:04:32,080 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:04:22,786 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:04:32,080 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:04:22,786 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:04:33,929 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:04:22,786 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:04:35,756 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:04:22,786 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:04:35,756 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:04:22,786 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:04:39,090 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:04:22,786 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:04:39,090 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:04:22,786 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:04:40,615 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:04:22,786 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:04:42,158 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:04:22,786 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:04:42,158 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:04:22,786 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:04:44,918 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:04:22,786 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:04:44,918 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:04:22,786 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:04:46,153 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:04:22,786 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:04:46,153 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:04:22,786 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:04:48,494 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:04:22,786 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:04:48,494 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:04:22,786 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:04:50,521 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:04:22,786 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:04:50,521 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:04:22,786 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:04:53,270 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:04:22,786 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:04:53,270 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:04:22,786 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:04:54,470 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:04:22,786 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:04:54,470 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:04:22,786 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:04:58,070 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:04:22,786 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:05:01,426 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:04:22,786 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:05:01,426 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:04:22,786 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 7.7231, 'learning_rate': 1.503e-05, 'epoch': 0.56} +[WARNING|modeling_utils.py:388] 2022-03-10 22:05:04,894 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:04:22,786 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:05:04,894 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:04:22,786 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:05:04,894 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:04:22,786 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:05:08,309 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:04:22,786 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:05:11,653 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:04:22,786 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:05:11,653 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:04:22,786 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:05:11,653 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:04:22,786 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:05:14,967 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:04:22,786 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:05:14,967 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:04:22,786 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:05:18,272 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:04:22,786 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:05:18,272 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:04:22,786 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:05:21,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:04:22,786 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:05:21,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:04:22,786 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:05:24,856 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:04:22,786 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:05:28,095 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:04:22,786 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:05:28,095 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:04:22,786 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 7.3311, 'learning_rate': 1.515e-05, 'epoch': 0.57} +[WARNING|modeling_utils.py:388] 2022-03-10 22:05:28,095 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:04:22,786 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:05:28,095 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:04:22,786 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:05:28,095 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:04:22,786 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 506/17840 [44:54<29:17:00, 6.08s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:05:36,186 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 506/17840 [44:54<29:17:00, 6.08s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:05:36,186 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 506/17840 [44:54<29:17:00, 6.08s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:05:36,186 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 506/17840 [44:54<29:17:00, 6.08s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:05:36,186 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 507/17840 [45:00<29:46:34, 6.18s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:05:36,186 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:05:44,192 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:05:36,186 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:05:44,192 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:05:36,186 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:05:44,192 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:05:36,186 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 508/17840 [45:07<30:06:33, 6.25s/it]g-point operations will not be computed-10 22:05:36,186 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 508/17840 [45:07<30:06:33, 6.25s/it]g-point operations will not be computed-10 22:05:36,186 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:05:52,193 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:05:36,186 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:05:52,193 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:05:36,186 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 509/17840 [45:13<30:18:13, 6.29s/it]g-point operations will not be computed-10 22:05:36,186 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 509/17840 [45:13<30:18:13, 6.29s/it]g-point operations will not be computed-10 22:05:36,186 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:05:58,549 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:05:36,186 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 510/17840 [45:19<30:22:17, 6.31s/it]g-point operations will not be computed-10 22:05:36,186 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 510/17840 [45:19<30:22:17, 6.31s/it]g-point operations will not be computed-10 22:05:36,186 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.9121, 'learning_rate': 1.53e-05, 'epoch': 0.57} +[WARNING|modeling_utils.py:388] 2022-03-10 22:06:04,795 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:05:36,186 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 511/17840 [45:26<30:18:19, 6.30s/it]g-point operations will not be computed-10 22:05:36,186 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 511/17840 [45:26<30:18:19, 6.30s/it]g-point operations will not be computed-10 22:05:36,186 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.8908, 'learning_rate': 1.533e-05, 'epoch': 0.57} +[WARNING|modeling_utils.py:388] 2022-03-10 22:06:11,012 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:05:36,186 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 512/17840 [45:32<30:06:06, 6.25s/it]g-point operations will not be computed-10 22:05:36,186 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 512/17840 [45:32<30:06:06, 6.25s/it]g-point operations will not be computed-10 22:05:36,186 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.9143, 'learning_rate': 1.5360000000000002e-05, 'epoch': 0.57} +[WARNING|modeling_utils.py:388] 2022-03-10 22:06:17,213 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:05:36,186 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 513/17840 [45:38<30:01:37, 6.24s/it]g-point operations will not be computed-10 22:05:36,186 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 513/17840 [45:38<30:01:37, 6.24s/it]g-point operations will not be computed-10 22:05:36,186 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 7.0586, 'learning_rate': 1.539e-05, 'epoch': 0.58} +[WARNING|modeling_utils.py:388] 2022-03-10 22:06:23,401 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:05:36,186 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 514/17840 [45:44<29:59:19, 6.23s/it]g-point operations will not be computed-10 22:05:36,186 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 514/17840 [45:44<29:59:19, 6.23s/it]g-point operations will not be computed-10 22:05:36,186 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.9384, 'learning_rate': 1.542e-05, 'epoch': 0.58} +[WARNING|modeling_utils.py:388] 2022-03-10 22:06:29,519 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:05:36,186 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 515/17840 [45:50<29:48:02, 6.19s/it]g-point operations will not be computed-10 22:05:36,186 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 515/17840 [45:50<29:48:02, 6.19s/it]g-point operations will not be computed-10 22:05:36,186 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.948, 'learning_rate': 1.545e-05, 'epoch': 0.58} +[WARNING|modeling_utils.py:388] 2022-03-10 22:06:35,641 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:05:36,186 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 516/17840 [45:56<29:43:39, 6.18s/it]g-point operations will not be computed-10 22:05:36,186 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 516/17840 [45:56<29:43:39, 6.18s/it]g-point operations will not be computed-10 22:05:36,186 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.6965, 'learning_rate': 1.548e-05, 'epoch': 0.58} +[WARNING|modeling_utils.py:388] 2022-03-10 22:06:41,759 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:05:36,186 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 517/17840 [46:02<29:36:12, 6.15s/it]g-point operations will not be computed-10 22:05:36,186 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 517/17840 [46:02<29:36:12, 6.15s/it]g-point operations will not be computed-10 22:05:36,186 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.9389, 'learning_rate': 1.5510000000000002e-05, 'epoch': 0.58} +[WARNING|modeling_utils.py:388] 2022-03-10 22:06:47,875 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:05:36,186 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:06:47,875 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:05:36,186 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 518/17840 [46:09<29:27:21, 6.12s/it]g-point operations will not be computed-10 22:05:36,186 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 518/17840 [46:09<29:27:21, 6.12s/it]g-point operations will not be computed-10 22:05:36,186 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:06:53,881 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:05:36,186 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 519/17840 [46:15<29:19:56, 6.10s/it]g-point operations will not be computed-10 22:05:36,186 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 519/17840 [46:15<29:19:56, 6.10s/it]g-point operations will not be computed-10 22:05:36,186 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:06:58,371 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:05:36,186 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:06:58,371 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:05:36,186 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:06:58,371 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:05:36,186 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 520/17840 [46:20<29:05:25, 6.05s/it]g-point operations will not be computed-10 22:05:36,186 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:07:04,338 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:05:36,186 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:07:04,338 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:05:36,186 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:07:04,338 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:05:36,186 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 521/17840 [46:26<28:54:36, 6.01s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:07:08,760 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 521/17840 [46:26<28:54:36, 6.01s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:07:08,760 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 521/17840 [46:26<28:54:36, 6.01s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:07:08,760 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 521/17840 [46:26<28:54:36, 6.01s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:07:08,760 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 522/17840 [46:32<28:42:50, 5.97s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:07:14,609 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 522/17840 [46:32<28:42:50, 5.97s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:07:14,609 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 522/17840 [46:32<28:42:50, 5.97s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:07:14,609 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 522/17840 [46:32<28:42:50, 5.97s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:07:14,609 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 523/17840 [46:38<28:35:23, 5.94s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:07:20,496 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 523/17840 [46:38<28:35:23, 5.94s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:07:20,496 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:07:24,795 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:07:20,496 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:07:24,795 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:07:20,496 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.799, 'learning_rate': 1.5720000000000002e-05, 'epoch': 0.59} +[WARNING|modeling_utils.py:388] 2022-03-10 22:07:29,136 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:07:20,496 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 525/17840 [46:50<28:51:46, 6.00s/it]g-point operations will not be computed-10 22:07:20,496 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 525/17840 [46:50<28:51:46, 6.00s/it]g-point operations will not be computed-10 22:07:20,496 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.8829, 'learning_rate': 1.575e-05, 'epoch': 0.59} + 3%|██▏ | 525/17840 [46:50<28:51:46, 6.00s/it]g-point operations will not be computed-10 22:07:20,496 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:07:36,825 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:07:20,496 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:07:36,825 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:07:20,496 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.675, 'learning_rate': 1.578e-05, 'epoch': 0.59} +[WARNING|modeling_utils.py:388] 2022-03-10 22:07:41,114 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:07:20,496 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 527/17840 [47:02<28:11:54, 5.86s/it]g-point operations will not be computed-10 22:07:20,496 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 527/17840 [47:02<28:11:54, 5.86s/it]g-point operations will not be computed-10 22:07:20,496 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:07:45,377 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:07:20,496 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:07:45,377 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:07:20,496 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 528/17840 [47:07<27:54:43, 5.80s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:07:49,634 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▏ | 528/17840 [47:07<27:54:43, 5.80s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:07:49,634 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.8569, 'learning_rate': 1.584e-05, 'epoch': 0.59} +[WARNING|modeling_utils.py:388] 2022-03-10 22:07:53,746 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:07:49,634 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:07:53,746 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:07:49,634 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.8854, 'learning_rate': 1.5870000000000002e-05, 'epoch': 0.59} +[WARNING|modeling_utils.py:388] 2022-03-10 22:07:57,942 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:07:49,634 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 530/17840 [47:18<27:20:22, 5.69s/it]g-point operations will not be computed-10 22:07:49,634 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 530/17840 [47:18<27:20:22, 5.69s/it]g-point operations will not be computed-10 22:07:49,634 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:08:02,095 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:07:49,634 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:08:02,095 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:07:49,634 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 531/17840 [47:24<27:04:18, 5.63s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:08:06,248 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 531/17840 [47:24<27:04:18, 5.63s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:08:06,248 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.8033, 'learning_rate': 1.593e-05, 'epoch': 0.6} +[WARNING|modeling_utils.py:388] 2022-03-10 22:08:10,247 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:08:06,248 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:08:10,247 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:08:06,248 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:08:10,247 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:08:06,248 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.6835, 'learning_rate': 1.596e-05, 'epoch': 0.6} +[WARNING|modeling_utils.py:388] 2022-03-10 22:08:10,247 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:08:06,248 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:08:16,444 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:08:06,248 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:08:16,444 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:08:06,248 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:08:20,369 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:08:06,248 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:08:20,369 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:08:06,248 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 534/17840 [47:41<26:52:50, 5.59s/it]g-point operations will not be computed-10 22:08:06,248 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:08:24,276 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:08:06,248 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:08:26,839 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:08:06,248 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:08:26,839 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:08:06,248 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.712, 'learning_rate': 1.605e-05, 'epoch': 0.6} +[WARNING|modeling_utils.py:388] 2022-03-10 22:08:30,733 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:08:06,248 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:08:30,733 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:08:06,248 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 536/17840 [47:51<25:50:44, 5.38s/it]g-point operations will not be computed-10 22:08:06,248 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:08:34,558 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:08:06,248 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:08:34,558 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:08:06,248 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:08:34,558 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:08:06,248 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 537/17840 [47:56<25:19:45, 5.27s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:08:38,296 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:08:40,639 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:08:38,296 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:08:40,639 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:08:38,296 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 538/17840 [48:01<24:43:51, 5.15s/it]g-point operations will not be computed-10 22:08:38,296 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:08:44,271 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:08:38,296 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:08:44,271 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:08:38,296 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:08:46,461 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:08:38,296 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:08:48,657 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:08:38,296 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:08:50,878 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:08:38,296 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:08:50,878 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:08:38,296 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:08:52,973 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:08:38,296 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:08:54,851 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:08:38,296 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:08:54,851 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:08:38,296 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:08:56,731 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:08:38,296 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:08:56,731 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:08:38,296 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:08:58,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:08:38,296 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:09:00,345 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:08:38,296 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:09:00,345 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:08:38,296 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:09:01,956 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:08:38,296 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:09:04,983 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:08:38,296 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:09:04,983 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:08:38,296 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:09:06,390 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:08:38,296 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:09:06,390 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:08:38,296 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:09:08,947 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:08:38,296 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:09:08,947 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:08:38,296 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:09:10,132 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:08:38,296 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:09:10,132 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:08:38,296 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:09:12,415 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:08:38,296 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:09:12,415 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:08:38,296 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:09:14,513 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:08:38,296 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:09:14,513 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:08:38,296 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:09:16,415 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:08:38,296 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:09:16,415 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:08:38,296 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:09:18,457 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:08:38,296 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:09:18,457 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:08:38,296 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:09:21,988 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:08:38,296 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:09:25,366 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:08:38,296 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:09:25,366 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:08:38,296 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 7.2292, 'learning_rate': 1.6530000000000003e-05, 'epoch': 0.62} +[WARNING|modeling_utils.py:388] 2022-03-10 22:09:28,791 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:08:38,296 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:09:28,791 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:08:38,296 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:09:28,791 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:08:38,296 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:09:32,129 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:08:38,296 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:09:35,561 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:08:38,296 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:09:35,561 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:08:38,296 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:09:38,920 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:08:38,296 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:09:38,920 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:08:38,296 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:09:42,238 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:08:38,296 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:09:45,434 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:08:38,296 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:09:45,434 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:08:38,296 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 7.2045, 'learning_rate': 1.6620000000000004e-05, 'epoch': 0.62} +[WARNING|modeling_utils.py:388] 2022-03-10 22:09:48,769 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:08:38,296 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:09:51,996 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:08:38,296 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:09:51,996 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:08:38,296 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 7.0826, 'learning_rate': 1.665e-05, 'epoch': 0.62} +[WARNING|modeling_utils.py:388] 2022-03-10 22:09:55,403 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:08:38,296 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:09:55,403 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:08:38,296 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:09:55,403 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:08:38,296 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 556/17840 [49:18<29:33:50, 6.16s/it]g-point operations will not be computed-10 22:08:38,296 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 556/17840 [49:18<29:33:50, 6.16s/it]g-point operations will not be computed-10 22:08:38,296 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:10:03,630 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:08:38,296 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:10:03,630 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:08:38,296 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 557/17840 [49:24<30:06:24, 6.27s/it]g-point operations will not be computed-10 22:08:38,296 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▎ | 557/17840 [49:24<30:06:24, 6.27s/it]g-point operations will not be computed-10 22:08:38,296 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:10:10,153 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:08:38,296 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 558/17840 [49:31<30:25:29, 6.34s/it]g-point operations will not be computed-10 22:08:38,296 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 558/17840 [49:31<30:25:29, 6.34s/it]g-point operations will not be computed-10 22:08:38,296 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.8974, 'learning_rate': 1.6740000000000002e-05, 'epoch': 0.63} +[WARNING|modeling_utils.py:388] 2022-03-10 22:10:16,576 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:08:38,296 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 559/17840 [49:37<30:31:55, 6.36s/it]g-point operations will not be computed-10 22:08:38,296 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 559/17840 [49:37<30:31:55, 6.36s/it]g-point operations will not be computed-10 22:08:38,296 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.7908, 'learning_rate': 1.677e-05, 'epoch': 0.63} + 3%|██▍ | 559/17840 [49:37<30:31:55, 6.36s/it]g-point operations will not be computed-10 22:08:38,296 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:10:24,528 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:08:38,296 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:10:24,528 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:08:38,296 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.7176, 'learning_rate': 1.6800000000000002e-05, 'epoch': 0.63} +[WARNING|modeling_utils.py:388] 2022-03-10 22:10:24,528 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:08:38,296 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:10:30,848 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:08:38,296 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:10:30,848 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:08:38,296 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.7974, 'learning_rate': 1.6830000000000003e-05, 'epoch': 0.63} +[WARNING|modeling_utils.py:388] 2022-03-10 22:10:30,848 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:08:38,296 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:10:37,203 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:08:38,296 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:10:37,203 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:08:38,296 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.6672, 'learning_rate': 1.686e-05, 'epoch': 0.63} +[WARNING|modeling_utils.py:388] 2022-03-10 22:10:37,203 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:08:38,296 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:10:37,203 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:08:38,296 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:10:37,203 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:08:38,296 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 563/17840 [50:03<30:15:53, 6.31s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:10:45,093 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 563/17840 [50:03<30:15:53, 6.31s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:10:45,093 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 563/17840 [50:03<30:15:53, 6.31s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:10:45,093 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 563/17840 [50:03<30:15:53, 6.31s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:10:45,093 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 564/17840 [50:09<30:08:41, 6.28s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:10:51,244 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 564/17840 [50:09<30:08:41, 6.28s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:10:51,244 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 564/17840 [50:09<30:08:41, 6.28s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:10:51,244 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 564/17840 [50:09<30:08:41, 6.28s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:10:51,244 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 565/17840 [50:15<29:52:47, 6.23s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:10:57,335 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 565/17840 [50:15<29:52:47, 6.23s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:10:57,335 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 565/17840 [50:15<29:52:47, 6.23s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:10:57,335 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 565/17840 [50:15<29:52:47, 6.23s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:10:57,335 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 566/17840 [50:21<29:41:30, 6.19s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:11:03,400 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 566/17840 [50:21<29:41:30, 6.19s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:11:03,400 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 566/17840 [50:21<29:41:30, 6.19s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:11:03,400 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 566/17840 [50:21<29:41:30, 6.19s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:11:03,400 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 567/17840 [50:27<29:40:55, 6.19s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:11:09,627 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 567/17840 [50:27<29:40:55, 6.19s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:11:09,627 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 567/17840 [50:27<29:40:55, 6.19s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:11:09,627 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 567/17840 [50:27<29:40:55, 6.19s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:11:09,627 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 568/17840 [50:33<29:32:08, 6.16s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:11:15,658 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 568/17840 [50:33<29:32:08, 6.16s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:11:15,658 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 568/17840 [50:33<29:32:08, 6.16s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:11:15,658 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 568/17840 [50:33<29:32:08, 6.16s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:11:15,658 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 569/17840 [50:39<29:15:26, 6.10s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:11:21,641 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 569/17840 [50:39<29:15:26, 6.10s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:11:21,641 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:11:26,027 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:11:21,641 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:11:26,027 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:11:21,641 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.8002, 'learning_rate': 1.71e-05, 'epoch': 0.64} +[WARNING|modeling_utils.py:388] 2022-03-10 22:11:26,027 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:11:21,641 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:11:31,952 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:11:21,641 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:11:31,952 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:11:21,641 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.6648, 'learning_rate': 1.713e-05, 'epoch': 0.64} +[WARNING|modeling_utils.py:388] 2022-03-10 22:11:36,341 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:11:21,641 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 572/17840 [50:57<28:38:39, 5.97s/it]g-point operations will not be computed-10 22:11:21,641 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 572/17840 [50:57<28:38:39, 5.97s/it]g-point operations will not be computed-10 22:11:21,641 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.8371, 'learning_rate': 1.716e-05, 'epoch': 0.64} +[WARNING|modeling_utils.py:388] 2022-03-10 22:11:42,405 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:11:21,641 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 573/17840 [51:03<28:45:10, 5.99s/it]g-point operations will not be computed-10 22:11:21,641 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 573/17840 [51:03<28:45:10, 5.99s/it]g-point operations will not be computed-10 22:11:21,641 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:11:46,799 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:11:21,641 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:11:46,799 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:11:21,641 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:11:46,799 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:11:21,641 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 574/17840 [51:09<28:29:04, 5.94s/it]g-point operations will not be computed-10 22:11:21,641 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:11:52,688 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:11:21,641 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:11:52,688 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:11:21,641 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:11:52,688 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:11:21,641 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 575/17840 [51:15<28:56:02, 6.03s/it]g-point operations will not be computed-10 22:11:21,641 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:11:58,837 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:11:21,641 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:11:58,837 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:11:21,641 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:11:58,837 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:11:21,641 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 576/17840 [51:21<28:30:07, 5.94s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:12:03,149 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 576/17840 [51:21<28:30:07, 5.94s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:12:03,149 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 576/17840 [51:21<28:30:07, 5.94s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:12:03,149 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 576/17840 [51:21<28:30:07, 5.94s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:12:03,149 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 577/17840 [51:27<28:11:14, 5.88s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:12:08,838 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 577/17840 [51:27<28:11:14, 5.88s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:12:08,838 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 577/17840 [51:27<28:11:14, 5.88s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:12:08,838 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:12:13,144 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:12:08,838 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:12:13,144 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:12:08,838 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:12:17,383 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:12:08,838 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:12:17,383 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:12:08,838 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 579/17840 [51:38<27:41:51, 5.78s/it]g-point operations will not be computed-10 22:12:08,838 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 579/17840 [51:38<27:41:51, 5.78s/it]g-point operations will not be computed-10 22:12:08,838 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:12:23,013 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:12:08,838 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:12:23,013 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:12:08,838 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 580/17840 [51:44<27:27:01, 5.73s/it]g-point operations will not be computed-10 22:12:08,838 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:12:27,206 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:12:08,838 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:12:27,206 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:12:08,838 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:12:27,206 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:12:08,838 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 581/17840 [51:49<27:11:31, 5.67s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:12:31,357 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 581/17840 [51:49<27:11:31, 5.67s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:12:31,357 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 581/17840 [51:49<27:11:31, 5.67s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:12:31,357 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:12:35,338 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:12:31,357 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:12:38,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:12:31,357 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:12:38,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:12:31,357 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:12:38,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:12:31,357 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 583/17840 [52:00<26:24:35, 5.51s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:12:42,005 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 583/17840 [52:00<26:24:35, 5.51s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:12:42,005 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:12:45,822 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:12:42,005 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:12:45,822 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:12:42,005 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.6399, 'learning_rate': 1.7519999999999998e-05, 'epoch': 0.65} +[WARNING|modeling_utils.py:388] 2022-03-10 22:12:49,701 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:12:42,005 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:12:49,701 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:12:42,005 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 585/17840 [52:10<25:32:48, 5.33s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:12:52,293 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▍ | 585/17840 [52:10<25:32:48, 5.33s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:12:52,293 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:12:56,041 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:12:52,293 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:12:56,041 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:12:52,293 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:12:58,586 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:12:52,293 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:12:58,586 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:12:52,293 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:12:58,586 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:12:52,293 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 587/17840 [52:20<24:44:10, 5.16s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:13:02,266 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:13:04,643 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:13:02,266 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 588/17840 [52:25<24:14:43, 5.06s/it]g-point operations will not be computed-10 22:13:02,266 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 588/17840 [52:25<24:14:43, 5.06s/it]g-point operations will not be computed-10 22:13:02,266 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:13:08,196 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:13:02,266 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:13:10,491 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:13:02,266 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:13:10,491 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:13:02,266 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:13:12,872 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:13:02,266 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:13:15,072 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:13:02,266 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:13:15,072 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:13:02,266 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.6269, 'learning_rate': 1.77e-05, 'epoch': 0.66} +[WARNING|modeling_utils.py:388] 2022-03-10 22:13:18,368 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:13:02,266 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:13:18,368 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:13:02,266 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 591/17840 [52:39<22:27:47, 4.69s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:13:20,520 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 592/17840 [52:43<21:36:31, 4.51s/it]g-point operations will not be computed-10 22:13:20,520 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 592/17840 [52:43<21:36:31, 4.51s/it]g-point operations will not be computed-10 22:13:20,520 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 592/17840 [52:43<21:36:31, 4.51s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:13:24,543 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:13:26,414 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:13:24,543 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:13:26,414 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:13:24,543 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 593/17840 [52:46<20:35:21, 4.30s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:13:28,278 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 594/17840 [52:50<19:28:58, 4.07s/it]g-point operations will not be computed-10 22:13:28,278 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 594/17840 [52:50<19:28:58, 4.07s/it]g-point operations will not be computed-10 22:13:28,278 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:13:33,266 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:13:31,716 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:13:33,266 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:13:31,716 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 595/17840 [52:53<18:11:13, 3.80s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:13:34,828 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 596/17840 [52:56<16:44:24, 3.49s/it]g-point operations will not be computed-10 22:13:34,828 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 596/17840 [52:56<16:44:24, 3.49s/it]g-point operations will not be computed-10 22:13:34,828 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 597/17840 [52:58<15:19:49, 3.20s/it]g-point operations will not be computed-10 22:13:37,557 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 597/17840 [52:58<15:19:49, 3.20s/it]g-point operations will not be computed-10 22:13:37,557 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 598/17840 [53:01<13:45:47, 2.87s/it]g-point operations will not be computed-10 22:13:39,932 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 598/17840 [53:01<13:45:47, 2.87s/it]g-point operations will not be computed-10 22:13:39,932 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 599/17840 [53:02<12:16:50, 2.56s/it]g-point operations will not be computed-10 22:13:41,955 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 599/17840 [53:02<12:16:50, 2.56s/it]g-point operations will not be computed-10 22:13:41,955 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 600/17840 [53:05<11:36:28, 2.42s/it]g-point operations will not be computed-10 22:13:43,755 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 600/17840 [53:05<11:36:28, 2.42s/it]g-point operations will not be computed-10 22:13:43,755 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 600/17840 [53:05<11:36:28, 2.42s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:13:47,208 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 600/17840 [53:05<11:36:28, 2.42s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:13:47,208 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:13:50,604 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:13:47,208 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 601/17840 [53:11<18:06:28, 3.78s/it]g-point operations will not be computed-10 22:13:47,208 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 601/17840 [53:11<18:06:28, 3.78s/it]g-point operations will not be computed-10 22:13:47,208 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 601/17840 [53:11<18:06:28, 3.78s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:13:54,029 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:13:57,390 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:13:54,029 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 602/17840 [53:18<22:19:57, 4.66s/it]g-point operations will not be computed-10 22:13:54,029 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 602/17840 [53:18<22:19:57, 4.66s/it]g-point operations will not be computed-10 22:13:54,029 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 602/17840 [53:18<22:19:57, 4.66s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:14:00,784 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:14:04,027 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:14:00,784 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:14:04,027 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:14:00,784 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 603/17840 [53:25<25:11:36, 5.26s/it]g-point operations will not be computed-10 22:14:00,784 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 603/17840 [53:25<25:11:36, 5.26s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:14:07,343 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:14:10,574 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:14:07,343 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 604/17840 [53:31<27:00:32, 5.64s/it]g-point operations will not be computed-10 22:14:07,343 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 604/17840 [53:31<27:00:32, 5.64s/it]g-point operations will not be computed-10 22:14:07,343 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 604/17840 [53:31<27:00:32, 5.64s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:14:13,924 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 604/17840 [53:31<27:00:32, 5.64s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:14:13,924 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 604/17840 [53:31<27:00:32, 5.64s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:14:13,924 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 604/17840 [53:31<27:00:32, 5.64s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:14:13,924 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 605/17840 [53:38<28:14:38, 5.90s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:14:20,409 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 605/17840 [53:38<28:14:38, 5.90s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:14:20,409 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 605/17840 [53:38<28:14:38, 5.90s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:14:20,409 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 605/17840 [53:38<28:14:38, 5.90s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:14:20,409 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 606/17840 [53:44<29:09:17, 6.09s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:14:26,962 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 606/17840 [53:44<29:09:17, 6.09s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:14:26,962 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 606/17840 [53:44<29:09:17, 6.09s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:14:26,962 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 606/17840 [53:44<29:09:17, 6.09s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:14:26,962 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 607/17840 [53:51<29:41:26, 6.20s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:14:26,962 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:14:34,970 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:14:26,962 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:14:34,970 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:14:26,962 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:14:34,970 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:14:26,962 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 608/17840 [53:57<30:01:47, 6.27s/it]g-point operations will not be computed-10 22:14:26,962 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:14:41,381 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:14:26,962 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:14:41,381 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:14:26,962 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:14:41,381 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:14:26,962 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 609/17840 [54:04<30:10:52, 6.31s/it]g-point operations will not be computed-10 22:14:26,962 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 609/17840 [54:04<30:10:52, 6.31s/it]g-point operations will not be computed-10 22:14:26,962 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 609/17840 [54:04<30:10:52, 6.31s/it]g-point operations will not be computed-10 22:14:26,962 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 609/17840 [54:04<30:10:52, 6.31s/it]g-point operations will not be computed-10 22:14:26,962 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:14:50,840 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:14:26,962 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:14:50,840 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:14:26,962 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:14:55,550 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:14:26,962 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:14:55,550 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:14:26,962 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 611/17840 [54:16<30:04:42, 6.28s/it]g-point operations will not be computed-10 22:14:26,962 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 611/17840 [54:16<30:04:42, 6.28s/it]g-point operations will not be computed-10 22:14:26,962 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 611/17840 [54:16<30:04:42, 6.28s/it]g-point operations will not be computed-10 22:14:26,962 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 611/17840 [54:16<30:04:42, 6.28s/it]g-point operations will not be computed-10 22:14:26,962 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:15:03,373 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:14:26,962 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:15:03,373 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:14:26,962 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:15:08,124 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:14:26,962 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 613/17840 [54:29<30:07:48, 6.30s/it]g-point operations will not be computed-10 22:14:26,962 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 613/17840 [54:29<30:07:48, 6.30s/it]g-point operations will not be computed-10 22:14:26,962 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.6318, 'learning_rate': 1.8390000000000002e-05, 'epoch': 0.69} +[WARNING|modeling_utils.py:388] 2022-03-10 22:15:14,310 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:14:26,962 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 614/17840 [54:35<29:51:15, 6.24s/it]g-point operations will not be computed-10 22:14:26,962 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▌ | 614/17840 [54:35<29:51:15, 6.24s/it]g-point operations will not be computed-10 22:14:26,962 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.662, 'learning_rate': 1.842e-05, 'epoch': 0.69} + 3%|██▌ | 614/17840 [54:35<29:51:15, 6.24s/it]g-point operations will not be computed-10 22:14:26,962 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:15:21,916 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:14:26,962 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:15:21,916 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:14:26,962 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.8667, 'learning_rate': 1.845e-05, 'epoch': 0.69} +[WARNING|modeling_utils.py:388] 2022-03-10 22:15:21,916 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:14:26,962 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:15:27,998 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:14:26,962 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:15:27,998 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:14:26,962 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.5467, 'learning_rate': 1.848e-05, 'epoch': 0.69} +[WARNING|modeling_utils.py:388] 2022-03-10 22:15:32,598 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:14:26,962 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▋ | 617/17840 [54:53<29:25:34, 6.15s/it]g-point operations will not be computed-10 22:14:26,962 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▋ | 617/17840 [54:53<29:25:34, 6.15s/it]g-point operations will not be computed-10 22:14:26,962 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.6423, 'learning_rate': 1.851e-05, 'epoch': 0.69} +[WARNING|modeling_utils.py:388] 2022-03-10 22:15:38,663 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:14:26,962 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▋ | 618/17840 [54:59<29:16:35, 6.12s/it]g-point operations will not be computed-10 22:14:26,962 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▋ | 618/17840 [54:59<29:16:35, 6.12s/it]g-point operations will not be computed-10 22:14:26,962 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.5253, 'learning_rate': 1.854e-05, 'epoch': 0.69} +[WARNING|modeling_utils.py:388] 2022-03-10 22:15:44,687 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:14:26,962 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▋ | 619/17840 [55:05<29:05:08, 6.08s/it]g-point operations will not be computed-10 22:14:26,962 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▋ | 619/17840 [55:05<29:05:08, 6.08s/it]g-point operations will not be computed-10 22:14:26,962 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:15:49,152 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:14:26,962 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:15:49,152 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:14:26,962 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:15:49,152 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:14:26,962 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▋ | 620/17840 [55:11<28:55:52, 6.05s/it]g-point operations will not be computed-10 22:14:26,962 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:15:55,131 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:14:26,962 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:15:55,131 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:14:26,962 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:15:55,131 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:14:26,962 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▋ | 621/17840 [55:17<28:45:24, 6.01s/it]g-point operations will not be computed-10 22:14:26,962 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:16:00,990 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:14:26,962 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:16:00,990 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:14:26,962 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:16:00,990 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:14:26,962 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▋ | 622/17840 [55:23<28:36:02, 5.98s/it]g-point operations will not be computed-10 22:14:26,962 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:16:06,945 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:14:26,962 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:16:06,945 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:14:26,962 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:16:06,945 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:14:26,962 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▋ | 623/17840 [55:29<28:28:19, 5.95s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:16:11,349 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▋ | 623/17840 [55:29<28:28:19, 5.95s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:16:11,349 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▋ | 623/17840 [55:29<28:28:19, 5.95s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:16:11,349 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▋ | 623/17840 [55:29<28:28:19, 5.95s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:16:11,349 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▋ | 624/17840 [55:35<28:19:26, 5.92s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:16:17,241 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 3%|██▋ | 624/17840 [55:35<28:19:26, 5.92s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:16:17,241 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:16:22,006 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:16:17,241 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:16:22,006 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:16:17,241 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.7957, 'learning_rate': 1.8750000000000002e-05, 'epoch': 0.7} +[WARNING|modeling_utils.py:388] 2022-03-10 22:16:26,380 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:16:17,241 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 626/17840 [55:47<28:30:45, 5.96s/it]g-point operations will not be computed-10 22:16:17,241 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 626/17840 [55:47<28:30:45, 5.96s/it]g-point operations will not be computed-10 22:16:17,241 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.589, 'learning_rate': 1.878e-05, 'epoch': 0.7} +[WARNING|modeling_utils.py:388] 2022-03-10 22:16:32,077 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:16:17,241 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 627/17840 [55:53<28:04:42, 5.87s/it]g-point operations will not be computed-10 22:16:17,241 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 627/17840 [55:53<28:04:42, 5.87s/it]g-point operations will not be computed-10 22:16:17,241 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.7174, 'learning_rate': 1.881e-05, 'epoch': 0.7} +[WARNING|modeling_utils.py:388] 2022-03-10 22:16:37,682 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:16:17,241 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 628/17840 [55:58<27:39:36, 5.79s/it]g-point operations will not be computed-10 22:16:17,241 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 628/17840 [55:58<27:39:36, 5.79s/it]g-point operations will not be computed-10 22:16:17,241 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:16:41,884 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:16:17,241 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:16:41,884 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:16:17,241 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:16:41,884 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:16:17,241 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 629/17840 [56:04<27:27:21, 5.74s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:16:46,157 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 629/17840 [56:04<27:27:21, 5.74s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:16:46,157 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:16:50,330 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:16:46,157 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:16:50,330 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:16:46,157 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.8648, 'learning_rate': 1.8900000000000002e-05, 'epoch': 0.71} +[WARNING|modeling_utils.py:388] 2022-03-10 22:16:54,537 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:16:46,157 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 631/17840 [56:15<27:05:01, 5.67s/it]g-point operations will not be computed-10 22:16:46,157 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 631/17840 [56:15<27:05:01, 5.67s/it]g-point operations will not be computed-10 22:16:46,157 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:16:58,657 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:16:46,157 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:16:58,657 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:16:46,157 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 632/17840 [56:21<26:47:11, 5.60s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:17:02,780 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 632/17840 [56:21<26:47:11, 5.60s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:17:02,780 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.4103, 'learning_rate': 1.896e-05, 'epoch': 0.71} +[WARNING|modeling_utils.py:388] 2022-03-10 22:17:06,747 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:17:02,780 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:17:06,747 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:17:02,780 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.628, 'learning_rate': 1.899e-05, 'epoch': 0.71} +[WARNING|modeling_utils.py:388] 2022-03-10 22:17:10,785 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:17:02,780 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 634/17840 [56:31<26:10:14, 5.48s/it]g-point operations will not be computed-10 22:17:02,780 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 634/17840 [56:31<26:10:14, 5.48s/it]g-point operations will not be computed-10 22:17:02,780 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:17:14,749 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:17:02,780 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:17:14,749 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:17:02,780 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 635/17840 [56:36<25:48:30, 5.40s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:17:18,630 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 635/17840 [56:36<25:48:30, 5.40s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:17:18,630 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.6966, 'learning_rate': 1.9050000000000002e-05, 'epoch': 0.71} +[WARNING|modeling_utils.py:388] 2022-03-10 22:17:22,430 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:17:18,630 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:17:22,430 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:17:18,630 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:17:25,000 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:17:18,630 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:17:25,000 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:17:18,630 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:17:25,000 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:17:18,630 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 637/17840 [56:47<25:03:09, 5.24s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:17:28,820 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:17:31,253 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:17:28,820 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 638/17840 [56:52<24:42:34, 5.17s/it]g-point operations will not be computed-10 22:17:28,820 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 638/17840 [56:52<24:42:34, 5.17s/it]g-point operations will not be computed-10 22:17:28,820 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:17:34,924 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:17:28,820 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:17:37,328 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:17:28,820 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:17:37,328 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:17:28,820 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:17:39,742 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:17:28,820 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:17:41,970 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:17:28,820 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:17:41,970 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:17:28,820 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:17:41,970 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:17:28,820 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:17:45,331 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:17:28,820 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 641/17840 [57:06<22:52:02, 4.79s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:17:47,531 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 641/17840 [57:06<22:52:02, 4.79s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:17:47,531 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:17:49,591 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:17:47,531 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 642/17840 [57:10<21:59:01, 4.60s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:17:51,609 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 642/17840 [57:10<21:59:01, 4.60s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:17:51,609 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:17:53,460 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:17:51,609 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 643/17840 [57:14<20:48:47, 4.36s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:17:55,316 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 643/17840 [57:14<20:48:47, 4.36s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:17:55,316 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:17:57,073 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:17:55,316 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:17:57,073 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:17:55,316 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 644/17840 [57:17<19:43:44, 4.13s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:17:58,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 645/17840 [57:20<18:30:13, 3.87s/it]g-point operations will not be computed-10 22:17:58,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▋ | 645/17840 [57:20<18:30:13, 3.87s/it]g-point operations will not be computed-10 22:17:58,844 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:18:03,461 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:18:02,044 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:18:03,461 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:18:02,044 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 646/17840 [57:23<17:06:44, 3.58s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:18:04,866 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 647/17840 [57:26<15:41:19, 3.29s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:18:07,375 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 647/17840 [57:26<15:41:19, 3.29s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:18:07,375 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 648/17840 [57:28<14:13:12, 2.98s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:18:09,567 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 648/17840 [57:28<14:13:12, 2.98s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:18:09,567 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 649/17840 [57:30<12:41:14, 2.66s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:18:11,388 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 649/17840 [57:30<12:41:14, 2.66s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:18:11,388 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 650/17840 [57:32<11:52:44, 2.49s/it]g-point operations will not be computed-10 22:18:11,388 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 650/17840 [57:32<11:52:44, 2.49s/it]g-point operations will not be computed-10 22:18:11,388 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 650/17840 [57:32<11:52:44, 2.49s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:18:15,025 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 650/17840 [57:32<11:52:44, 2.49s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:18:15,025 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:18:18,496 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:18:15,025 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:18:18,496 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:18:15,025 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 651/17840 [57:39<18:37:24, 3.90s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:18:21,960 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 651/17840 [57:39<18:37:24, 3.90s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:18:21,960 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:18:25,307 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:18:21,960 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 652/17840 [57:46<22:43:19, 4.76s/it]g-point operations will not be computed-10 22:18:21,960 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 652/17840 [57:46<22:43:19, 4.76s/it]g-point operations will not be computed-10 22:18:21,960 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 652/17840 [57:46<22:43:19, 4.76s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:18:28,662 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:18:31,969 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:18:28,662 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:18:31,969 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:18:28,662 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 653/17840 [57:53<25:25:53, 5.33s/it]g-point operations will not be computed-10 22:18:28,662 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 653/17840 [57:53<25:25:53, 5.33s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:18:35,319 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:18:38,565 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:18:35,319 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:18:38,565 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:18:35,319 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 654/17840 [57:59<27:13:14, 5.70s/it]g-point operations will not be computed-10 22:18:35,319 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 654/17840 [57:59<27:13:14, 5.70s/it]g-point operations will not be computed-10 22:18:35,319 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 654/17840 [57:59<27:13:14, 5.70s/it]g-point operations will not be computed-10 22:18:35,319 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:18:46,752 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:18:35,319 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:18:46,752 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:18:35,319 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 7.014, 'learning_rate': 1.965e-05, 'epoch': 0.73} +[WARNING|modeling_utils.py:388] 2022-03-10 22:18:46,752 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:18:35,319 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:18:46,752 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:18:35,319 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:18:46,752 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:18:35,319 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 656/17840 [58:13<29:21:06, 6.15s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:18:55,029 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 656/17840 [58:13<29:21:06, 6.15s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:18:55,029 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 656/17840 [58:13<29:21:06, 6.15s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:18:55,029 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 656/17840 [58:13<29:21:06, 6.15s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:18:55,029 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 657/17840 [58:19<29:49:39, 6.25s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:18:55,029 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:19:03,074 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:18:55,029 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:19:03,074 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:18:55,029 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:19:03,074 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:18:55,029 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 658/17840 [58:25<30:05:21, 6.30s/it]g-point operations will not be computed-10 22:18:55,029 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:19:09,472 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:18:55,029 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:19:09,472 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:18:55,029 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:19:09,472 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:18:55,029 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 659/17840 [58:32<30:13:27, 6.33s/it]g-point operations will not be computed-10 22:18:55,029 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 659/17840 [58:32<30:13:27, 6.33s/it]g-point operations will not be computed-10 22:18:55,029 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 659/17840 [58:32<30:13:27, 6.33s/it]g-point operations will not be computed-10 22:18:55,029 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 659/17840 [58:32<30:13:27, 6.33s/it]g-point operations will not be computed-10 22:18:55,029 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:19:19,063 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:18:55,029 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:19:19,063 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:18:55,029 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:19:23,819 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:18:55,029 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:19:23,819 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:18:55,029 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 661/17840 [58:45<30:16:41, 6.35s/it]g-point operations will not be computed-10 22:18:55,029 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 661/17840 [58:45<30:16:41, 6.35s/it]g-point operations will not be computed-10 22:18:55,029 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 661/17840 [58:45<30:16:41, 6.35s/it]g-point operations will not be computed-10 22:18:55,029 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 661/17840 [58:45<30:16:41, 6.35s/it]g-point operations will not be computed-10 22:18:55,029 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:19:31,676 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:18:55,029 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:19:31,676 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:18:55,029 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:19:31,676 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:18:55,029 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:19:37,928 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:18:55,029 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:19:37,928 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:18:55,029 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.7444, 'learning_rate': 1.989e-05, 'epoch': 0.74} +[WARNING|modeling_utils.py:388] 2022-03-10 22:19:37,928 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:18:55,029 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:19:44,096 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:18:55,029 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:19:44,096 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:18:55,029 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.4939, 'learning_rate': 1.9920000000000002e-05, 'epoch': 0.74} +[WARNING|modeling_utils.py:388] 2022-03-10 22:19:44,096 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:18:55,029 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:19:50,306 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:18:55,029 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:19:50,306 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:18:55,029 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.5062, 'learning_rate': 1.995e-05, 'epoch': 0.75} +[WARNING|modeling_utils.py:388] 2022-03-10 22:19:50,306 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:18:55,029 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:19:56,462 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:18:55,029 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:19:56,462 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:18:55,029 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.7391, 'learning_rate': 1.9980000000000002e-05, 'epoch': 0.75} +[WARNING|modeling_utils.py:388] 2022-03-10 22:19:56,462 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:18:55,029 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:20:02,718 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:18:55,029 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:20:02,718 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:18:55,029 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.5876, 'learning_rate': 2.0010000000000003e-05, 'epoch': 0.75} +[WARNING|modeling_utils.py:388] 2022-03-10 22:20:02,718 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:18:55,029 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:20:08,809 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:18:55,029 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:20:08,809 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:18:55,029 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.5246, 'learning_rate': 2.004e-05, 'epoch': 0.75} +[WARNING|modeling_utils.py:388] 2022-03-10 22:20:08,809 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:18:55,029 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:20:14,853 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:18:55,029 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:20:14,853 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:18:55,029 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.6827, 'learning_rate': 2.0070000000000003e-05, 'epoch': 0.75} +[WARNING|modeling_utils.py:388] 2022-03-10 22:20:19,405 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:18:55,029 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 670/17840 [59:40<29:08:25, 6.11s/it]g-point operations will not be computed-10 22:18:55,029 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 670/17840 [59:40<29:08:25, 6.11s/it]g-point operations will not be computed-10 22:18:55,029 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:20:23,903 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:18:55,029 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:20:23,903 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:18:55,029 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 671/17840 [59:46<28:53:38, 6.06s/it]g-point operations will not be computed-10 22:18:55,029 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 671/17840 [59:46<28:53:38, 6.06s/it]g-point operations will not be computed-10 22:18:55,029 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.4377, 'learning_rate': 2.0130000000000002e-05, 'epoch': 0.75} +[WARNING|modeling_utils.py:388] 2022-03-10 22:20:31,271 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:18:55,029 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:20:31,271 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:18:55,029 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 672/17840 [59:52<28:41:14, 6.02s/it]g-point operations will not be computed-10 22:18:55,029 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:20:35,765 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:18:55,029 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:20:35,765 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:18:55,029 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:20:35,765 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:18:55,029 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 673/17840 [59:58<28:32:59, 5.99s/it]g-point operations will not be computed-10 22:18:55,029 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:20:41,630 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:18:55,029 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:20:41,630 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:18:55,029 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:20:41,630 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:18:55,029 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 674/17840 [1:00:04<28:22:14, 5.95s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:20:46,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 674/17840 [1:00:04<28:22:14, 5.95s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:20:46,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 674/17840 [1:00:04<28:22:14, 5.95s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:20:46,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 674/17840 [1:00:04<28:22:14, 5.95s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:20:46,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 675/17840 [1:00:10<28:40:34, 6.01s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:20:52,234 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 675/17840 [1:00:10<28:40:34, 6.01s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:20:52,234 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:20:56,473 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:20:52,234 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:20:56,473 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:20:52,234 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.6449, 'learning_rate': 2.0280000000000002e-05, 'epoch': 0.76} +[WARNING|modeling_utils.py:388] 2022-03-10 22:21:00,769 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:20:52,234 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 677/17840 [1:00:21<27:59:28, 5.87s/it]g-point operations will not be computed-10 22:20:52,234 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 677/17840 [1:00:21<27:59:28, 5.87s/it]g-point operations will not be computed-10 22:20:52,234 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.4738, 'learning_rate': 2.031e-05, 'epoch': 0.76} +[WARNING|modeling_utils.py:388] 2022-03-10 22:21:06,409 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:20:52,234 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 678/17840 [1:00:27<27:39:43, 5.80s/it]g-point operations will not be computed-10 22:20:52,234 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 678/17840 [1:00:27<27:39:43, 5.80s/it]g-point operations will not be computed-10 22:20:52,234 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:21:10,676 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:20:52,234 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:21:10,676 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:20:52,234 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 679/17840 [1:00:33<27:27:22, 5.76s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:21:14,931 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 679/17840 [1:00:33<27:27:22, 5.76s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:21:14,931 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.6009, 'learning_rate': 2.0370000000000003e-05, 'epoch': 0.76} +[WARNING|modeling_utils.py:388] 2022-03-10 22:21:19,009 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:21:14,931 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:21:19,009 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:21:14,931 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.4856, 'learning_rate': 2.04e-05, 'epoch': 0.76} +[WARNING|modeling_utils.py:388] 2022-03-10 22:21:23,193 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:21:14,931 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:21:23,193 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:21:14,931 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 681/17840 [1:00:44<26:55:27, 5.65s/it]g-point operations will not be computed-10 22:21:14,931 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:21:27,346 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:21:14,931 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:21:27,346 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:21:14,931 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:21:27,346 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:21:14,931 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 682/17840 [1:00:49<26:38:35, 5.59s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:21:31,433 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 682/17840 [1:00:49<26:38:35, 5.59s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:21:31,433 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 682/17840 [1:00:49<26:38:35, 5.59s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:21:31,433 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:21:35,401 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:21:31,433 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:21:35,401 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:21:31,433 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:21:39,422 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:21:31,433 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:21:39,422 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:21:31,433 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 684/17840 [1:01:00<25:59:47, 5.46s/it]g-point operations will not be computed-10 22:21:31,433 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:21:43,350 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:21:31,433 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:21:43,350 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:21:31,433 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:21:43,350 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:21:31,433 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 685/17840 [1:01:05<25:41:56, 5.39s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:21:47,283 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 685/17840 [1:01:05<25:41:56, 5.39s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:21:47,283 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 685/17840 [1:01:05<25:41:56, 5.39s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:21:47,283 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:21:51,069 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:21:47,283 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:21:53,586 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:21:47,283 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:21:56,019 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:21:47,283 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:21:56,019 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:21:47,283 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.5062, 'learning_rate': 2.061e-05, 'epoch': 0.77} +[WARNING|modeling_utils.py:388] 2022-03-10 22:21:59,749 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:21:47,283 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:21:59,749 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:21:47,283 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 688/17840 [1:01:20<24:25:21, 5.13s/it]g-point operations will not be computed-10 22:21:47,283 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:22:03,436 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:21:47,283 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:22:03,436 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:21:47,283 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:22:05,752 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:21:47,283 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:22:08,122 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:21:47,283 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:22:10,368 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:21:47,283 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:22:10,368 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:21:47,283 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.5989, 'learning_rate': 2.07e-05, 'epoch': 0.77} +[WARNING|modeling_utils.py:388] 2022-03-10 22:22:13,753 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:21:47,283 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:22:13,753 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:21:47,283 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 691/17840 [1:01:34<22:43:01, 4.77s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:22:15,936 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:22:17,935 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:22:15,936 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:22:17,935 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:22:15,936 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 692/17840 [1:01:38<21:45:50, 4.57s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:22:19,962 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:22:21,807 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:22:19,962 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:22:21,807 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:22:19,962 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 693/17840 [1:01:42<20:38:13, 4.33s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:22:23,656 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▊ | 693/17840 [1:01:42<20:38:13, 4.33s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:22:23,656 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 694/17840 [1:01:45<19:16:56, 4.05s/it]g-point operations will not be computed-10 22:22:23,656 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 694/17840 [1:01:45<19:16:56, 4.05s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:22:26,963 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 694/17840 [1:01:45<19:16:56, 4.05s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:22:26,963 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 695/17840 [1:01:48<17:56:09, 3.77s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:22:29,997 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 695/17840 [1:01:48<17:56:09, 3.77s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:22:29,997 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 696/17840 [1:01:51<16:29:44, 3.46s/it]g-point operations will not be computed-10 22:22:29,997 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:22:33,867 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:22:32,658 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:22:33,867 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:22:32,658 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:22:36,106 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:22:35,073 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:22:36,106 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:22:35,073 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:22:38,034 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:22:37,133 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:22:38,034 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:22:37,133 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:22:39,775 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:22:38,959 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:22:39,775 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:22:38,959 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 700/17840 [1:02:00<11:35:08, 2.43s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:22:42,463 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 700/17840 [1:02:00<11:35:08, 2.43s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:22:42,463 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:22:45,880 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:22:42,463 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:22:45,880 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:22:42,463 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 701/17840 [1:02:07<18:04:05, 3.80s/it]g-point operations will not be computed-10 22:22:42,463 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 701/17840 [1:02:07<18:04:05, 3.80s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:22:49,282 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:22:52,621 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:22:49,282 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:22:52,621 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:22:49,282 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 702/17840 [1:02:13<22:13:20, 4.67s/it]g-point operations will not be computed-10 22:22:49,282 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 702/17840 [1:02:13<22:13:20, 4.67s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:22:55,975 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 702/17840 [1:02:13<22:13:20, 4.67s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:22:55,975 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + g-point operations will not be computed-10 22:22:55,975 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + g-point operations will not be computed-10 22:22:55,975 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 703/17840 [1:02:20<24:59:04, 5.25s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:23:02,552 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 703/17840 [1:02:20<24:59:04, 5.25s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:23:02,552 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:23:05,819 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:23:02,552 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:23:05,819 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:23:02,552 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 704/17840 [1:02:27<26:56:58, 5.66s/it]g-point operations will not be computed-10 22:23:02,552 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:23:10,894 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:23:02,552 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:23:10,894 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:23:02,552 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:23:10,894 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:23:02,552 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 705/17840 [1:02:33<28:21:29, 5.96s/it]g-point operations will not be computed-10 22:23:02,552 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 705/17840 [1:02:33<28:21:29, 5.96s/it]g-point operations will not be computed-10 22:23:02,552 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:23:19,070 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:23:02,552 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:23:19,070 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:23:02,552 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 706/17840 [1:02:40<29:07:45, 6.12s/it]g-point operations will not be computed-10 22:23:02,552 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 706/17840 [1:02:40<29:07:45, 6.12s/it]g-point operations will not be computed-10 22:23:02,552 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:23:25,571 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:23:02,552 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 707/17840 [1:02:46<29:42:55, 6.24s/it]g-point operations will not be computed-10 22:23:02,552 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 707/17840 [1:02:46<29:42:55, 6.24s/it]g-point operations will not be computed-10 22:23:02,552 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.7461, 'learning_rate': 2.121e-05, 'epoch': 0.79} + 4%|██▉ | 707/17840 [1:02:46<29:42:55, 6.24s/it]g-point operations will not be computed-10 22:23:02,552 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:23:33,566 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:23:02,552 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:23:33,566 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:23:02,552 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.8211, 'learning_rate': 2.124e-05, 'epoch': 0.79} +[WARNING|modeling_utils.py:388] 2022-03-10 22:23:33,566 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:23:02,552 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:23:40,048 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:23:02,552 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:23:40,048 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:23:02,552 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.6199, 'learning_rate': 2.1269999999999998e-05, 'epoch': 0.79} +[WARNING|modeling_utils.py:388] 2022-03-10 22:23:40,048 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:23:02,552 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:23:46,502 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:23:02,552 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:23:46,502 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:23:02,552 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.516, 'learning_rate': 2.13e-05, 'epoch': 0.8} +[WARNING|modeling_utils.py:388] 2022-03-10 22:23:46,502 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:23:02,552 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:23:46,502 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:23:02,552 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 711/17840 [1:03:13<31:18:05, 6.58s/it]g-point operations will not be computed-10 22:23:02,552 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 711/17840 [1:03:13<31:18:05, 6.58s/it]g-point operations will not be computed-10 22:23:02,552 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:23:56,690 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:23:02,552 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:23:56,690 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:23:02,552 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 712/17840 [1:03:19<30:49:57, 6.48s/it]g-point operations will not be computed-10 22:23:02,552 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 712/17840 [1:03:19<30:49:57, 6.48s/it]g-point operations will not be computed-10 22:23:02,552 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.4553, 'learning_rate': 2.136e-05, 'epoch': 0.8} +[WARNING|modeling_utils.py:388] 2022-03-10 22:24:04,560 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:23:02,552 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 713/17840 [1:03:25<30:35:06, 6.43s/it]g-point operations will not be computed-10 22:23:02,552 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 713/17840 [1:03:25<30:35:06, 6.43s/it]g-point operations will not be computed-10 22:23:02,552 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:24:09,262 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:23:02,552 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:24:09,262 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:23:02,552 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 714/17840 [1:03:31<30:13:57, 6.36s/it]g-point operations will not be computed-10 22:23:02,552 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 714/17840 [1:03:31<30:13:57, 6.36s/it]g-point operations will not be computed-10 22:23:02,552 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:24:15,377 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:23:02,552 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:24:15,377 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:23:02,552 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 715/17840 [1:03:38<29:50:14, 6.27s/it]g-point operations will not be computed-10 22:23:02,552 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 715/17840 [1:03:38<29:50:14, 6.27s/it]g-point operations will not be computed-10 22:23:02,552 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:24:21,445 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:23:02,552 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:24:21,445 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:23:02,552 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 716/17840 [1:03:44<29:35:04, 6.22s/it]g-point operations will not be computed-10 22:23:02,552 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 716/17840 [1:03:44<29:35:04, 6.22s/it]g-point operations will not be computed-10 22:23:02,552 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.612, 'learning_rate': 2.148e-05, 'epoch': 0.8} +[WARNING|modeling_utils.py:388] 2022-03-10 22:24:29,097 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:23:02,552 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 717/17840 [1:03:50<29:28:48, 6.20s/it]g-point operations will not be computed-10 22:23:02,552 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 717/17840 [1:03:50<29:28:48, 6.20s/it]g-point operations will not be computed-10 22:23:02,552 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:24:33,675 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:23:02,552 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:24:33,675 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:23:02,552 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 718/17840 [1:03:56<29:15:13, 6.15s/it]g-point operations will not be computed-10 22:23:02,552 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 718/17840 [1:03:56<29:15:13, 6.15s/it]g-point operations will not be computed-10 22:23:02,552 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:24:39,749 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:23:02,552 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:24:39,749 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:23:02,552 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 719/17840 [1:04:02<29:05:41, 6.12s/it]g-point operations will not be computed-10 22:23:02,552 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 719/17840 [1:04:02<29:05:41, 6.12s/it]g-point operations will not be computed-10 22:23:02,552 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:24:45,736 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:23:02,552 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:24:45,736 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:23:02,552 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 720/17840 [1:04:08<28:54:32, 6.08s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:24:50,219 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 720/17840 [1:04:08<28:54:32, 6.08s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:24:50,219 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.473, 'learning_rate': 2.16e-05, 'epoch': 0.81} + 4%|██▉ | 720/17840 [1:04:08<28:54:32, 6.08s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:24:50,219 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 721/17840 [1:04:14<28:46:02, 6.05s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:24:56,270 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 721/17840 [1:04:14<28:46:02, 6.05s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:24:56,270 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.4523, 'learning_rate': 2.163e-05, 'epoch': 0.81} + 4%|██▉ | 721/17840 [1:04:14<28:46:02, 6.05s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:24:56,270 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 722/17840 [1:04:20<28:54:43, 6.08s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:24:56,270 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 722/17840 [1:04:20<28:54:43, 6.08s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:24:56,270 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:25:03,913 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:24:56,270 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:25:03,913 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:24:56,270 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 723/17840 [1:04:26<28:55:27, 6.08s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:25:08,460 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 723/17840 [1:04:26<28:55:27, 6.08s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:25:08,460 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.3943, 'learning_rate': 2.169e-05, 'epoch': 0.81} + 4%|██▉ | 723/17840 [1:04:26<28:55:27, 6.08s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:25:08,460 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|██▉ | 723/17840 [1:04:26<28:55:27, 6.08s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:25:08,460 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███ | 724/17840 [1:04:32<28:41:09, 6.03s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:25:14,372 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███ | 724/17840 [1:04:32<28:41:09, 6.03s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:25:14,372 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███ | 724/17840 [1:04:32<28:41:09, 6.03s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:25:14,372 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███ | 724/17840 [1:04:32<28:41:09, 6.03s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:25:14,372 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███ | 725/17840 [1:04:38<28:57:28, 6.09s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:25:20,607 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███ | 725/17840 [1:04:38<28:57:28, 6.09s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:25:20,607 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:25:24,828 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:25:20,607 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:25:24,828 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:25:20,607 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.6476, 'learning_rate': 2.178e-05, 'epoch': 0.81} +[WARNING|modeling_utils.py:388] 2022-03-10 22:25:24,828 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:25:20,607 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:25:24,828 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:25:20,607 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:25:30,541 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:25:20,607 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:25:30,541 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:25:20,607 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:25:34,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:25:20,607 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:25:34,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:25:20,607 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███ | 728/17840 [1:04:55<27:53:30, 5.87s/it]g-point operations will not be computed-10 22:25:20,607 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:25:39,100 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:25:20,607 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:25:39,100 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:25:20,607 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:25:39,100 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:25:20,607 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███ | 729/17840 [1:05:01<27:28:28, 5.78s/it]g-point operations will not be computed-10 22:25:20,607 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:25:44,732 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:25:20,607 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:25:47,473 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:25:20,607 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:25:47,473 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:25:20,607 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.5489, 'learning_rate': 2.19e-05, 'epoch': 0.82} +[WARNING|modeling_utils.py:388] 2022-03-10 22:25:47,473 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:25:20,607 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:25:47,473 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:25:20,607 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:25:52,994 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:25:20,607 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:25:55,757 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:25:20,607 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:25:55,757 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:25:20,607 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:25:55,757 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:25:20,607 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███ | 732/17840 [1:05:18<26:32:28, 5.59s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:25:59,817 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███ | 732/17840 [1:05:18<26:32:28, 5.59s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:25:59,817 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███ | 732/17840 [1:05:18<26:32:28, 5.59s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:25:59,817 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███ | 732/17840 [1:05:18<26:32:28, 5.59s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:25:59,817 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███ | 733/17840 [1:05:23<26:16:54, 5.53s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:26:05,151 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███ | 733/17840 [1:05:23<26:16:54, 5.53s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:26:05,151 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███ | 733/17840 [1:05:23<26:16:54, 5.53s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:26:05,151 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:26:09,032 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:26:05,151 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:26:11,599 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:26:05,151 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:26:11,599 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:26:05,151 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:26:11,599 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:26:05,151 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███ | 735/17840 [1:05:33<25:21:29, 5.34s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:26:15,467 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:26:18,006 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:26:15,467 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:26:18,006 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:26:15,467 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███ | 736/17840 [1:05:38<25:03:53, 5.28s/it]g-point operations will not be computed-10 22:26:15,467 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:26:21,767 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:26:15,467 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:26:24,166 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:26:15,467 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:26:24,166 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:26:15,467 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.5158, 'learning_rate': 2.211e-05, 'epoch': 0.83} +[WARNING|modeling_utils.py:388] 2022-03-10 22:26:27,803 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:26:15,467 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:26:27,803 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:26:15,467 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███ | 738/17840 [1:05:48<24:00:53, 5.06s/it]g-point operations will not be computed-10 22:26:15,467 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:26:31,314 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:26:15,467 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:26:33,552 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:26:15,467 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:26:33,552 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:26:15,467 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:26:35,849 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:26:15,467 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:26:35,849 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:26:15,467 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:26:38,035 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:26:15,467 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:26:40,284 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:26:15,467 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:26:42,455 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:26:15,467 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:26:42,455 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:26:15,467 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.6142, 'learning_rate': 2.223e-05, 'epoch': 0.83} +[WARNING|modeling_utils.py:388] 2022-03-10 22:26:45,654 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:26:15,467 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:26:45,654 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:26:15,467 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███ | 742/17840 [1:06:06<21:28:56, 4.52s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:26:47,685 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + g-point operations will not be computed-10 22:26:47,685 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + g-point operations will not be computed-10 22:26:47,685 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███ | 743/17840 [1:06:10<20:38:15, 4.35s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:26:51,553 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███ | 744/17840 [1:06:13<19:32:37, 4.12s/it]g-point operations will not be computed-10 22:26:51,553 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███ | 744/17840 [1:06:13<19:32:37, 4.12s/it]g-point operations will not be computed-10 22:26:51,553 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:26:56,626 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:26:55,043 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:26:56,626 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:26:55,043 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███ | 745/17840 [1:06:17<18:20:26, 3.86s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:26:58,250 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███ | 746/17840 [1:06:20<17:03:35, 3.59s/it]g-point operations will not be computed-10 22:26:58,250 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███ | 746/17840 [1:06:20<17:03:35, 3.59s/it]g-point operations will not be computed-10 22:26:58,250 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:27:02,329 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:27:01,086 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:27:02,329 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:27:01,086 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:27:04,670 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:27:03,612 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:27:04,670 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:27:03,612 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:27:06,635 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:27:05,743 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:27:06,635 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:27:05,743 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:27:08,485 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:27:07,626 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:27:08,485 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:27:07,626 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███ | 750/17840 [1:06:29<11:58:16, 2.52s/it]g-point operations will not be computed-10 22:27:07,626 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███ | 750/17840 [1:06:29<11:58:16, 2.52s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:27:11,208 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:27:14,778 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:27:11,208 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███ | 751/17840 [1:06:36<18:34:40, 3.91s/it]g-point operations will not be computed-10 22:27:11,208 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███ | 751/17840 [1:06:36<18:34:40, 3.91s/it]g-point operations will not be computed-10 22:27:11,208 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███ | 751/17840 [1:06:36<18:34:40, 3.91s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:27:18,224 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███ | 751/17840 [1:06:36<18:34:40, 3.91s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:27:18,224 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + g-point operations will not be computed-10 22:27:18,224 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + g-point operations will not be computed-10 22:27:18,224 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███ | 752/17840 [1:06:43<22:47:36, 4.80s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:27:25,127 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███ | 752/17840 [1:06:43<22:47:36, 4.80s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:27:25,127 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:27:28,497 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:27:25,127 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:27:28,497 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:27:25,127 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███ | 753/17840 [1:06:49<25:39:13, 5.40s/it]g-point operations will not be computed-10 22:27:25,127 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███ | 753/17840 [1:06:49<25:39:13, 5.40s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:27:31,931 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:27:35,195 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:27:31,931 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 754/17840 [1:06:56<27:30:40, 5.80s/it]g-point operations will not be computed-10 22:27:31,931 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 754/17840 [1:06:56<27:30:40, 5.80s/it]g-point operations will not be computed-10 22:27:31,931 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.7233, 'learning_rate': 2.262e-05, 'epoch': 0.85} + 4%|███▏ | 754/17840 [1:06:56<27:30:40, 5.80s/it]g-point operations will not be computed-10 22:27:31,931 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:27:43,544 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:27:31,931 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:27:43,544 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:27:31,931 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.6489, 'learning_rate': 2.265e-05, 'epoch': 0.85} +[WARNING|modeling_utils.py:388] 2022-03-10 22:27:43,544 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:27:31,931 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:27:50,232 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:27:31,931 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:27:50,232 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:27:31,931 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.7645, 'learning_rate': 2.268e-05, 'epoch': 0.85} +[WARNING|modeling_utils.py:388] 2022-03-10 22:27:50,232 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:27:31,931 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:27:50,232 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:27:31,931 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:27:50,232 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:27:31,931 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 757/17840 [1:07:16<30:02:46, 6.33s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:27:58,428 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 757/17840 [1:07:16<30:02:46, 6.33s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:27:58,428 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 757/17840 [1:07:16<30:02:46, 6.33s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:27:58,428 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 758/17840 [1:07:22<30:20:10, 6.39s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:27:58,428 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 758/17840 [1:07:22<30:20:10, 6.39s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:27:58,428 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.5009, 'learning_rate': 2.274e-05, 'epoch': 0.85} +[WARNING|modeling_utils.py:388] 2022-03-10 22:28:08,188 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:27:58,428 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 759/17840 [1:07:29<30:28:33, 6.42s/it]g-point operations will not be computed-10 22:27:58,428 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 759/17840 [1:07:29<30:28:33, 6.42s/it]g-point operations will not be computed-10 22:27:58,428 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.5682, 'learning_rate': 2.277e-05, 'epoch': 0.85} + 4%|███▏ | 759/17840 [1:07:29<30:28:33, 6.42s/it]g-point operations will not be computed-10 22:27:58,428 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:28:16,313 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:27:58,428 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:28:16,313 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:27:58,428 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.5185, 'learning_rate': 2.2800000000000002e-05, 'epoch': 0.85} +[WARNING|modeling_utils.py:388] 2022-03-10 22:28:16,313 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:27:58,428 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:28:22,639 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:27:58,428 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:28:22,639 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:27:58,428 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.5858, 'learning_rate': 2.283e-05, 'epoch': 0.85} +[WARNING|modeling_utils.py:388] 2022-03-10 22:28:22,639 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:27:58,428 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:28:29,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:27:58,428 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:28:29,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:27:58,428 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.4719, 'learning_rate': 2.286e-05, 'epoch': 0.85} +[WARNING|modeling_utils.py:388] 2022-03-10 22:28:29,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:27:58,428 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:28:35,257 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:27:58,428 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:28:35,257 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:27:58,428 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.3274, 'learning_rate': 2.289e-05, 'epoch': 0.86} +[WARNING|modeling_utils.py:388] 2022-03-10 22:28:35,257 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:27:58,428 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:28:41,614 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:27:58,428 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:28:41,614 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:27:58,428 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:28:41,614 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:27:58,428 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.2561, 'learning_rate': 2.292e-05, 'epoch': 0.86} +[WARNING|modeling_utils.py:388] 2022-03-10 22:28:41,614 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:27:58,428 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 765/17840 [1:08:07<30:00:47, 6.33s/it]g-point operations will not be computed-10 22:27:58,428 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 765/17840 [1:08:07<30:00:47, 6.33s/it]g-point operations will not be computed-10 22:27:58,428 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:28:51,044 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:27:58,428 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:28:51,044 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:27:58,428 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 766/17840 [1:08:13<29:55:52, 6.31s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:28:55,765 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 766/17840 [1:08:13<29:55:52, 6.31s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:28:55,765 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.4045, 'learning_rate': 2.298e-05, 'epoch': 0.86} + 4%|███▏ | 766/17840 [1:08:13<29:55:52, 6.31s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:28:55,765 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 767/17840 [1:08:20<29:44:17, 6.27s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:29:01,908 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 767/17840 [1:08:20<29:44:17, 6.27s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:29:01,908 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.434, 'learning_rate': 2.301e-05, 'epoch': 0.86} + 4%|███▏ | 767/17840 [1:08:20<29:44:17, 6.27s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:29:01,908 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 768/17840 [1:08:26<29:31:11, 6.22s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:29:01,908 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 768/17840 [1:08:26<29:31:11, 6.22s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:29:01,908 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:29:09,546 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:29:01,908 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:29:09,546 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:29:01,908 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 769/17840 [1:08:32<29:24:27, 6.20s/it]g-point operations will not be computed-10 22:29:01,908 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 769/17840 [1:08:32<29:24:27, 6.20s/it]g-point operations will not be computed-10 22:29:01,908 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:29:15,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:29:01,908 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:29:15,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:29:01,908 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 770/17840 [1:08:38<29:17:03, 6.18s/it]g-point operations will not be computed-10 22:29:01,908 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 770/17840 [1:08:38<29:17:03, 6.18s/it]g-point operations will not be computed-10 22:29:01,908 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:29:21,814 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:29:01,908 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:29:21,814 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:29:01,908 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 771/17840 [1:08:44<29:13:21, 6.16s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:29:26,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 771/17840 [1:08:44<29:13:21, 6.16s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:29:26,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.5898, 'learning_rate': 2.313e-05, 'epoch': 0.86} +[WARNING|modeling_utils.py:388] 2022-03-10 22:29:30,881 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:29:26,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:29:30,881 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:29:26,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.5922, 'learning_rate': 2.3160000000000002e-05, 'epoch': 0.87} +[WARNING|modeling_utils.py:388] 2022-03-10 22:29:30,881 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:29:26,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:29:36,921 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:29:26,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:29:36,921 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:29:26,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.5272, 'learning_rate': 2.319e-05, 'epoch': 0.87} +[WARNING|modeling_utils.py:388] 2022-03-10 22:29:36,921 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:29:26,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:29:42,797 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:29:26,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:29:42,797 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:29:26,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.3065, 'learning_rate': 2.322e-05, 'epoch': 0.87} +[WARNING|modeling_utils.py:388] 2022-03-10 22:29:42,797 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:29:26,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:29:48,992 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:29:26,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:29:48,992 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:29:26,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.1717, 'learning_rate': 2.3250000000000003e-05, 'epoch': 0.87} +[WARNING|modeling_utils.py:388] 2022-03-10 22:29:48,992 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:29:26,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:29:48,992 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:29:26,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:29:54,757 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:29:26,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:29:54,757 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:29:26,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:29:59,074 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:29:26,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:29:59,074 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:29:26,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 777/17840 [1:09:20<28:03:37, 5.92s/it]g-point operations will not be computed-10 22:29:26,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:30:03,401 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:29:26,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:30:03,401 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:29:26,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 778/17840 [1:09:25<27:44:14, 5.85s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:30:07,712 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 778/17840 [1:09:25<27:44:14, 5.85s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:30:07,712 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.5341, 'learning_rate': 2.334e-05, 'epoch': 0.87} +[WARNING|modeling_utils.py:388] 2022-03-10 22:30:11,843 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:30:07,712 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:30:11,843 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:30:07,712 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:30:11,843 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:30:07,712 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.4253, 'learning_rate': 2.337e-05, 'epoch': 0.87} +[WARNING|modeling_utils.py:388] 2022-03-10 22:30:17,516 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:30:07,712 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:30:17,516 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:30:07,712 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.4207, 'learning_rate': 2.3400000000000003e-05, 'epoch': 0.87} +[WARNING|modeling_utils.py:388] 2022-03-10 22:30:21,739 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:30:07,712 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:30:21,739 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:30:07,712 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 781/17840 [1:09:42<27:01:23, 5.70s/it]g-point operations will not be computed-10 22:30:07,712 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:30:25,892 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:30:07,712 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:30:25,892 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:30:07,712 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 782/17840 [1:09:48<26:43:43, 5.64s/it]g-point operations will not be computed-10 22:30:07,712 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▏ | 782/17840 [1:09:48<26:43:43, 5.64s/it]g-point operations will not be computed-10 22:30:07,712 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:30:31,404 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:30:07,712 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:30:34,057 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:30:07,712 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:30:34,057 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:30:07,712 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.5258, 'learning_rate': 2.349e-05, 'epoch': 0.88} +[WARNING|modeling_utils.py:388] 2022-03-10 22:30:38,057 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:30:07,712 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:30:38,057 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:30:07,712 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▎ | 784/17840 [1:09:59<26:03:02, 5.50s/it]g-point operations will not be computed-10 22:30:07,712 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:30:42,005 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:30:07,712 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:30:42,005 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:30:07,712 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:30:42,005 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:30:07,712 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▎ | 785/17840 [1:10:04<25:34:35, 5.40s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:30:45,870 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▎ | 785/17840 [1:10:04<25:34:35, 5.40s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:30:45,870 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▎ | 785/17840 [1:10:04<25:34:35, 5.40s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:30:45,870 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▎ | 785/17840 [1:10:04<25:34:35, 5.40s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:30:45,870 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▎ | 786/17840 [1:10:10<27:20:44, 5.77s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:30:45,870 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:30:53,670 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:30:45,870 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:30:53,670 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:30:45,870 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:30:56,094 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:30:45,870 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:30:58,630 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:30:45,870 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:30:58,630 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:30:45,870 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:30:58,630 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:30:45,870 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▎ | 788/17840 [1:10:20<25:17:13, 5.34s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:31:02,280 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:31:04,612 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:31:02,280 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:31:04,612 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:31:02,280 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 4%|███▎ | 789/17840 [1:10:25<24:27:55, 5.17s/it]g-point operations will not be computed-10 22:31:02,280 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:31:08,172 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:31:02,280 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:31:08,172 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:31:02,280 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:31:10,403 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:31:02,280 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:31:12,714 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:31:02,280 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:31:14,846 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:31:02,280 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:31:14,846 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:31:02,280 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:31:16,994 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:31:02,280 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:31:19,040 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:31:02,280 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:31:19,040 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:31:02,280 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:31:21,086 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:31:02,280 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:31:22,959 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:31:02,280 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:31:22,959 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:31:02,280 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:31:24,939 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:31:02,280 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:31:24,939 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:31:02,280 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:31:26,640 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:31:02,280 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:31:28,326 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:31:02,280 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:31:28,326 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:31:02,280 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:31:31,425 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:31:02,280 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:31:31,425 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:31:02,280 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:31:32,760 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:31:02,280 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:31:35,281 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:31:02,280 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:31:35,281 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:31:02,280 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:31:37,494 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:31:02,280 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:31:37,494 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:31:02,280 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:31:39,423 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:31:02,280 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:31:39,423 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:31:02,280 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:31:40,360 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:31:02,280 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:31:40,360 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:31:02,280 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:31:41,523 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:31:02,280 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:31:45,290 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:31:02,280 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:31:45,290 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:31:02,280 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:31:45,290 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:31:02,280 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:31:48,673 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:31:02,280 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:31:48,673 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:31:02,280 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:31:52,097 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:31:02,280 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:31:55,463 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:31:02,280 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:31:55,463 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:31:02,280 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.8057, 'learning_rate': 2.4060000000000003e-05, 'epoch': 0.9} +[WARNING|modeling_utils.py:388] 2022-03-10 22:31:59,210 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:31:02,280 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:31:59,210 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:31:02,280 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:31:59,210 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:31:02,280 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:32:02,473 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:31:02,280 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:32:05,775 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:31:02,280 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:32:05,775 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:31:02,280 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▎ | 804/17840 [1:11:28<27:17:25, 5.77s/it]g-point operations will not be computed-10 22:31:02,280 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▎ | 804/17840 [1:11:28<27:17:25, 5.77s/it]g-point operations will not be computed-10 22:31:02,280 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.8048, 'learning_rate': 2.4120000000000003e-05, 'epoch': 0.9} +[WARNING|modeling_utils.py:388] 2022-03-10 22:32:14,022 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:31:02,280 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▎ | 805/17840 [1:11:35<28:30:21, 6.02s/it]g-point operations will not be computed-10 22:31:02,280 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▎ | 805/17840 [1:11:35<28:30:21, 6.02s/it]g-point operations will not be computed-10 22:31:02,280 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.4712, 'learning_rate': 2.415e-05, 'epoch': 0.9} + 5%|███▎ | 805/17840 [1:11:35<28:30:21, 6.02s/it]g-point operations will not be computed-10 22:31:02,280 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:32:22,114 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:31:02,280 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:32:22,114 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:31:02,280 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.6673, 'learning_rate': 2.4180000000000002e-05, 'epoch': 0.9} +[WARNING|modeling_utils.py:388] 2022-03-10 22:32:22,114 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:31:02,280 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:32:28,571 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:31:02,280 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:32:28,571 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:31:02,280 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.6048, 'learning_rate': 2.4210000000000004e-05, 'epoch': 0.9} +[WARNING|modeling_utils.py:388] 2022-03-10 22:32:28,571 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:31:02,280 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:32:28,571 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:31:02,280 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:32:28,571 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:31:02,280 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▎ | 808/17840 [1:11:54<30:04:40, 6.36s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:32:36,861 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▎ | 808/17840 [1:11:54<30:04:40, 6.36s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:32:36,861 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▎ | 808/17840 [1:11:54<30:04:40, 6.36s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:32:36,861 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▎ | 808/17840 [1:11:54<30:04:40, 6.36s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:32:36,861 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▎ | 809/17840 [1:12:01<30:06:45, 6.37s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:32:36,861 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:32:44,784 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:32:36,861 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:32:44,784 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:32:36,861 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:32:44,784 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:32:36,861 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▎ | 810/17840 [1:12:07<30:03:26, 6.35s/it]g-point operations will not be computed-10 22:32:36,861 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:32:51,132 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:32:36,861 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:32:51,132 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:32:36,861 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:32:51,132 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:32:36,861 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▎ | 811/17840 [1:12:13<30:02:23, 6.35s/it]g-point operations will not be computed-10 22:32:36,861 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:32:57,398 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:32:36,861 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:32:57,398 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:32:36,861 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:32:57,398 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:32:36,861 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▎ | 812/17840 [1:12:20<29:55:07, 6.33s/it]g-point operations will not be computed-10 22:32:36,861 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:33:03,684 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:32:36,861 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:33:03,684 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:32:36,861 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▎ | 813/17840 [1:12:26<29:59:40, 6.34s/it]g-point operations will not be computed-10 22:32:36,861 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▎ | 813/17840 [1:12:26<29:59:40, 6.34s/it]g-point operations will not be computed-10 22:32:36,861 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:33:10,016 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:32:36,861 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:33:10,016 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:32:36,861 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 814/17840 [1:12:32<29:47:41, 6.30s/it]g-point operations will not be computed-10 22:32:36,861 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 814/17840 [1:12:32<29:47:41, 6.30s/it]g-point operations will not be computed-10 22:32:36,861 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.3781, 'learning_rate': 2.442e-05, 'epoch': 0.91} +[WARNING|modeling_utils.py:388] 2022-03-10 22:33:17,701 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:32:36,861 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 815/17840 [1:12:38<29:31:39, 6.24s/it]g-point operations will not be computed-10 22:32:36,861 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 815/17840 [1:12:38<29:31:39, 6.24s/it]g-point operations will not be computed-10 22:32:36,861 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.4108, 'learning_rate': 2.4449999999999998e-05, 'epoch': 0.91} +[WARNING|modeling_utils.py:388] 2022-03-10 22:33:23,790 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:32:36,861 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 816/17840 [1:12:45<29:21:41, 6.21s/it]g-point operations will not be computed-10 22:32:36,861 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 816/17840 [1:12:45<29:21:41, 6.21s/it]g-point operations will not be computed-10 22:32:36,861 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:33:28,370 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:32:36,861 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:33:28,370 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:32:36,861 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 817/17840 [1:12:51<29:06:09, 6.15s/it]g-point operations will not be computed-10 22:32:36,861 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 817/17840 [1:12:51<29:06:09, 6.15s/it]g-point operations will not be computed-10 22:32:36,861 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:33:34,458 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:32:36,861 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:33:34,458 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:32:36,861 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 818/17840 [1:12:57<29:00:04, 6.13s/it]g-point operations will not be computed-10 22:32:36,861 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 818/17840 [1:12:57<29:00:04, 6.13s/it]g-point operations will not be computed-10 22:32:36,861 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.3803, 'learning_rate': 2.454e-05, 'epoch': 0.92} +[WARNING|modeling_utils.py:388] 2022-03-10 22:33:42,275 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:32:36,861 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 819/17840 [1:13:03<29:15:01, 6.19s/it]g-point operations will not be computed-10 22:32:36,861 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 819/17840 [1:13:03<29:15:01, 6.19s/it]g-point operations will not be computed-10 22:32:36,861 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.2678, 'learning_rate': 2.457e-05, 'epoch': 0.92} +[WARNING|modeling_utils.py:388] 2022-03-10 22:33:48,205 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:32:36,861 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 820/17840 [1:13:09<28:56:49, 6.12s/it]g-point operations will not be computed-10 22:32:36,861 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 820/17840 [1:13:09<28:56:49, 6.12s/it]g-point operations will not be computed-10 22:32:36,861 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.4604, 'learning_rate': 2.4599999999999998e-05, 'epoch': 0.92} +[WARNING|modeling_utils.py:388] 2022-03-10 22:33:54,252 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:32:36,861 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:33:54,252 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:32:36,861 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 821/17840 [1:13:15<28:45:32, 6.08s/it]g-point operations will not be computed-10 22:32:36,861 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:33:58,701 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:32:36,861 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:33:58,701 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:32:36,861 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:33:58,701 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:32:36,861 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 822/17840 [1:13:21<28:26:20, 6.02s/it]g-point operations will not be computed-10 22:32:36,861 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:34:04,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:32:36,861 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:34:04,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:32:36,861 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:34:04,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:32:36,861 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 823/17840 [1:13:27<28:06:28, 5.95s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:34:08,882 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 823/17840 [1:13:27<28:06:28, 5.95s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:34:08,882 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:34:13,191 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:34:08,882 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:34:13,191 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:34:08,882 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.3879, 'learning_rate': 2.472e-05, 'epoch': 0.92} +[WARNING|modeling_utils.py:388] 2022-03-10 22:34:13,191 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:34:08,882 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:34:13,191 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:34:08,882 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:34:13,191 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:34:08,882 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 825/17840 [1:13:39<28:42:33, 6.07s/it]g-point operations will not be computed-10 22:34:08,882 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:34:22,603 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:34:08,882 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:34:22,603 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:34:08,882 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:34:22,603 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:34:08,882 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 826/17840 [1:13:45<28:17:25, 5.99s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:34:26,905 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:34:29,707 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:34:26,905 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 827/17840 [1:13:50<27:54:03, 5.90s/it]g-point operations will not be computed-10 22:34:26,905 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 827/17840 [1:13:50<27:54:03, 5.90s/it]g-point operations will not be computed-10 22:34:26,905 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:34:33,981 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:34:26,905 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:34:33,981 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:34:26,905 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 828/17840 [1:13:56<27:29:27, 5.82s/it]g-point operations will not be computed-10 22:34:26,905 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 828/17840 [1:13:56<27:29:27, 5.82s/it]g-point operations will not be computed-10 22:34:26,905 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:34:39,575 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:34:26,905 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:34:42,321 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:34:26,905 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:34:42,321 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:34:26,905 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:34:42,321 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:34:26,905 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.3526, 'learning_rate': 2.487e-05, 'epoch': 0.93} +[WARNING|modeling_utils.py:388] 2022-03-10 22:34:42,321 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:34:26,905 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:34:47,829 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:34:26,905 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:34:47,829 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:34:26,905 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:34:52,184 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:34:26,905 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:34:52,184 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:34:26,905 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 831/17840 [1:14:13<26:52:40, 5.69s/it]g-point operations will not be computed-10 22:34:26,905 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:34:56,336 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:34:26,905 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:34:56,336 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:34:26,905 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:34:56,336 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:34:26,905 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 832/17840 [1:14:18<26:33:30, 5.62s/it]g-point operations will not be computed-10 22:34:26,905 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:35:01,712 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:34:26,905 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:35:04,416 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:34:26,905 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:35:04,416 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:34:26,905 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.3711, 'learning_rate': 2.499e-05, 'epoch': 0.93} +[WARNING|modeling_utils.py:388] 2022-03-10 22:35:08,401 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:34:26,905 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 834/17840 [1:14:29<25:48:34, 5.46s/it]g-point operations will not be computed-10 22:34:26,905 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 834/17840 [1:14:29<25:48:34, 5.46s/it]g-point operations will not be computed-10 22:34:26,905 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:35:12,297 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:34:26,905 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:35:14,760 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:34:26,905 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:35:14,760 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:34:26,905 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.3602, 'learning_rate': 2.505e-05, 'epoch': 0.94} +[WARNING|modeling_utils.py:388] 2022-03-10 22:35:18,546 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:34:26,905 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 836/17840 [1:14:39<24:47:02, 5.25s/it]g-point operations will not be computed-10 22:34:26,905 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 836/17840 [1:14:39<24:47:02, 5.25s/it]g-point operations will not be computed-10 22:34:26,905 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:35:22,284 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:34:26,905 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:35:24,729 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:34:26,905 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:35:24,729 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:34:26,905 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.357, 'learning_rate': 2.511e-05, 'epoch': 0.94} +[WARNING|modeling_utils.py:388] 2022-03-10 22:35:28,376 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:34:26,905 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:35:28,376 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:34:26,905 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 838/17840 [1:14:49<23:52:10, 5.05s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:35:30,757 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:35:32,985 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:35:30,757 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:35:32,985 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:35:30,757 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 839/17840 [1:14:53<23:10:30, 4.91s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:35:35,254 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:35:37,332 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:35:35,254 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:35:37,332 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:35:35,254 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▍ | 840/17840 [1:14:57<22:12:32, 4.70s/it]g-point operations will not be computed-10 22:35:35,254 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:35:40,417 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:35:35,254 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:35:40,417 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:35:35,254 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:35:42,352 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:35:35,254 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:35:44,283 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:35:35,254 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:35:44,283 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:35:35,254 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:35:46,084 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:35:35,254 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:35:46,084 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:35:35,254 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:35:49,538 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:35:35,254 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:35:51,261 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:35:35,254 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:35:51,261 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:35:35,254 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:35:52,778 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:35:35,254 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:35:52,778 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:35:35,254 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:35:55,575 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:35:35,254 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:35:56,927 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:35:35,254 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:35:56,927 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:35:35,254 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:35:59,347 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:35:35,254 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:35:59,347 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:35:35,254 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:36:01,578 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:35:35,254 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:36:01,578 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:35:35,254 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:36:03,492 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:35:35,254 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:36:03,492 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:35:35,254 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:36:05,279 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:35:35,254 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:36:05,279 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:35:35,254 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:36:06,465 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:35:35,254 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:36:06,465 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:35:35,254 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:36:10,265 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:35:35,254 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:36:13,624 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:35:35,254 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:36:13,624 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:35:35,254 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.9396, 'learning_rate': 2.553e-05, 'epoch': 0.95} +[WARNING|modeling_utils.py:388] 2022-03-10 22:36:17,069 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:35:35,254 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:36:17,069 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:35:35,254 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:36:17,069 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:35:35,254 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:36:20,428 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:35:35,254 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:36:23,813 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:35:35,254 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:36:23,813 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:35:35,254 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:36:23,813 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:35:35,254 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:36:27,105 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:35:35,254 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:36:27,105 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:35:35,254 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:36:30,474 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:35:35,254 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:36:33,757 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:35:35,254 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:36:33,757 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:35:35,254 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.9008, 'learning_rate': 2.562e-05, 'epoch': 0.96} +[WARNING|modeling_utils.py:388] 2022-03-10 22:36:37,141 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:35:35,254 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:36:40,388 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:35:35,254 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:36:40,388 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:35:35,254 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.6005, 'learning_rate': 2.565e-05, 'epoch': 0.96} +[WARNING|modeling_utils.py:388] 2022-03-10 22:36:40,388 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:35:35,254 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:36:40,388 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:35:35,254 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:36:40,388 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:35:35,254 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 856/17840 [1:16:06<28:55:26, 6.13s/it]g-point operations will not be computed-10 22:35:35,254 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:36:50,155 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:35:35,254 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:36:50,155 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:35:35,254 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:36:50,155 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:35:35,254 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 857/17840 [1:16:13<29:22:07, 6.23s/it]g-point operations will not be computed-10 22:35:35,254 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:36:56,634 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:35:35,254 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:36:56,634 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:35:35,254 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:36:56,634 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:35:35,254 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 858/17840 [1:16:19<29:41:38, 6.29s/it]g-point operations will not be computed-10 22:35:35,254 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 858/17840 [1:16:19<29:41:38, 6.29s/it]g-point operations will not be computed-10 22:35:35,254 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:37:04,546 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:35:35,254 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:37:04,546 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:35:35,254 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 859/17840 [1:16:25<29:45:35, 6.31s/it]g-point operations will not be computed-10 22:35:35,254 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 859/17840 [1:16:25<29:45:35, 6.31s/it]g-point operations will not be computed-10 22:35:35,254 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:37:10,846 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:35:35,254 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:37:10,846 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:35:35,254 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 860/17840 [1:16:32<29:42:27, 6.30s/it]g-point operations will not be computed-10 22:35:35,254 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 860/17840 [1:16:32<29:42:27, 6.30s/it]g-point operations will not be computed-10 22:35:35,254 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 860/17840 [1:16:32<29:42:27, 6.30s/it]g-point operations will not be computed-10 22:35:35,254 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 860/17840 [1:16:32<29:42:27, 6.30s/it]g-point operations will not be computed-10 22:35:35,254 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:37:18,610 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:35:35,254 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:37:18,610 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:35:35,254 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:37:18,610 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:35:35,254 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:37:24,835 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:35:35,254 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:37:24,835 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:35:35,254 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.4885, 'learning_rate': 2.586e-05, 'epoch': 0.97} +[WARNING|modeling_utils.py:388] 2022-03-10 22:37:24,835 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:35:35,254 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:37:31,010 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:35:35,254 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:37:31,010 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:35:35,254 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.4111, 'learning_rate': 2.589e-05, 'epoch': 0.97} +[WARNING|modeling_utils.py:388] 2022-03-10 22:37:31,010 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:35:35,254 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:37:37,087 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:35:35,254 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:37:37,087 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:35:35,254 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.5711, 'learning_rate': 2.592e-05, 'epoch': 0.97} +[WARNING|modeling_utils.py:388] 2022-03-10 22:37:37,087 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:35:35,254 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:37:43,112 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:35:35,254 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:37:43,112 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:35:35,254 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.5212, 'learning_rate': 2.595e-05, 'epoch': 0.97} +[WARNING|modeling_utils.py:388] 2022-03-10 22:37:43,112 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:35:35,254 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:37:43,112 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:35:35,254 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:37:49,182 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:35:35,254 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:37:49,182 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:35:35,254 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:37:53,704 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:35:35,254 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 867/17840 [1:17:14<28:42:32, 6.09s/it]g-point operations will not be computed-10 22:35:35,254 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 867/17840 [1:17:14<28:42:32, 6.09s/it]g-point operations will not be computed-10 22:35:35,254 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.4778, 'learning_rate': 2.601e-05, 'epoch': 0.97} +[WARNING|modeling_utils.py:388] 2022-03-10 22:37:59,705 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:35:35,254 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:37:59,705 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:35:35,254 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 868/17840 [1:17:20<28:33:02, 6.06s/it]g-point operations will not be computed-10 22:35:35,254 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 868/17840 [1:17:20<28:33:02, 6.06s/it]g-point operations will not be computed-10 22:35:35,254 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:38:05,653 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:35:35,254 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:38:05,653 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:35:35,254 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 869/17840 [1:17:26<28:22:58, 6.02s/it]g-point operations will not be computed-10 22:35:35,254 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:38:10,128 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:35:35,254 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:38:10,128 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:35:35,254 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:38:10,128 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:35:35,254 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 870/17840 [1:17:32<28:11:29, 5.98s/it]g-point operations will not be computed-10 22:35:35,254 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:38:16,020 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:35:35,254 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:38:16,020 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:35:35,254 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:38:16,020 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:35:35,254 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 871/17840 [1:17:38<28:01:20, 5.94s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:38:20,379 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 871/17840 [1:17:38<28:01:20, 5.94s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:38:20,379 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:38:24,566 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:38:20,379 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:38:24,566 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:38:20,379 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.4134, 'learning_rate': 2.616e-05, 'epoch': 0.98} +[WARNING|modeling_utils.py:388] 2022-03-10 22:38:28,892 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:38:20,379 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 873/17840 [1:17:49<27:30:01, 5.83s/it]g-point operations will not be computed-10 22:38:20,379 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▌ | 873/17840 [1:17:49<27:30:01, 5.83s/it]g-point operations will not be computed-10 22:38:20,379 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.3563, 'learning_rate': 2.619e-05, 'epoch': 0.98} +[WARNING|modeling_utils.py:388] 2022-03-10 22:38:34,571 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:38:20,379 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 874/17840 [1:17:55<27:15:16, 5.78s/it]g-point operations will not be computed-10 22:38:20,379 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 874/17840 [1:17:55<27:15:16, 5.78s/it]g-point operations will not be computed-10 22:38:20,379 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.4026, 'learning_rate': 2.622e-05, 'epoch': 0.98} +[WARNING|modeling_utils.py:388] 2022-03-10 22:38:40,215 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:38:20,379 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 875/17840 [1:18:01<27:39:37, 5.87s/it]g-point operations will not be computed-10 22:38:20,379 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 875/17840 [1:18:01<27:39:37, 5.87s/it]g-point operations will not be computed-10 22:38:20,379 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.5302, 'learning_rate': 2.625e-05, 'epoch': 0.98} +[WARNING|modeling_utils.py:388] 2022-03-10 22:38:46,321 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:38:20,379 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:38:46,321 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:38:20,379 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 876/17840 [1:18:07<27:19:04, 5.80s/it]g-point operations will not be computed-10 22:38:20,379 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:38:50,479 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:38:20,379 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:38:53,139 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:38:20,379 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:38:53,139 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:38:20,379 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.2191, 'learning_rate': 2.631e-05, 'epoch': 0.98} +[WARNING|modeling_utils.py:388] 2022-03-10 22:38:57,183 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:38:20,379 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 878/17840 [1:18:18<26:19:52, 5.59s/it]g-point operations will not be computed-10 22:38:20,379 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 878/17840 [1:18:18<26:19:52, 5.59s/it]g-point operations will not be computed-10 22:38:20,379 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:39:01,192 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:38:20,379 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:39:01,192 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:38:20,379 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:39:01,192 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:38:20,379 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 879/17840 [1:18:23<25:55:18, 5.50s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:39:05,100 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:39:07,611 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:39:05,100 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 880/17840 [1:18:28<25:19:30, 5.38s/it]g-point operations will not be computed-10 22:39:05,100 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 880/17840 [1:18:28<25:19:30, 5.38s/it]g-point operations will not be computed-10 22:39:05,100 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:39:11,410 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:39:05,100 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:39:11,410 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:39:05,100 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:39:11,410 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:39:05,100 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 881/17840 [1:18:33<24:44:45, 5.25s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:39:15,151 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:39:17,532 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:39:15,151 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 882/17840 [1:18:38<24:14:08, 5.14s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:39:19,983 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 882/17840 [1:18:38<24:14:08, 5.14s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:39:19,983 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.2953, 'learning_rate': 2.646e-05, 'epoch': 0.99} +[WARNING|modeling_utils.py:388] 2022-03-10 22:39:23,351 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:39:19,983 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:39:23,351 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:39:19,983 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:39:25,612 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:39:19,983 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:39:27,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:39:19,983 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:39:27,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:39:19,983 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:39:29,828 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:39:19,983 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:39:31,716 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:39:19,983 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:39:31,716 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:39:19,983 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:39:33,641 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:39:19,983 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:39:35,392 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:39:19,983 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:39:35,392 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:39:19,983 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:39:37,167 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:39:19,983 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:39:38,733 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:39:19,983 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:39:38,733 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:39:19,983 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:39:41,739 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:39:19,983 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:39:41,739 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:39:19,983 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:39:43,154 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:39:19,983 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:39:43,154 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:39:19,983 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:39:45,648 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:39:19,983 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:39:47,750 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:39:19,983 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:39:47,750 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:39:19,983 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:39:50,220 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:39:19,983 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:39:50,220 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:39:19,983 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.9657, 'learning_rate': 2.673e-05, 'epoch': 1.0} +{'loss': 5.6541, 'learning_rate': 2.676e-05, 'epoch': 1.0} +[WARNING|modeling_utils.py:388] 2022-03-10 22:39:54,014 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:39:19,983 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:39:54,014 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:39:19,983 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:39:57,407 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:39:19,983 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:39:57,407 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:39:19,983 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.8734, 'learning_rate': 2.6790000000000003e-05, 'epoch': 1.0} +[WARNING|modeling_utils.py:388] 2022-03-10 22:40:00,887 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:39:19,983 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:40:04,250 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:39:19,983 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:40:04,250 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:39:19,983 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.9303, 'learning_rate': 2.682e-05, 'epoch': 1.0} +[WARNING|modeling_utils.py:388] 2022-03-10 22:40:07,612 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:39:19,983 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:40:10,885 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:39:19,983 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:40:10,885 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:39:19,983 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:40:10,885 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:39:19,983 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:40:14,191 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:39:19,983 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:40:14,191 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:39:19,983 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 896/17840 [1:19:37<26:39:55, 5.67s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:40:19,089 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 896/17840 [1:19:37<26:39:55, 5.67s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:40:19,089 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.4885, 'learning_rate': 2.688e-05, 'epoch': 1.0} + 5%|███▋ | 896/17840 [1:19:37<26:39:55, 5.67s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:40:19,089 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 897/17840 [1:19:43<27:48:55, 5.91s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:40:19,089 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 897/17840 [1:19:43<27:48:55, 5.91s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:40:19,089 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.4402, 'learning_rate': 2.691e-05, 'epoch': 1.01} +[WARNING|modeling_utils.py:388] 2022-03-10 22:40:28,826 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:40:19,089 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 898/17840 [1:19:50<28:40:58, 6.09s/it]g-point operations will not be computed-10 22:40:19,089 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 898/17840 [1:19:50<28:40:58, 6.09s/it]g-point operations will not be computed-10 22:40:19,089 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.5345, 'learning_rate': 2.6940000000000003e-05, 'epoch': 1.01} +[WARNING|modeling_utils.py:388] 2022-03-10 22:40:35,239 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:40:19,089 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:40:35,239 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:40:19,089 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 899/17840 [1:19:56<29:04:26, 6.18s/it]g-point operations will not be computed-10 22:40:19,089 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 899/17840 [1:19:56<29:04:26, 6.18s/it]g-point operations will not be computed-10 22:40:19,089 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:40:41,625 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:40:19,089 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 900/17840 [1:20:03<30:01:18, 6.38s/it]g-point operations will not be computed-10 22:40:19,089 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 900/17840 [1:20:03<30:01:18, 6.38s/it]g-point operations will not be computed-10 22:40:19,089 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.4342, 'learning_rate': 2.7000000000000002e-05, 'epoch': 1.01} + 5%|███▋ | 900/17840 [1:20:03<30:01:18, 6.38s/it]g-point operations will not be computed-10 22:40:19,089 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 900/17840 [1:20:03<30:01:18, 6.38s/it]g-point operations will not be computed-10 22:40:19,089 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 900/17840 [1:20:03<30:01:18, 6.38s/it]g-point operations will not be computed-10 22:40:19,089 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 901/17840 [1:20:09<30:09:09, 6.41s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:40:51,812 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 901/17840 [1:20:09<30:09:09, 6.41s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:40:51,812 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 901/17840 [1:20:09<30:09:09, 6.41s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:40:51,812 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 901/17840 [1:20:09<30:09:09, 6.41s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:40:51,812 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 902/17840 [1:20:16<30:14:02, 6.43s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:40:51,812 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:40:59,765 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:40:51,812 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:40:59,765 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:40:51,812 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:40:59,765 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:40:51,812 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 903/17840 [1:20:22<29:59:35, 6.38s/it]g-point operations will not be computed-10 22:40:51,812 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:41:05,982 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:40:51,812 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:41:05,982 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:40:51,812 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:41:05,982 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:40:51,812 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▋ | 904/17840 [1:20:28<29:45:30, 6.33s/it]g-point operations will not be computed-10 22:40:51,812 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:41:12,200 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:40:51,812 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:41:12,200 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:40:51,812 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:41:12,200 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:40:51,812 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 905/17840 [1:20:34<29:37:10, 6.30s/it]g-point operations will not be computed-10 22:40:51,812 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:41:18,358 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:40:51,812 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:41:18,358 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:40:51,812 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:41:18,358 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:40:51,812 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 906/17840 [1:20:41<29:23:04, 6.25s/it]g-point operations will not be computed-10 22:40:51,812 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:41:24,457 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:40:51,812 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:41:24,457 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:40:51,812 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:41:24,457 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:40:51,812 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 907/17840 [1:20:47<29:06:57, 6.19s/it]g-point operations will not be computed-10 22:40:51,812 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:41:30,562 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:40:51,812 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:41:30,562 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:40:51,812 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:41:30,562 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:40:51,812 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 908/17840 [1:20:53<28:57:22, 6.16s/it]g-point operations will not be computed-10 22:40:51,812 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:41:36,607 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:40:51,812 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:41:36,607 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:40:51,812 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:41:36,607 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:40:51,812 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 909/17840 [1:20:59<28:51:20, 6.14s/it]g-point operations will not be computed-10 22:40:51,812 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:41:42,704 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:40:51,812 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:41:42,704 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:40:51,812 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:41:42,704 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:40:51,812 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 910/17840 [1:21:05<28:46:59, 6.12s/it]g-point operations will not be computed-10 22:40:51,812 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:41:48,695 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:40:51,812 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:41:48,695 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:40:51,812 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:41:48,695 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:40:51,812 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 911/17840 [1:21:11<28:33:33, 6.07s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:41:53,230 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 911/17840 [1:21:11<28:33:33, 6.07s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:41:53,230 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 911/17840 [1:21:11<28:33:33, 6.07s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:41:53,230 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 911/17840 [1:21:11<28:33:33, 6.07s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:41:53,230 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 912/17840 [1:21:17<28:21:41, 6.03s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:41:59,159 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 912/17840 [1:21:17<28:21:41, 6.03s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:41:59,159 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:42:03,608 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:41:59,159 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:42:03,608 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:41:59,159 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.235, 'learning_rate': 2.739e-05, 'epoch': 1.02} +[WARNING|modeling_utils.py:388] 2022-03-10 22:42:08,070 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:41:59,159 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 914/17840 [1:21:29<28:10:01, 5.99s/it]g-point operations will not be computed-10 22:41:59,159 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 914/17840 [1:21:29<28:10:01, 5.99s/it]g-point operations will not be computed-10 22:41:59,159 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.2791, 'learning_rate': 2.7420000000000002e-05, 'epoch': 1.02} +[WARNING|modeling_utils.py:388] 2022-03-10 22:42:13,921 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:41:59,159 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 915/17840 [1:21:35<27:54:14, 5.94s/it]g-point operations will not be computed-10 22:41:59,159 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 915/17840 [1:21:35<27:54:14, 5.94s/it]g-point operations will not be computed-10 22:41:59,159 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.0708, 'learning_rate': 2.7450000000000003e-05, 'epoch': 1.03} +[WARNING|modeling_utils.py:388] 2022-03-10 22:42:19,681 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:41:59,159 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 916/17840 [1:21:40<27:41:06, 5.89s/it]g-point operations will not be computed-10 22:41:59,159 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 916/17840 [1:21:40<27:41:06, 5.89s/it]g-point operations will not be computed-10 22:41:59,159 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:42:24,016 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:41:59,159 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:42:24,016 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:41:59,159 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 917/17840 [1:21:46<27:26:42, 5.84s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:42:28,292 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 917/17840 [1:21:46<27:26:42, 5.84s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:42:28,292 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.1343, 'learning_rate': 2.7510000000000003e-05, 'epoch': 1.03} +[WARNING|modeling_utils.py:388] 2022-03-10 22:42:32,514 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:42:28,292 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:42:32,514 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:42:28,292 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.2946, 'learning_rate': 2.754e-05, 'epoch': 1.03} +[WARNING|modeling_utils.py:388] 2022-03-10 22:42:32,514 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:42:28,292 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:42:38,174 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:42:28,292 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:42:38,174 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:42:28,292 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.3232, 'learning_rate': 2.7570000000000002e-05, 'epoch': 1.03} +[WARNING|modeling_utils.py:388] 2022-03-10 22:42:42,452 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:42:28,292 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 920/17840 [1:22:03<26:53:05, 5.72s/it]g-point operations will not be computed-10 22:42:28,292 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 920/17840 [1:22:03<26:53:05, 5.72s/it]g-point operations will not be computed-10 22:42:28,292 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:42:46,703 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:42:28,292 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:42:46,703 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:42:28,292 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:42:46,703 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:42:28,292 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 921/17840 [1:22:09<26:42:19, 5.68s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:42:50,855 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 921/17840 [1:22:09<26:42:19, 5.68s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:42:50,855 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:42:54,931 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:42:50,855 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:42:54,931 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:42:50,855 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.404, 'learning_rate': 2.7660000000000003e-05, 'epoch': 1.03} +[WARNING|modeling_utils.py:388] 2022-03-10 22:42:54,931 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:42:50,855 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:42:54,931 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:42:50,855 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:43:00,437 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:42:50,855 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:43:03,175 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:42:50,855 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:43:03,175 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:42:50,855 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:43:03,175 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:42:50,855 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 924/17840 [1:22:25<26:00:16, 5.53s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:43:07,234 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 924/17840 [1:22:25<26:00:16, 5.53s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:43:07,234 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:43:11,657 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:43:07,234 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:43:11,657 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:43:07,234 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.195, 'learning_rate': 2.7750000000000004e-05, 'epoch': 1.04} +[WARNING|modeling_utils.py:388] 2022-03-10 22:43:15,759 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:43:07,234 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:43:15,759 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:43:07,234 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 926/17840 [1:22:36<26:04:04, 5.55s/it]g-point operations will not be computed-10 22:43:07,234 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:43:19,639 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:43:07,234 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:43:22,106 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:43:07,234 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:43:22,106 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:43:07,234 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.2929, 'learning_rate': 2.7810000000000003e-05, 'epoch': 1.04} +[WARNING|modeling_utils.py:388] 2022-03-10 22:43:22,106 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:43:07,234 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:43:22,106 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:43:07,234 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:43:27,156 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:43:07,234 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:43:29,686 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:43:07,234 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:43:29,686 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:43:07,234 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:43:29,686 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:43:07,234 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 929/17840 [1:22:51<24:25:10, 5.20s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:43:33,413 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:43:35,764 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:43:33,413 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:43:35,764 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:43:33,413 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 930/17840 [1:22:56<23:53:37, 5.09s/it]g-point operations will not be computed-10 22:43:33,413 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:43:39,336 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:43:33,413 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:43:39,336 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:43:33,413 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:43:41,618 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:43:33,413 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:43:43,983 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:43:33,413 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:43:46,167 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:43:33,413 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:43:46,167 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:43:33,413 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.0005, 'learning_rate': 2.7960000000000003e-05, 'epoch': 1.04} +[WARNING|modeling_utils.py:388] 2022-03-10 22:43:49,497 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:43:33,413 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:43:49,497 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:43:33,413 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 933/17840 [1:23:10<22:03:57, 4.70s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:43:51,658 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:43:53,677 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:43:51,658 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:43:53,677 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:43:51,658 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▊ | 934/17840 [1:23:14<21:15:25, 4.53s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:43:55,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 935/17840 [1:23:18<20:17:57, 4.32s/it]g-point operations will not be computed-10 22:43:55,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 935/17840 [1:23:18<20:17:57, 4.32s/it]g-point operations will not be computed-10 22:43:55,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 935/17840 [1:23:18<20:17:57, 4.32s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:43:59,485 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 936/17840 [1:23:21<19:16:01, 4.10s/it]g-point operations will not be computed-10 22:43:59,485 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 936/17840 [1:23:21<19:16:01, 4.10s/it]g-point operations will not be computed-10 22:43:59,485 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:44:04,590 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:44:03,016 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:44:04,590 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:44:03,016 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 937/17840 [1:23:25<18:02:17, 3.84s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:44:06,142 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 938/17840 [1:23:27<16:37:50, 3.54s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:44:08,892 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 938/17840 [1:23:27<16:37:50, 3.54s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:44:08,892 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 939/17840 [1:23:30<15:02:32, 3.20s/it]g-point operations will not be computed-10 22:44:08,892 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 939/17840 [1:23:30<15:02:32, 3.20s/it]g-point operations will not be computed-10 22:44:08,892 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 940/17840 [1:23:32<13:32:23, 2.88s/it]g-point operations will not be computed-10 22:44:11,214 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 940/17840 [1:23:32<13:32:23, 2.88s/it]g-point operations will not be computed-10 22:44:11,214 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 941/17840 [1:23:34<12:08:06, 2.59s/it]g-point operations will not be computed-10 22:44:13,277 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 941/17840 [1:23:34<12:08:06, 2.59s/it]g-point operations will not be computed-10 22:44:13,277 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 942/17840 [1:23:35<10:53:44, 2.32s/it]g-point operations will not be computed-10 22:44:15,174 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 942/17840 [1:23:35<10:53:44, 2.32s/it]g-point operations will not be computed-10 22:44:15,174 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 942/17840 [1:23:35<10:53:44, 2.32s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:44:18,185 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 942/17840 [1:23:35<10:53:44, 2.32s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:44:18,185 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:44:21,550 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:44:18,185 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:44:21,550 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:44:18,185 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 943/17840 [1:23:42<17:20:52, 3.70s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:44:25,016 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 943/17840 [1:23:42<17:20:52, 3.70s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:44:25,016 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:44:28,374 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:44:25,016 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:44:28,374 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:44:25,016 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 944/17840 [1:23:49<21:43:09, 4.63s/it]g-point operations will not be computed-10 22:44:25,016 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 944/17840 [1:23:49<21:43:09, 4.63s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:44:31,725 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:44:35,043 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:44:31,725 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 945/17840 [1:23:56<24:34:44, 5.24s/it]g-point operations will not be computed-10 22:44:31,725 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 945/17840 [1:23:56<24:34:44, 5.24s/it]g-point operations will not be computed-10 22:44:31,725 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 945/17840 [1:23:56<24:34:44, 5.24s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:44:38,359 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:44:41,635 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:44:38,359 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 946/17840 [1:24:02<26:31:19, 5.65s/it]g-point operations will not be computed-10 22:44:38,359 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 946/17840 [1:24:02<26:31:19, 5.65s/it]g-point operations will not be computed-10 22:44:38,359 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 946/17840 [1:24:02<26:31:19, 5.65s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:44:45,055 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 946/17840 [1:24:02<26:31:19, 5.65s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:44:45,055 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:44:49,872 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:44:45,055 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:44:49,872 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:44:45,055 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.654, 'learning_rate': 2.841e-05, 'epoch': 1.06} +[WARNING|modeling_utils.py:388] 2022-03-10 22:44:49,872 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:44:45,055 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:44:49,872 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:44:45,055 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:44:49,872 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:44:45,055 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 948/17840 [1:24:16<28:45:28, 6.13s/it]g-point operations will not be computed-10 22:44:45,055 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:44:59,778 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:44:45,055 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:44:59,778 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:44:45,055 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 949/17840 [1:24:22<29:20:47, 6.25s/it]g-point operations will not be computed-10 22:44:45,055 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 949/17840 [1:24:22<29:20:47, 6.25s/it]g-point operations will not be computed-10 22:44:45,055 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.4299, 'learning_rate': 2.847e-05, 'epoch': 1.06} +[WARNING|modeling_utils.py:388] 2022-03-10 22:45:07,906 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:44:45,055 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 950/17840 [1:24:29<30:26:04, 6.49s/it]g-point operations will not be computed-10 22:44:45,055 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 950/17840 [1:24:29<30:26:04, 6.49s/it]g-point operations will not be computed-10 22:44:45,055 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.4866, 'learning_rate': 2.8499999999999998e-05, 'epoch': 1.07} + 5%|███▉ | 950/17840 [1:24:29<30:26:04, 6.49s/it]g-point operations will not be computed-10 22:44:45,055 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:45:16,457 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:44:45,055 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:45:16,457 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:44:45,055 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.0897, 'learning_rate': 2.853e-05, 'epoch': 1.07} +[WARNING|modeling_utils.py:388] 2022-03-10 22:45:16,457 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:44:45,055 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:45:16,457 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:44:45,055 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:45:16,457 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:44:45,055 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 952/17840 [1:24:42<30:17:53, 6.46s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:45:24,592 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 952/17840 [1:24:42<30:17:53, 6.46s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:45:24,592 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 952/17840 [1:24:42<30:17:53, 6.46s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:45:24,592 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 953/17840 [1:24:49<30:15:33, 6.45s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:45:30,973 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|█���█▉ | 953/17840 [1:24:49<30:15:33, 6.45s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:45:30,973 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.4175, 'learning_rate': 2.859e-05, 'epoch': 1.07} + 5%|███▉ | 953/17840 [1:24:49<30:15:33, 6.45s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:45:30,973 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 954/17840 [1:24:55<30:01:38, 6.40s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:45:30,973 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 954/17840 [1:24:55<30:01:38, 6.40s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:45:30,973 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:45:38,810 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:45:30,973 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:45:38,810 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:45:30,973 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 955/17840 [1:25:01<29:51:52, 6.37s/it]g-point operations will not be computed-10 22:45:30,973 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 955/17840 [1:25:01<29:51:52, 6.37s/it]g-point operations will not be computed-10 22:45:30,973 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:45:45,102 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:45:30,973 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:45:45,102 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:45:30,973 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 956/17840 [1:25:07<29:44:09, 6.34s/it]g-point operations will not be computed-10 22:45:30,973 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 956/17840 [1:25:07<29:44:09, 6.34s/it]g-point operations will not be computed-10 22:45:30,973 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:45:51,281 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:45:30,973 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:45:51,281 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:45:30,973 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 957/17840 [1:25:14<29:27:26, 6.28s/it]g-point operations will not be computed-10 22:45:30,973 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 957/17840 [1:25:14<29:27:26, 6.28s/it]g-point operations will not be computed-10 22:45:30,973 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:45:57,474 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:45:30,973 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:45:57,474 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:45:30,973 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 958/17840 [1:25:20<29:16:24, 6.24s/it]g-point operations will not be computed-10 22:45:30,973 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 958/17840 [1:25:20<29:16:24, 6.24s/it]g-point operations will not be computed-10 22:45:30,973 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.2993, 'learning_rate': 2.874e-05, 'epoch': 1.07} +[WARNING|modeling_utils.py:388] 2022-03-10 22:46:05,057 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:45:30,973 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 959/17840 [1:25:26<29:03:29, 6.20s/it]g-point operations will not be computed-10 22:45:30,973 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 959/17840 [1:25:26<29:03:29, 6.20s/it]g-point operations will not be computed-10 22:45:30,973 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.3628, 'learning_rate': 2.877e-05, 'epoch': 1.08} +[WARNING|modeling_utils.py:388] 2022-03-10 22:46:11,122 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:45:30,973 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 960/17840 [1:25:32<28:47:28, 6.14s/it]g-point operations will not be computed-10 22:45:30,973 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 960/17840 [1:25:32<28:47:28, 6.14s/it]g-point operations will not be computed-10 22:45:30,973 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:46:15,641 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:45:30,973 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:46:15,641 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:45:30,973 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 961/17840 [1:25:38<28:32:49, 6.09s/it]g-point operations will not be computed-10 22:45:30,973 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 961/17840 [1:25:38<28:32:49, 6.09s/it]g-point operations will not be computed-10 22:45:30,973 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:46:21,650 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:45:30,973 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:46:21,650 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:45:30,973 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 962/17840 [1:25:44<28:29:47, 6.08s/it]g-point operations will not be computed-10 22:45:30,973 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 962/17840 [1:25:44<28:29:47, 6.08s/it]g-point operations will not be computed-10 22:45:30,973 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:46:27,647 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:45:30,973 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:46:27,647 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:45:30,973 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 963/17840 [1:25:50<28:21:44, 6.05s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:46:32,131 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 963/17840 [1:25:50<28:21:44, 6.05s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:46:32,131 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.4272, 'learning_rate': 2.889e-05, 'epoch': 1.08} + 5%|███▉ | 963/17840 [1:25:50<28:21:44, 6.05s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:46:32,131 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 964/17840 [1:25:56<28:07:06, 6.00s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:46:38,006 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|███▉ | 964/17840 [1:25:56<28:07:06, 6.00s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:46:38,006 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.2172, 'learning_rate': 2.892e-05, 'epoch': 1.08} +[WARNING|modeling_utils.py:388] 2022-03-10 22:46:42,303 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:46:38,006 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:46:42,303 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:46:38,006 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.1887, 'learning_rate': 2.895e-05, 'epoch': 1.08} +[WARNING|modeling_utils.py:388] 2022-03-10 22:46:42,303 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:46:38,006 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:46:42,303 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:46:38,006 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:46:48,106 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:46:38,006 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:46:48,106 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:46:38,006 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:46:52,420 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:46:38,006 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:46:52,420 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:46:38,006 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|████ | 967/17840 [1:26:13<27:24:46, 5.85s/it]g-point operations will not be computed-10 22:46:38,006 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:46:56,702 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:46:38,006 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:46:56,702 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:46:38,006 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:46:56,702 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:46:38,006 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|████ | 968/17840 [1:26:19<27:09:30, 5.79s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:47:01,002 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|████ | 968/17840 [1:26:19<27:09:30, 5.79s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:47:01,002 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:47:05,136 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:47:01,002 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:47:05,136 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:47:01,002 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.3242, 'learning_rate': 2.907e-05, 'epoch': 1.09} +[WARNING|modeling_utils.py:388] 2022-03-10 22:47:05,136 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:47:01,002 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:47:05,136 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:47:01,002 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:47:10,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:47:01,002 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:47:10,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:47:01,002 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:47:14,943 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:47:01,002 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:47:14,943 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:47:01,002 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|████ | 971/17840 [1:26:35<26:31:37, 5.66s/it]g-point operations will not be computed-10 22:47:01,002 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:47:19,135 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:47:01,002 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:47:19,135 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:47:01,002 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:47:19,135 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:47:01,002 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|████ | 972/17840 [1:26:41<26:18:35, 5.62s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:47:23,228 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|████ | 972/17840 [1:26:41<26:18:35, 5.62s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:47:23,228 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:47:27,308 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:47:23,228 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:47:27,308 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:47:23,228 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.3106, 'learning_rate': 2.919e-05, 'epoch': 1.09} +[WARNING|modeling_utils.py:388] 2022-03-10 22:47:31,358 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:47:23,228 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:47:31,358 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:47:23,228 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|████ | 974/17840 [1:26:52<25:51:10, 5.52s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:47:34,084 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|████ | 974/17840 [1:26:52<25:51:10, 5.52s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:47:34,084 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|████ | 974/17840 [1:26:52<25:51:10, 5.52s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:47:34,084 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|████ | 974/17840 [1:26:52<25:51:10, 5.52s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:47:34,084 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|████ | 975/17840 [1:26:58<26:09:54, 5.59s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:47:39,837 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|████ | 975/17840 [1:26:58<26:09:54, 5.59s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:47:39,837 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:47:43,681 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:47:39,837 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:47:43,681 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:47:39,837 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:47:46,233 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:47:39,837 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:47:46,233 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:47:39,837 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:47:46,233 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:47:39,837 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|████ | 977/17840 [1:27:08<25:05:53, 5.36s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:47:50,077 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:47:52,509 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:47:50,077 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|████ | 978/17840 [1:27:13<24:35:49, 5.25s/it]g-point operations will not be computed-10 22:47:50,077 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|████ | 978/17840 [1:27:13<24:35:49, 5.25s/it]g-point operations will not be computed-10 22:47:50,077 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:47:56,236 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:47:50,077 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:47:58,631 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:47:50,077 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:47:58,631 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:47:50,077 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.2145, 'learning_rate': 2.9370000000000002e-05, 'epoch': 1.1} +[WARNING|modeling_utils.py:388] 2022-03-10 22:48:02,183 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:47:50,077 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:48:02,183 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:47:50,077 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|████ | 980/17840 [1:27:22<23:26:27, 5.01s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:48:04,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 5%|████ | 980/17840 [1:27:22<23:26:27, 5.01s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:48:04,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:48:07,843 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:48:04,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:48:07,843 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:48:04,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:48:10,089 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:48:04,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:48:12,189 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:48:04,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:48:12,189 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:48:04,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:48:14,285 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:48:04,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:48:16,206 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:48:04,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:48:16,206 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:48:04,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:48:18,139 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:48:04,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:48:19,956 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:48:04,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:48:19,956 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:48:04,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:48:21,820 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:48:04,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:48:25,282 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:48:04,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:48:25,282 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:48:04,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:48:26,825 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:48:04,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:48:26,825 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:48:04,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:48:28,355 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:48:04,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:48:28,355 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:48:04,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:48:31,027 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:48:04,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:48:33,360 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:48:04,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:48:33,360 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:48:04,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:48:35,501 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:48:04,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:48:35,501 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:48:04,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:48:37,324 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:48:04,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:48:37,324 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:48:04,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:48:39,019 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:48:04,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:48:39,019 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:48:04,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.543, 'learning_rate': 2.973e-05, 'epoch': 1.11} +[WARNING|modeling_utils.py:388] 2022-03-10 22:48:39,769 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:48:04,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:48:43,393 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:48:04,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:48:43,393 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:48:04,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:48:46,824 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:48:04,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:48:46,824 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:48:04,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.6938, 'learning_rate': 2.979e-05, 'epoch': 1.11} +[WARNING|modeling_utils.py:388] 2022-03-10 22:48:50,272 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:48:04,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:48:53,615 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:48:04,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:48:53,615 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:48:04,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.8028, 'learning_rate': 2.982e-05, 'epoch': 1.11} +[WARNING|modeling_utils.py:388] 2022-03-10 22:48:57,001 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:48:04,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:48:57,001 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:48:04,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:49:00,302 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:48:04,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:49:00,302 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:48:04,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:49:03,639 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:48:04,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:49:03,639 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:48:04,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:49:03,639 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:48:04,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:49:06,879 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:48:04,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:49:10,172 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:48:04,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:49:10,172 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:48:04,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:49:13,422 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:48:04,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:49:13,422 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:48:04,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.4902, 'learning_rate': 2.991e-05, 'epoch': 1.12} +[WARNING|modeling_utils.py:388] 2022-03-10 22:49:18,271 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:48:04,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:49:18,271 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:48:04,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 998/17840 [1:28:39<28:22:25, 6.06s/it]g-point operations will not be computed-10 22:48:04,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 998/17840 [1:28:39<28:22:25, 6.06s/it]g-point operations will not be computed-10 22:48:04,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 998/17840 [1:28:39<28:22:25, 6.06s/it]g-point operations will not be computed-10 22:48:04,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 998/17840 [1:28:39<28:22:25, 6.06s/it]g-point operations will not be computed-10 22:48:04,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:49:26,290 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:48:04,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:49:26,290 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:48:04,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:49:26,290 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:48:04,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:49:33,076 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:48:04,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:49:33,076 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:48:04,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.1305, 'learning_rate': 3e-05, 'epoch': 1.12} +[WARNING|modeling_utils.py:388] 2022-03-10 22:49:33,076 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:48:04,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:49:33,076 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:48:04,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:49:33,076 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:48:04,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████ | 1001/17840 [1:28:59<29:49:27, 6.38s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:49:41,097 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████ | 1001/17840 [1:28:59<29:49:27, 6.38s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:49:41,097 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████ | 1001/17840 [1:28:59<29:49:27, 6.38s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:49:41,097 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████ | 1001/17840 [1:28:59<29:49:27, 6.38s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:49:41,097 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████ | 1002/17840 [1:29:05<29:38:26, 6.34s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:49:47,380 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████ | 1002/17840 [1:29:05<29:38:26, 6.34s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:49:47,380 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████ | 1002/17840 [1:29:05<29:38:26, 6.34s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:49:47,380 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████ | 1002/17840 [1:29:05<29:38:26, 6.34s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:49:47,380 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████ | 1003/17840 [1:29:11<29:28:25, 6.30s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:49:53,601 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████ | 1003/17840 [1:29:11<29:28:25, 6.30s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:49:53,601 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████ | 1003/17840 [1:29:11<29:28:25, 6.30s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:49:53,601 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████ | 1003/17840 [1:29:11<29:28:25, 6.30s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:49:53,601 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████ | 1004/17840 [1:29:17<29:17:53, 6.26s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:49:53,601 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:50:01,314 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:49:53,601 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:50:01,314 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:49:53,601 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:50:01,314 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:49:53,601 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████ | 1005/17840 [1:29:24<29:18:41, 6.27s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:50:06,095 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████ | 1005/17840 [1:29:24<29:18:41, 6.27s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:50:06,095 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████ | 1005/17840 [1:29:24<29:18:41, 6.27s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:50:06,095 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████ | 1005/17840 [1:29:24<29:18:41, 6.27s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:50:06,095 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████ | 1006/17840 [1:29:30<29:11:00, 6.24s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:50:12,205 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████ | 1006/17840 [1:29:30<29:11:00, 6.24s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:50:12,205 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████ | 1006/17840 [1:29:30<29:11:00, 6.24s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:50:12,205 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████ | 1006/17840 [1:29:30<29:11:00, 6.24s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:50:12,205 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████ | 1007/17840 [1:29:36<29:02:38, 6.21s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:50:18,308 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████ | 1007/17840 [1:29:36<29:02:38, 6.21s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:50:18,308 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████ | 1007/17840 [1:29:36<29:02:38, 6.21s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:50:18,308 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████ | 1007/17840 [1:29:36<29:02:38, 6.21s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:50:18,308 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████ | 1008/17840 [1:29:42<28:49:15, 6.16s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:50:24,345 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████ | 1008/17840 [1:29:42<28:49:15, 6.16s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:50:24,345 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:50:28,789 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:50:24,345 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:50:28,789 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:50:24,345 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.2076, 'learning_rate': 2.998396674584323e-05, 'epoch': 1.13} +[WARNING|modeling_utils.py:388] 2022-03-10 22:50:28,789 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:50:24,345 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:50:28,789 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:50:24,345 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:50:28,789 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:50:24,345 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1010/17840 [1:29:54<28:24:11, 6.08s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:50:36,362 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1010/17840 [1:29:54<28:24:11, 6.08s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:50:36,362 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:50:40,794 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:50:36,362 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:50:40,794 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:50:36,362 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.2217, 'learning_rate': 2.998040380047506e-05, 'epoch': 1.13} +[WARNING|modeling_utils.py:388] 2022-03-10 22:50:45,297 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:50:36,362 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1012/17840 [1:30:06<28:10:37, 6.03s/it]g-point operations will not be computed-10 22:50:36,362 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1012/17840 [1:30:06<28:10:37, 6.03s/it]g-point operations will not be computed-10 22:50:36,362 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.3091, 'learning_rate': 2.9978622327790974e-05, 'epoch': 1.13} +[WARNING|modeling_utils.py:388] 2022-03-10 22:50:51,153 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:50:36,362 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1013/17840 [1:30:12<27:54:51, 5.97s/it]g-point operations will not be computed-10 22:50:36,362 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1013/17840 [1:30:12<27:54:51, 5.97s/it]g-point operations will not be computed-10 22:50:36,362 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.0609, 'learning_rate': 2.997684085510689e-05, 'epoch': 1.14} +[WARNING|modeling_utils.py:388] 2022-03-10 22:50:57,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:50:36,362 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1014/17840 [1:30:18<27:50:00, 5.96s/it]g-point operations will not be computed-10 22:50:36,362 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1014/17840 [1:30:18<27:50:00, 5.96s/it]g-point operations will not be computed-10 22:50:36,362 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:51:01,435 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:50:36,362 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:51:01,435 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:50:36,362 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1015/17840 [1:30:23<27:36:56, 5.91s/it]g-point operations will not be computed-10 22:50:36,362 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1015/17840 [1:30:23<27:36:56, 5.91s/it]g-point operations will not be computed-10 22:50:36,362 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:51:07,275 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:50:36,362 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:51:07,275 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:50:36,362 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:51:07,275 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:50:36,362 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1016/17840 [1:30:29<27:22:23, 5.86s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:51:11,531 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1016/17840 [1:30:29<27:22:23, 5.86s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:51:11,531 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1016/17840 [1:30:29<27:22:23, 5.86s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:51:11,531 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:51:15,702 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:51:11,531 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:51:15,702 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:51:11,531 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:51:15,702 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:51:11,531 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:51:15,702 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:51:11,531 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:51:21,385 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:51:11,531 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:51:24,197 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:51:11,531 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:51:24,197 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:51:11,531 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:51:24,197 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:51:11,531 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1019/17840 [1:30:46<26:40:00, 5.71s/it]g-point operations will not be computed-10 22:51:11,531 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:51:29,812 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:51:11,531 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:51:29,812 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:51:11,531 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:51:29,812 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:51:11,531 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1020/17840 [1:30:52<26:31:34, 5.68s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:51:34,040 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1020/17840 [1:30:52<26:31:34, 5.68s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:51:34,040 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:51:38,101 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:51:34,040 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:51:38,101 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:51:34,040 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.1667, 'learning_rate': 2.9962589073634204e-05, 'epoch': 1.14} +[WARNING|modeling_utils.py:388] 2022-03-10 22:51:42,273 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:51:34,040 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:51:42,273 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:51:34,040 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1022/17840 [1:31:03<26:10:39, 5.60s/it]g-point operations will not be computed-10 22:51:34,040 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1022/17840 [1:31:03<26:10:39, 5.60s/it]g-point operations will not be computed-10 22:51:34,040 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:51:47,755 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:51:34,040 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:51:47,755 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:51:34,040 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1023/17840 [1:31:08<25:57:24, 5.56s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:51:50,484 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1023/17840 [1:31:08<25:57:24, 5.56s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:51:50,484 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:51:54,469 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:51:50,484 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:51:54,469 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:51:50,484 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.2545, 'learning_rate': 2.9957244655581948e-05, 'epoch': 1.15} +[WARNING|modeling_utils.py:388] 2022-03-10 22:51:58,556 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:51:50,484 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1025/17840 [1:31:19<26:07:41, 5.59s/it]g-point operations will not be computed-10 22:51:50,484 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1025/17840 [1:31:19<26:07:41, 5.59s/it]g-point operations will not be computed-10 22:51:50,484 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:52:02,952 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:51:50,484 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:52:02,952 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:51:50,484 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:52:02,952 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:51:50,484 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1026/17840 [1:31:25<25:37:49, 5.49s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:52:06,827 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1026/17840 [1:31:25<25:37:49, 5.49s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:52:06,827 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:52:10,602 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:52:06,827 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:52:10,602 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:52:06,827 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:52:13,207 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:52:06,827 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:52:13,207 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:52:06,827 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:52:13,207 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:52:06,827 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1028/17840 [1:31:35<24:39:06, 5.28s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:52:16,980 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:52:19,377 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:52:16,980 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1029/17840 [1:31:40<24:08:03, 5.17s/it]g-point operations will not be computed-10 22:52:16,980 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1029/17840 [1:31:40<24:08:03, 5.17s/it]g-point operations will not be computed-10 22:52:16,980 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:52:23,016 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:52:16,980 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:52:25,349 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:52:16,980 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:52:25,349 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:52:16,980 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.1786, 'learning_rate': 2.9946555819477437e-05, 'epoch': 1.15} +[WARNING|modeling_utils.py:388] 2022-03-10 22:52:28,886 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:52:16,980 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:52:28,886 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:52:16,980 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1031/17840 [1:31:49<23:03:05, 4.94s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:52:31,229 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:52:33,427 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:52:31,229 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1032/17840 [1:31:54<22:22:55, 4.79s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:52:35,636 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1032/17840 [1:31:54<22:22:55, 4.79s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:52:35,636 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:52:37,706 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:52:35,636 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1033/17840 [1:31:58<21:37:33, 4.63s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:52:39,868 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1033/17840 [1:31:58<21:37:33, 4.63s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:52:39,868 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:52:41,837 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:52:39,868 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1034/17840 [1:32:02<20:49:04, 4.46s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:52:43,825 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1034/17840 [1:32:02<20:49:04, 4.46s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:52:43,825 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:52:45,639 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:52:43,825 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:52:45,639 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:52:43,825 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1035/17840 [1:32:06<19:49:49, 4.25s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:52:47,555 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:52:49,231 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:52:47,555 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:52:49,231 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:52:47,555 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1036/17840 [1:32:09<18:45:41, 4.02s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:52:50,902 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1037/17840 [1:32:12<17:29:35, 3.75s/it]g-point operations will not be computed-10 22:52:50,902 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1037/17840 [1:32:12<17:29:35, 3.75s/it]g-point operations will not be computed-10 22:52:50,902 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1038/17840 [1:32:15<15:58:36, 3.42s/it]g-point operations will not be computed-10 22:52:53,908 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▏ | 1038/17840 [1:32:15<15:58:36, 3.42s/it]g-point operations will not be computed-10 22:52:53,908 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:52:57,629 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:52:56,497 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:52:57,629 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:52:56,497 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:52:59,784 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:52:58,779 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:52:59,784 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:52:58,779 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:53:01,715 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:53:00,826 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:53:01,715 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:53:00,826 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1042/17840 [1:32:23<10:29:09, 2.25s/it]g-point operations will not be computed-10 22:53:02,636 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1042/17840 [1:32:23<10:29:09, 2.25s/it]g-point operations will not be computed-10 22:53:02,636 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1042/17840 [1:32:23<10:29:09, 2.25s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:53:05,615 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1042/17840 [1:32:23<10:29:09, 2.25s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:53:05,615 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:53:08,982 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:53:05,615 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:53:08,982 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:53:05,615 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1043/17840 [1:32:30<17:01:09, 3.65s/it]g-point operations will not be computed-10 22:53:05,615 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1043/17840 [1:32:30<17:01:09, 3.65s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:53:12,408 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:53:15,732 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:53:12,408 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1044/17840 [1:32:37<21:14:41, 4.55s/it]g-point operations will not be computed-10 22:53:12,408 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1044/17840 [1:32:37<21:14:41, 4.55s/it]g-point operations will not be computed-10 22:53:12,408 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1044/17840 [1:32:37<21:14:41, 4.55s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:53:19,061 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:53:22,371 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:53:19,061 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|█��██▎ | 1045/17840 [1:32:43<24:08:11, 5.17s/it]g-point operations will not be computed-10 22:53:19,061 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1045/17840 [1:32:43<24:08:11, 5.17s/it]g-point operations will not be computed-10 22:53:19,061 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1045/17840 [1:32:43<24:08:11, 5.17s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:53:25,659 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:53:28,897 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:53:25,659 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1046/17840 [1:32:50<26:03:58, 5.59s/it]g-point operations will not be computed-10 22:53:25,659 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1046/17840 [1:32:50<26:03:58, 5.59s/it]g-point operations will not be computed-10 22:53:25,659 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1046/17840 [1:32:50<26:03:58, 5.59s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:53:32,142 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1046/17840 [1:32:50<26:03:58, 5.59s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:53:32,142 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:53:36,989 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:53:32,142 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:53:36,989 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:53:32,142 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.5066, 'learning_rate': 2.991627078384798e-05, 'epoch': 1.17} +[WARNING|modeling_utils.py:388] 2022-03-10 22:53:36,989 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:53:32,142 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:53:36,989 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:53:32,142 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1048/17840 [1:33:03<28:11:04, 6.04s/it]g-point operations will not be computed-10 22:53:32,142 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1048/17840 [1:33:03<28:11:04, 6.04s/it]g-point operations will not be computed-10 22:53:32,142 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:53:46,707 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:53:32,142 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:53:46,707 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:53:32,142 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1049/17840 [1:33:09<28:39:25, 6.14s/it]g-point operations will not be computed-10 22:53:32,142 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1049/17840 [1:33:09<28:39:25, 6.14s/it]g-point operations will not be computed-10 22:53:32,142 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:53:53,072 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:53:32,142 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:53:53,072 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:53:32,142 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1050/17840 [1:33:16<29:33:18, 6.34s/it]g-point operations will not be computed-10 22:53:32,142 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1050/17840 [1:33:16<29:33:18, 6.34s/it]g-point operations will not be computed-10 22:53:32,142 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.1865, 'learning_rate': 2.9910926365795728e-05, 'epoch': 1.18} + 6%|████▎ | 1050/17840 [1:33:16<29:33:18, 6.34s/it]g-point operations will not be computed-10 22:53:32,142 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:54:03,037 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:53:32,142 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:54:03,037 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:53:32,142 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.1958, 'learning_rate': 2.990914489311164e-05, 'epoch': 1.18} +[WARNING|modeling_utils.py:388] 2022-03-10 22:54:03,037 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:53:32,142 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:54:09,328 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:53:32,142 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:54:09,328 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:53:32,142 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.3965, 'learning_rate': 2.990736342042755e-05, 'epoch': 1.18} +[WARNING|modeling_utils.py:388] 2022-03-10 22:54:09,328 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:53:32,142 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:54:15,579 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:53:32,142 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:54:15,579 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:53:32,142 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.2306, 'learning_rate': 2.990558194774347e-05, 'epoch': 1.18} +[WARNING|modeling_utils.py:388] 2022-03-10 22:54:15,579 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:53:32,142 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:54:21,779 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:53:32,142 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:54:21,779 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:53:32,142 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.3773, 'learning_rate': 2.990380047505938e-05, 'epoch': 1.18} +[WARNING|modeling_utils.py:388] 2022-03-10 22:54:21,779 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:53:32,142 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:54:27,914 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:53:32,142 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:54:27,914 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:53:32,142 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.1611, 'learning_rate': 2.99020190023753e-05, 'epoch': 1.18} +[WARNING|modeling_utils.py:388] 2022-03-10 22:54:27,914 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:53:32,142 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:54:34,160 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:53:32,142 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:54:34,160 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:53:32,142 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.1622, 'learning_rate': 2.990023752969121e-05, 'epoch': 1.18} +[WARNING|modeling_utils.py:388] 2022-03-10 22:54:34,160 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:53:32,142 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:54:34,160 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:53:32,142 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:54:34,160 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:53:32,142 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1057/17840 [1:33:59<28:48:03, 6.18s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:54:41,808 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1057/17840 [1:33:59<28:48:03, 6.18s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:54:41,808 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1057/17840 [1:33:59<28:48:03, 6.18s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:54:41,808 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1057/17840 [1:33:59<28:48:03, 6.18s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:54:41,808 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1058/17840 [1:34:05<28:41:28, 6.15s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:54:47,855 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1058/17840 [1:34:05<28:41:28, 6.15s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:54:47,855 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:54:52,290 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:54:47,855 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:54:52,290 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:54:47,855 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.0988, 'learning_rate': 2.9894893111638958e-05, 'epoch': 1.19} +[WARNING|modeling_utils.py:388] 2022-03-10 22:54:52,290 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:54:47,855 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:54:58,267 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:54:47,855 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:54:58,267 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:54:47,855 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.0928, 'learning_rate': 2.989311163895487e-05, 'epoch': 1.19} +[WARNING|modeling_utils.py:388] 2022-03-10 22:54:58,267 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:54:47,855 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:54:58,267 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:54:47,855 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:55:04,322 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:54:47,855 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:55:04,322 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:54:47,855 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:55:08,808 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:54:47,855 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:55:08,808 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:54:47,855 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1062/17840 [1:34:29<28:06:47, 6.03s/it]g-point operations will not be computed-10 22:54:47,855 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1062/17840 [1:34:29<28:06:47, 6.03s/it]g-point operations will not be computed-10 22:54:47,855 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:55:14,826 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:54:47,855 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:55:14,826 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:54:47,855 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1063/17840 [1:34:35<28:04:35, 6.02s/it]g-point operations will not be computed-10 22:54:47,855 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1063/17840 [1:34:35<28:04:35, 6.02s/it]g-point operations will not be computed-10 22:54:47,855 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:55:20,755 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:54:47,855 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:55:20,755 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:54:47,855 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1064/17840 [1:34:41<27:53:29, 5.99s/it]g-point operations will not be computed-10 22:54:47,855 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:55:25,183 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:54:47,855 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:55:25,183 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:54:47,855 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:55:25,183 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:54:47,855 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1065/17840 [1:34:47<27:46:01, 5.96s/it]g-point operations will not be computed-10 22:54:47,855 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:55:31,078 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:54:47,855 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:55:31,078 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:54:47,855 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:55:31,078 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:54:47,855 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1066/17840 [1:34:53<27:38:08, 5.93s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:55:35,456 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1066/17840 [1:34:53<27:38:08, 5.93s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:55:35,456 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:55:39,775 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:55:35,456 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:55:39,775 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:55:35,456 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.9859, 'learning_rate': 2.9880641330166272e-05, 'epoch': 1.2} +[WARNING|modeling_utils.py:388] 2022-03-10 22:55:39,775 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:55:35,456 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:55:45,495 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:55:35,456 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:55:45,495 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:55:35,456 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.0189, 'learning_rate': 2.9878859857482187e-05, 'epoch': 1.2} +[WARNING|modeling_utils.py:388] 2022-03-10 22:55:49,831 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:55:35,456 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1069/17840 [1:35:10<27:04:47, 5.81s/it]g-point operations will not be computed-10 22:55:35,456 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▎ | 1069/17840 [1:35:10<27:04:47, 5.81s/it]g-point operations will not be computed-10 22:55:35,456 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:55:54,072 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:55:35,456 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:55:54,072 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:55:35,456 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:55:54,072 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:55:35,456 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1070/17840 [1:35:16<26:45:21, 5.74s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:55:58,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1070/17840 [1:35:16<26:45:21, 5.74s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:55:58,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:56:02,376 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:55:58,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:56:02,376 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:55:58,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.2003, 'learning_rate': 2.9873515439429928e-05, 'epoch': 1.2} +[WARNING|modeling_utils.py:388] 2022-03-10 22:56:06,537 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:55:58,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1072/17840 [1:35:27<26:14:40, 5.63s/it]g-point operations will not be computed-10 22:55:58,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1072/17840 [1:35:27<26:14:40, 5.63s/it]g-point operations will not be computed-10 22:55:58,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:56:10,666 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:55:58,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:56:10,666 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:55:58,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:56:10,666 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:55:58,274 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1073/17840 [1:35:33<26:02:37, 5.59s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:56:14,789 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1073/17840 [1:35:33<26:02:37, 5.59s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:56:14,789 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:56:18,692 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:56:14,789 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:56:18,692 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:56:14,789 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.9879, 'learning_rate': 2.9868171021377672e-05, 'epoch': 1.2} +[WARNING|modeling_utils.py:388] 2022-03-10 22:56:22,707 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:56:14,789 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1075/17840 [1:35:44<25:57:50, 5.58s/it]g-point operations will not be computed-10 22:56:14,789 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1075/17840 [1:35:44<25:57:50, 5.58s/it]g-point operations will not be computed-10 22:56:14,789 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.0389, 'learning_rate': 2.9866389548693587e-05, 'epoch': 1.21} +[WARNING|modeling_utils.py:388] 2022-03-10 22:56:28,385 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:56:14,789 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:56:28,385 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:56:14,789 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1076/17840 [1:35:49<25:29:22, 5.47s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:56:30,995 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:56:33,486 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:56:30,995 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1077/17840 [1:35:54<24:53:00, 5.34s/it]g-point operations will not be computed-10 22:56:30,995 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1077/17840 [1:35:54<24:53:00, 5.34s/it]g-point operations will not be computed-10 22:56:30,995 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:56:37,258 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:56:30,995 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:56:37,258 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:56:30,995 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:56:37,258 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:56:30,995 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1078/17840 [1:35:59<24:21:40, 5.23s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:56:40,932 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:56:43,327 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:56:40,932 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1079/17840 [1:36:04<23:48:56, 5.12s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:56:45,778 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1079/17840 [1:36:04<23:48:56, 5.12s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:56:45,778 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.2413, 'learning_rate': 2.9859263657957246e-05, 'epoch': 1.21} +[WARNING|modeling_utils.py:388] 2022-03-10 22:56:49,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:56:45,778 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:56:49,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:56:45,778 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.0885, 'learning_rate': 2.985748218527316e-05, 'epoch': 1.21} +[WARNING|modeling_utils.py:388] 2022-03-10 22:56:52,771 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:56:45,778 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1081/17840 [1:36:13<22:47:56, 4.90s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:56:55,089 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1081/17840 [1:36:13<22:47:56, 4.90s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:56:55,089 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:56:57,245 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:56:55,089 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1082/17840 [1:36:17<22:07:02, 4.75s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:56:59,427 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1082/17840 [1:36:17<22:07:02, 4.75s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:56:59,427 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:57:01,510 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:56:59,427 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1083/17840 [1:36:22<21:20:21, 4.58s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:57:03,577 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1083/17840 [1:36:22<21:20:21, 4.58s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:57:03,577 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:57:05,526 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:57:03,577 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1084/17840 [1:36:26<20:27:25, 4.40s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:57:07,446 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1084/17840 [1:36:26<20:27:25, 4.40s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:57:07,446 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:57:09,184 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:57:07,446 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:57:09,184 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:57:07,446 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1085/17840 [1:36:29<19:19:47, 4.15s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:57:10,986 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1086/17840 [1:36:33<18:13:26, 3.92s/it]g-point operations will not be computed-10 22:57:10,986 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1086/17840 [1:36:33<18:13:26, 3.92s/it]g-point operations will not be computed-10 22:57:10,986 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:57:15,739 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:57:14,249 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1087/17840 [1:36:36<17:00:27, 3.65s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:57:17,243 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1087/17840 [1:36:36<17:00:27, 3.65s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:57:17,243 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1088/17840 [1:36:38<15:47:38, 3.39s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:57:19,941 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1088/17840 [1:36:38<15:47:38, 3.39s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:57:19,941 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1089/17840 [1:36:41<14:31:38, 3.12s/it]g-point operations will not be computed-10 22:57:19,941 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1089/17840 [1:36:41<14:31:38, 3.12s/it]g-point operations will not be computed-10 22:57:19,941 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:57:23,441 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:57:22,357 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:57:23,441 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:57:22,357 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:57:25,432 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:57:24,507 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:57:25,432 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:57:24,507 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1092/17840 [1:36:47<10:47:38, 2.32s/it]g-point operations will not be computed-10 22:57:26,412 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1092/17840 [1:36:47<10:47:38, 2.32s/it]g-point operations will not be computed-10 22:57:26,412 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1092/17840 [1:36:47<10:47:38, 2.32s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:57:29,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1092/17840 [1:36:47<10:47:38, 2.32s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:57:29,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:57:32,871 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:57:29,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:57:32,871 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:57:29,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1093/17840 [1:36:54<17:15:29, 3.71s/it]g-point operations will not be computed-10 22:57:29,440 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1093/17840 [1:36:54<17:15:29, 3.71s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:57:36,290 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:57:39,602 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:57:36,290 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1094/17840 [1:37:00<21:27:30, 4.61s/it]g-point operations will not be computed-10 22:57:36,290 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1094/17840 [1:37:00<21:27:30, 4.61s/it]g-point operations will not be computed-10 22:57:36,290 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1094/17840 [1:37:00<21:27:30, 4.61s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:57:42,983 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:57:46,267 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:57:42,983 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1095/17840 [1:37:07<24:14:00, 5.21s/it]g-point operations will not be computed-10 22:57:42,983 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1095/17840 [1:37:07<24:14:00, 5.21s/it]g-point operations will not be computed-10 22:57:42,983 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1095/17840 [1:37:07<24:14:00, 5.21s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:57:49,593 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:57:52,807 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:57:49,593 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1096/17840 [1:37:14<26:07:15, 5.62s/it]g-point operations will not be computed-10 22:57:49,593 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1096/17840 [1:37:14<26:07:15, 5.62s/it]g-point operations will not be computed-10 22:57:49,593 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1096/17840 [1:37:14<26:07:15, 5.62s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:57:56,119 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1096/17840 [1:37:14<26:07:15, 5.62s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:57:56,119 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:58:01,055 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:57:56,119 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:58:01,055 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:57:56,119 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:58:01,055 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:57:56,119 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.5431, 'learning_rate': 2.9827197149643708e-05, 'epoch': 1.23} +[WARNING|modeling_utils.py:388] 2022-03-10 22:58:01,055 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:57:56,119 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1098/17840 [1:37:27<28:23:33, 6.11s/it]g-point operations will not be computed-10 22:57:56,119 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1098/17840 [1:37:27<28:23:33, 6.11s/it]g-point operations will not be computed-10 22:57:56,119 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:58:10,883 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:57:56,119 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:58:10,883 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:57:56,119 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1099/17840 [1:37:33<28:52:29, 6.21s/it]g-point operations will not be computed-10 22:57:56,119 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▍ | 1099/17840 [1:37:33<28:52:29, 6.21s/it]g-point operations will not be computed-10 22:57:56,119 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:58:17,298 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:57:56,119 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:58:17,298 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:57:56,119 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:58:17,298 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:57:56,119 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1100/17840 [1:37:40<29:49:33, 6.41s/it]g-point operations will not be computed-10 22:57:56,119 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1100/17840 [1:37:40<29:49:33, 6.41s/it]g-point operations will not be computed-10 22:57:56,119 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1100/17840 [1:37:40<29:49:33, 6.41s/it]g-point operations will not be computed-10 22:57:56,119 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1100/17840 [1:37:40<29:49:33, 6.41s/it]g-point operations will not be computed-10 22:57:56,119 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:58:27,371 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:57:56,119 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:58:27,371 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:57:56,119 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:58:27,371 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:57:56,119 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:58:33,703 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:57:56,119 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:58:33,703 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:57:56,119 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.0777, 'learning_rate': 2.981828978622328e-05, 'epoch': 1.24} +[WARNING|modeling_utils.py:388] 2022-03-10 22:58:33,703 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:57:56,119 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:58:39,993 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:57:56,119 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:58:39,993 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:57:56,119 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.9565, 'learning_rate': 2.9816508313539193e-05, 'epoch': 1.24} +[WARNING|modeling_utils.py:388] 2022-03-10 22:58:39,993 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:57:56,119 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:58:39,993 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:57:56,119 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:58:39,993 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:57:56,119 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1104/17840 [1:38:05<29:29:29, 6.34s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:58:47,935 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1104/17840 [1:38:05<29:29:29, 6.34s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:58:47,935 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1104/17840 [1:38:05<29:29:29, 6.34s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:58:47,935 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1104/17840 [1:38:05<29:29:29, 6.34s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:58:47,935 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1105/17840 [1:38:12<29:20:28, 6.31s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:58:54,133 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1105/17840 [1:38:12<29:20:28, 6.31s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:58:54,133 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1105/17840 [1:38:12<29:20:28, 6.31s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:58:54,133 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1105/17840 [1:38:12<29:20:28, 6.31s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:58:54,133 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1106/17840 [1:38:18<29:08:38, 6.27s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:59:00,276 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1106/17840 [1:38:18<29:08:38, 6.27s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:59:00,276 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1106/17840 [1:38:18<29:08:38, 6.27s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:59:00,276 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1106/17840 [1:38:18<29:08:38, 6.27s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:59:00,276 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1107/17840 [1:38:24<28:55:37, 6.22s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:59:06,414 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1107/17840 [1:38:24<28:55:37, 6.22s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:59:06,414 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1107/17840 [1:38:24<28:55:37, 6.22s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:59:06,414 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1107/17840 [1:38:24<28:55:37, 6.22s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:59:06,414 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1108/17840 [1:38:30<28:48:01, 6.20s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:59:12,546 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1108/17840 [1:38:30<28:48:01, 6.20s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:59:12,546 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1108/17840 [1:38:30<28:48:01, 6.20s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:59:12,546 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1108/17840 [1:38:30<28:48:01, 6.20s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:59:12,546 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1109/17840 [1:38:36<28:45:32, 6.19s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:59:12,546 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:59:20,288 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:59:12,546 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:59:20,288 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:59:12,546 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:59:20,288 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:59:12,546 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1110/17840 [1:38:42<28:37:51, 6.16s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:59:24,825 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1110/17840 [1:38:42<28:37:51, 6.16s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:59:24,825 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1110/17840 [1:38:42<28:37:51, 6.16s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:59:24,825 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1110/17840 [1:38:42<28:37:51, 6.16s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:59:24,825 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1111/17840 [1:38:49<28:33:16, 6.14s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:59:30,892 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1111/17840 [1:38:49<28:33:16, 6.14s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:59:30,892 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1111/17840 [1:38:49<28:33:16, 6.14s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:59:30,892 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1111/17840 [1:38:49<28:33:16, 6.14s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:59:30,892 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1112/17840 [1:38:55<28:22:14, 6.11s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:59:36,883 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1112/17840 [1:38:55<28:22:14, 6.11s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:59:36,883 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1112/17840 [1:38:55<28:22:14, 6.11s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:59:36,883 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:59:41,323 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:59:36,883 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:59:41,323 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:59:36,883 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:59:41,323 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:59:36,883 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:59:41,323 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:59:36,883 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:59:41,323 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:59:36,883 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1114/17840 [1:39:06<28:05:29, 6.05s/it][WARNING|modeling_utils.py:388] 2022-03-10 22:59:48,910 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:59:51,850 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:59:48,910 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:59:51,850 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:59:48,910 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1115/17840 [1:39:12<28:01:18, 6.03s/it]g-point operations will not be computed-10 22:59:48,910 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1115/17840 [1:39:12<28:01:18, 6.03s/it]g-point operations will not be computed-10 22:59:48,910 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1115/17840 [1:39:12<28:01:18, 6.03s/it]g-point operations will not be computed-10 22:59:48,910 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1115/17840 [1:39:12<28:01:18, 6.03s/it]g-point operations will not be computed-10 22:59:48,910 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:59:59,152 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:59:48,910 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 22:59:59,152 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:59:48,910 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:00:03,553 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:59:48,910 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:00:03,553 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:59:48,910 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1117/17840 [1:39:24<27:31:22, 5.92s/it]g-point operations will not be computed-10 22:59:48,910 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1117/17840 [1:39:24<27:31:22, 5.92s/it]g-point operations will not be computed-10 22:59:48,910 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:00:09,364 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:59:48,910 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:00:09,364 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:59:48,910 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1118/17840 [1:39:30<27:23:16, 5.90s/it]g-point operations will not be computed-10 22:59:48,910 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:00:13,701 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:59:48,910 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:00:13,701 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:59:48,910 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:00:13,701 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 22:59:48,910 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1119/17840 [1:39:36<27:12:18, 5.86s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:00:18,058 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1119/17840 [1:39:36<27:12:18, 5.86s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:00:18,058 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:00:22,273 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:00:18,058 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:00:22,273 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:00:18,058 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.003, 'learning_rate': 2.9786223277909737e-05, 'epoch': 1.26} +[WARNING|modeling_utils.py:388] 2022-03-10 23:00:26,550 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:00:18,058 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1121/17840 [1:39:47<26:45:14, 5.76s/it]g-point operations will not be computed-10 23:00:18,058 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1121/17840 [1:39:47<26:45:14, 5.76s/it]g-point operations will not be computed-10 23:00:18,058 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:00:30,766 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:00:18,058 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:00:30,766 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:00:18,058 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:00:30,766 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:00:18,058 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1122/17840 [1:39:53<26:27:08, 5.70s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:00:34,905 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1122/17840 [1:39:53<26:27:08, 5.70s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:00:34,905 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:00:38,989 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:00:34,905 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:00:38,989 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:00:34,905 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.097, 'learning_rate': 2.9780878859857485e-05, 'epoch': 1.26} +[WARNING|modeling_utils.py:388] 2022-03-10 23:00:43,171 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:00:34,905 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1124/17840 [1:40:04<26:03:55, 5.61s/it]g-point operations will not be computed-10 23:00:34,905 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1124/17840 [1:40:04<26:03:55, 5.61s/it]g-point operations will not be computed-10 23:00:34,905 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:00:47,294 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:00:34,905 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:00:47,294 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:00:34,905 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1125/17840 [1:40:10<26:17:53, 5.66s/it]g-point operations will not be computed-10 23:00:34,905 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1125/17840 [1:40:10<26:17:53, 5.66s/it]g-point operations will not be computed-10 23:00:34,905 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:00:53,000 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:00:34,905 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:00:55,527 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:00:34,905 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:00:55,527 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:00:34,905 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.2069, 'learning_rate': 2.9775534441805226e-05, 'epoch': 1.26} +[WARNING|modeling_utils.py:388] 2022-03-10 23:00:59,418 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:00:34,905 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1127/17840 [1:40:20<25:08:10, 5.41s/it]g-point operations will not be computed-10 23:00:34,905 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1127/17840 [1:40:20<25:08:10, 5.41s/it]g-point operations will not be computed-10 23:00:34,905 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:01:03,315 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:00:34,905 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:01:05,744 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:00:34,905 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:01:05,744 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:00:34,905 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.1118, 'learning_rate': 2.9771971496437055e-05, 'epoch': 1.26} +[WARNING|modeling_utils.py:388] 2022-03-10 23:01:09,468 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:00:34,905 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1129/17840 [1:40:30<24:04:27, 5.19s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:01:11,915 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▌ | 1129/17840 [1:40:30<24:04:27, 5.19s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:01:11,915 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.1537, 'learning_rate': 2.977019002375297e-05, 'epoch': 1.27} +[WARNING|modeling_utils.py:388] 2022-03-10 23:01:15,395 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:01:11,915 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:01:15,395 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:01:11,915 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.9541, 'learning_rate': 2.9768408551068885e-05, 'epoch': 1.27} + 6%|████▋ | 1131/17840 [1:40:39<22:59:39, 4.95s/it]g-point operations will not be computed-10 23:01:11,915 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1131/17840 [1:40:39<22:59:39, 4.95s/it]g-point operations will not be computed-10 23:01:11,915 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1131/17840 [1:40:39<22:59:39, 4.95s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:01:21,266 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:01:23,419 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:01:21,266 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1132/17840 [1:40:44<22:10:24, 4.78s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:01:25,631 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1132/17840 [1:40:44<22:10:24, 4.78s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:01:25,631 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:01:27,690 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:01:25,631 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1133/17840 [1:40:48<21:22:20, 4.61s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:01:29,712 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1133/17840 [1:40:48<21:22:20, 4.61s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:01:29,712 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1134/17840 [1:40:52<20:11:08, 4.35s/it]g-point operations will not be computed-10 23:01:29,712 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1134/17840 [1:40:52<20:11:08, 4.35s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:01:33,374 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1134/17840 [1:40:52<20:11:08, 4.35s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:01:33,374 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1135/17840 [1:40:55<18:58:11, 4.09s/it]g-point operations will not be computed-10 23:01:33,374 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1135/17840 [1:40:55<18:58:11, 4.09s/it]g-point operations will not be computed-10 23:01:33,374 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:01:38,377 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:01:36,801 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1136/17840 [1:40:58<17:47:12, 3.83s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:01:39,985 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1136/17840 [1:40:58<17:47:12, 3.83s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:01:39,985 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1137/17840 [1:41:01<16:30:37, 3.56s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:01:42,809 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1137/17840 [1:41:01<16:30:37, 3.56s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:01:42,809 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1138/17840 [1:41:04<15:13:54, 3.28s/it]g-point operations will not be computed-10 23:01:42,809 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:01:46,477 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:01:45,360 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:01:46,477 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:01:45,360 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:01:48,637 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:01:47,622 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:01:48,637 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:01:47,622 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:01:50,593 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:01:49,702 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:01:50,593 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:01:49,702 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1142/17840 [1:41:12<10:24:14, 2.24s/it]g-point operations will not be computed-10 23:01:51,535 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1142/17840 [1:41:12<10:24:14, 2.24s/it]g-point operations will not be computed-10 23:01:51,535 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1142/17840 [1:41:12<10:24:14, 2.24s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:01:54,552 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1142/17840 [1:41:12<10:24:14, 2.24s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:01:54,552 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.8846, 'learning_rate': 2.9747030878859858e-05, 'epoch': 1.28} +[WARNING|modeling_utils.py:388] 2022-03-10 23:01:57,945 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:01:54,552 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1143/17840 [1:41:19<16:55:19, 3.65s/it]g-point operations will not be computed-10 23:01:54,552 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1143/17840 [1:41:19<16:55:19, 3.65s/it]g-point operations will not be computed-10 23:01:54,552 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1143/17840 [1:41:19<16:55:19, 3.65s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:02:01,383 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:02:04,688 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:02:01,383 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1144/17840 [1:41:26<21:09:32, 4.56s/it]g-point operations will not be computed-10 23:02:01,383 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1144/17840 [1:41:26<21:09:32, 4.56s/it]g-point operations will not be computed-10 23:02:01,383 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1144/17840 [1:41:26<21:09:32, 4.56s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:02:08,065 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1144/17840 [1:41:26<21:09:32, 4.56s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:02:08,065 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + g-point operations will not be computed-10 23:02:08,065 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + g-point operations will not be computed-10 23:02:08,065 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1145/17840 [1:41:32<24:04:12, 5.19s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:02:14,720 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1145/17840 [1:41:32<24:04:12, 5.19s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:02:14,720 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:02:18,011 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:02:14,720 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1146/17840 [1:41:39<26:02:45, 5.62s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:02:21,337 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1146/17840 [1:41:39<26:02:45, 5.62s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:02:21,337 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.5664, 'learning_rate': 2.9739904988123517e-05, 'epoch': 1.28} +[WARNING|modeling_utils.py:388] 2022-03-10 23:02:24,582 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:02:21,337 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1147/17840 [1:41:45<27:21:52, 5.90s/it]g-point operations will not be computed-10 23:02:21,337 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1147/17840 [1:41:45<27:21:52, 5.90s/it]g-point operations will not be computed-10 23:02:21,337 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:02:29,597 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:02:21,337 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:02:29,597 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:02:21,337 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:02:29,597 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:02:21,337 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1148/17840 [1:41:52<28:23:46, 6.12s/it]g-point operations will not be computed-10 23:02:21,337 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:02:36,085 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:02:21,337 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:02:36,085 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:02:21,337 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:02:36,085 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:02:21,337 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1149/17840 [1:41:58<28:50:01, 6.22s/it]g-point operations will not be computed-10 23:02:21,337 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1149/17840 [1:41:58<28:50:01, 6.22s/it]g-point operations will not be computed-10 23:02:21,337 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:02:44,162 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:02:21,337 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1150/17840 [1:42:05<29:49:42, 6.43s/it]g-point operations will not be computed-10 23:02:21,337 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1150/17840 [1:42:05<29:49:42, 6.43s/it]g-point operations will not be computed-10 23:02:21,337 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.2102, 'learning_rate': 2.9732779097387176e-05, 'epoch': 1.29} + 6%|████▋ | 1150/17840 [1:42:05<29:49:42, 6.43s/it]g-point operations will not be computed-10 23:02:21,337 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1150/17840 [1:42:05<29:49:42, 6.43s/it]g-point operations will not be computed-10 23:02:21,337 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1150/17840 [1:42:05<29:49:42, 6.43s/it]g-point operations will not be computed-10 23:02:21,337 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1151/17840 [1:42:12<29:55:07, 6.45s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:02:54,387 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1151/17840 [1:42:12<29:55:07, 6.45s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:02:54,387 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1151/17840 [1:42:12<29:55:07, 6.45s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:02:54,387 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1151/17840 [1:42:12<29:55:07, 6.45s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:02:54,387 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1152/17840 [1:42:18<29:54:05, 6.45s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:03:00,784 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1152/17840 [1:42:18<29:54:05, 6.45s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:03:00,784 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1152/17840 [1:42:18<29:54:05, 6.45s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:03:00,784 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1152/17840 [1:42:18<29:54:05, 6.45s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:03:00,784 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1153/17840 [1:42:25<29:39:55, 6.40s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:03:07,053 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1153/17840 [1:42:25<29:39:55, 6.40s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:03:07,053 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1153/17840 [1:42:25<29:39:55, 6.40s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:03:07,053 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1153/17840 [1:42:25<29:39:55, 6.40s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:03:07,053 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1154/17840 [1:42:31<29:24:48, 6.35s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:03:07,053 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:03:14,823 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:03:07,053 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:03:14,823 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:03:07,053 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:03:14,823 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:03:07,053 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1155/17840 [1:42:37<29:18:00, 6.32s/it]g-point operations will not be computed-10 23:03:07,053 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:03:21,066 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:03:07,053 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:03:21,066 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:03:07,053 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:03:21,066 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:03:07,053 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1156/17840 [1:42:43<29:08:44, 6.29s/it]g-point operations will not be computed-10 23:03:07,053 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:03:27,215 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:03:07,053 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:03:27,215 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:03:07,053 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:03:27,215 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:03:07,053 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1157/17840 [1:42:49<28:54:56, 6.24s/it]g-point operations will not be computed-10 23:03:07,053 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:03:33,383 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:03:07,053 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:03:33,383 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:03:07,053 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:03:33,383 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:03:07,053 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1158/17840 [1:42:56<28:46:59, 6.21s/it]g-point operations will not be computed-10 23:03:07,053 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:03:39,431 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:03:07,053 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:03:39,431 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:03:07,053 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:03:39,431 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:03:07,053 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 6%|████▋ | 1159/17840 [1:43:02<28:30:54, 6.15s/it]g-point operations will not be computed-10 23:03:07,053 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:03:45,507 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:03:07,053 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:03:45,507 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:03:07,053 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:03:45,507 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:03:07,053 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▋ | 1160/17840 [1:43:08<28:23:44, 6.13s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:03:50,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▋ | 1160/17840 [1:43:08<28:23:44, 6.13s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:03:50,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▋ | 1160/17840 [1:43:08<28:23:44, 6.13s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:03:50,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▋ | 1160/17840 [1:43:08<28:23:44, 6.13s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:03:50,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1161/17840 [1:43:14<28:11:58, 6.09s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:03:50,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:03:57,480 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:03:50,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:03:57,480 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:03:50,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:03:57,480 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:03:50,045 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1162/17840 [1:43:20<28:01:14, 6.05s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:04:01,980 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1162/17840 [1:43:20<28:01:14, 6.05s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:04:01,980 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1162/17840 [1:43:20<28:01:14, 6.05s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:04:01,980 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1162/17840 [1:43:20<28:01:14, 6.05s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:04:01,980 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1163/17840 [1:43:26<27:56:57, 6.03s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:04:07,946 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1163/17840 [1:43:26<27:56:57, 6.03s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:04:07,946 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:04:12,284 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:04:07,946 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:04:12,284 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:04:07,946 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.0078, 'learning_rate': 2.9707838479809976e-05, 'epoch': 1.3} +[WARNING|modeling_utils.py:388] 2022-03-10 23:04:12,284 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:04:07,946 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:04:18,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:04:07,946 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:04:18,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:04:07,946 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.0641, 'learning_rate': 2.9706057007125894e-05, 'epoch': 1.31} +[WARNING|modeling_utils.py:388] 2022-03-10 23:04:22,468 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:04:07,946 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1166/17840 [1:43:43<27:13:40, 5.88s/it]g-point operations will not be computed-10 23:04:07,946 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1166/17840 [1:43:43<27:13:40, 5.88s/it]g-point operations will not be computed-10 23:04:07,946 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:04:26,768 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:04:07,946 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:04:26,768 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:04:07,946 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1167/17840 [1:43:49<27:03:56, 5.84s/it]g-point operations will not be computed-10 23:04:07,946 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1167/17840 [1:43:49<27:03:56, 5.84s/it]g-point operations will not be computed-10 23:04:07,946 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:04:32,485 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:04:07,946 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:04:32,485 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:04:07,946 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:04:32,485 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:04:07,946 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1168/17840 [1:43:54<26:49:18, 5.79s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:04:36,819 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1168/17840 [1:43:54<26:49:18, 5.79s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:04:36,819 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1168/17840 [1:43:54<26:49:18, 5.79s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:04:36,819 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1168/17840 [1:43:54<26:49:18, 5.79s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:04:36,819 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1169/17840 [1:44:00<26:44:45, 5.78s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:04:42,499 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:04:45,217 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:04:42,499 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1170/17840 [1:44:06<26:25:32, 5.71s/it]g-point operations will not be computed-10 23:04:42,499 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1170/17840 [1:44:06<26:25:32, 5.71s/it]g-point operations will not be computed-10 23:04:42,499 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.1472, 'learning_rate': 2.9697149643705465e-05, 'epoch': 1.31} +[WARNING|modeling_utils.py:388] 2022-03-10 23:04:50,822 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:04:42,499 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1171/17840 [1:44:11<26:15:28, 5.67s/it]g-point operations will not be computed-10 23:04:42,499 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1171/17840 [1:44:11<26:15:28, 5.67s/it]g-point operations will not be computed-10 23:04:42,499 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:04:54,990 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:04:42,499 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:04:54,990 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:04:42,499 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:04:54,990 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:04:42,499 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1172/17840 [1:44:17<26:05:03, 5.63s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:04:59,147 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1172/17840 [1:44:17<26:05:03, 5.63s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:04:59,147 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:05:03,214 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:04:59,147 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:05:03,214 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:04:59,147 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.0924, 'learning_rate': 2.9691805225653205e-05, 'epoch': 1.32} +[WARNING|modeling_utils.py:388] 2022-03-10 23:05:07,352 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:04:59,147 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1174/17840 [1:44:28<25:43:35, 5.56s/it]g-point operations will not be computed-10 23:04:59,147 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1174/17840 [1:44:28<25:43:35, 5.56s/it]g-point operations will not be computed-10 23:04:59,147 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:05:11,393 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:04:59,147 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:05:11,393 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:04:59,147 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1175/17840 [1:44:34<26:00:00, 5.62s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:05:15,826 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1175/17840 [1:44:34<26:00:00, 5.62s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:05:15,826 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.0753, 'learning_rate': 2.9688242280285035e-05, 'epoch': 1.32} +[WARNING|modeling_utils.py:388] 2022-03-10 23:05:19,676 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:05:15,826 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:05:19,676 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:05:15,826 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:05:22,279 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:05:15,826 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:05:22,279 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:05:15,826 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1177/17840 [1:44:44<24:53:08, 5.38s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:05:26,072 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1177/17840 [1:44:44<24:53:08, 5.38s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:05:26,072 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.192, 'learning_rate': 2.9684679334916864e-05, 'epoch': 1.32} +[WARNING|modeling_utils.py:388] 2022-03-10 23:05:29,700 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:05:26,072 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:05:29,700 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:05:26,072 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:05:32,177 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:05:26,072 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:05:34,572 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:05:26,072 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:05:34,572 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:05:26,072 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.1233, 'learning_rate': 2.9681116389548694e-05, 'epoch': 1.32} +[WARNING|modeling_utils.py:388] 2022-03-10 23:05:38,148 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:05:26,072 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:05:38,148 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:05:26,072 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1180/17840 [1:44:58<23:12:24, 5.01s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:05:40,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:05:42,760 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:05:40,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:05:42,760 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:05:40,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▊ | 1181/17840 [1:45:03<22:35:25, 4.88s/it]g-point operations will not be computed-10 23:05:40,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:05:46,104 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:05:40,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:05:46,104 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:05:40,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:05:48,151 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:05:40,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:05:50,253 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:05:40,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:05:50,253 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:05:40,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:05:52,252 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:05:40,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:05:54,220 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:05:40,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:05:54,220 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:05:40,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:05:56,007 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:05:40,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:05:57,815 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:05:40,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:05:57,815 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:05:40,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:06:01,151 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:05:40,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:06:02,679 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:05:40,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:06:02,679 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:05:40,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:06:04,203 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:05:40,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:06:04,203 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:05:40,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:06:06,884 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:05:40,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:06:06,884 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:05:40,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:06:08,106 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:05:40,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:06:08,106 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:05:40,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:06:10,462 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:05:40,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:06:10,462 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:05:40,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:06:12,576 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:05:40,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:06:12,576 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:05:40,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:06:15,281 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:05:40,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:06:15,281 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:05:40,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:06:16,001 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:05:40,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:06:16,001 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:05:40,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:06:19,591 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:05:40,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:06:19,591 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:05:40,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:06:22,988 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:05:40,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:06:22,988 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:05:40,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:06:26,416 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:05:40,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:06:26,416 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:05:40,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:06:26,416 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:05:40,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:06:29,746 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:05:40,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:06:33,151 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:05:40,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:06:33,151 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:05:40,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:06:33,151 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:05:40,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:06:36,474 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:05:40,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:06:36,474 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:05:40,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:06:39,933 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:05:40,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:06:39,933 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:05:40,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:06:43,139 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:05:40,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:06:43,139 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:05:40,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:06:46,508 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:05:40,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:06:49,739 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:05:40,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:06:49,739 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:05:40,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.3939, 'learning_rate': 2.9649049881235156e-05, 'epoch': 1.34} +[WARNING|modeling_utils.py:388] 2022-03-10 23:06:49,739 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:05:40,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:06:49,739 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:05:40,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:06:49,739 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:05:40,524 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1198/17840 [1:46:15<28:15:18, 6.11s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:06:57,972 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1198/17840 [1:46:15<28:15:18, 6.11s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:06:57,972 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1198/17840 [1:46:15<28:15:18, 6.11s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:06:57,972 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1198/17840 [1:46:15<28:15:18, 6.11s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:06:57,972 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1199/17840 [1:46:22<28:49:56, 6.24s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:06:57,972 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1199/17840 [1:46:22<28:49:56, 6.24s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:06:57,972 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:07:07,631 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:06:57,972 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1200/17840 [1:46:29<29:42:48, 6.43s/it]g-point operations will not be computed-10 23:06:57,972 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1200/17840 [1:46:29<29:42:48, 6.43s/it]g-point operations will not be computed-10 23:06:57,972 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.2941, 'learning_rate': 2.9643705463182897e-05, 'epoch': 1.35} + 7%|████▉ | 1200/17840 [1:46:29<29:42:48, 6.43s/it]g-point operations will not be computed-10 23:06:57,972 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:07:16,197 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:06:57,972 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:07:16,197 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:06:57,972 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.1355, 'learning_rate': 2.9641923990498815e-05, 'epoch': 1.35} +[WARNING|modeling_utils.py:388] 2022-03-10 23:07:16,197 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:06:57,972 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:07:22,549 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:06:57,972 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:07:22,549 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:06:57,972 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.1867, 'learning_rate': 2.9640142517814726e-05, 'epoch': 1.35} +[WARNING|modeling_utils.py:388] 2022-03-10 23:07:25,748 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:06:57,972 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:07:25,748 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:06:57,972 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:07:25,748 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:06:57,972 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1203/17840 [1:46:48<29:28:38, 6.38s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:07:30,465 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1203/17840 [1:46:48<29:28:38, 6.38s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:07:30,465 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1203/17840 [1:46:48<29:28:38, 6.38s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:07:30,465 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1203/17840 [1:46:48<29:28:38, 6.38s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:07:30,465 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1204/17840 [1:46:54<29:16:17, 6.33s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:07:36,663 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1204/17840 [1:46:54<29:16:17, 6.33s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:07:36,663 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1204/17840 [1:46:54<29:16:17, 6.33s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:07:36,663 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1204/17840 [1:46:54<29:16:17, 6.33s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:07:36,663 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1205/17840 [1:47:00<29:05:07, 6.29s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:07:36,663 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:07:44,468 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:07:36,663 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:07:44,468 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:07:36,663 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:07:44,468 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:07:36,663 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1206/17840 [1:47:07<29:04:09, 6.29s/it]g-point operations will not be computed-10 23:07:36,663 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:07:50,607 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:07:36,663 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:07:50,607 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:07:36,663 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:07:50,607 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:07:36,663 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1207/17840 [1:47:13<28:51:23, 6.25s/it]g-point operations will not be computed-10 23:07:36,663 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:07:56,752 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:07:36,663 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:07:56,752 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:07:36,663 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:07:56,752 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:07:36,663 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1208/17840 [1:47:19<28:38:55, 6.20s/it]g-point operations will not be computed-10 23:07:36,663 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:08:02,842 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:07:36,663 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:08:02,842 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:07:36,663 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:08:02,842 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:07:36,663 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1209/17840 [1:47:25<28:28:21, 6.16s/it]g-point operations will not be computed-10 23:07:36,663 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:08:08,909 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:07:36,663 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:08:08,909 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:07:36,663 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:08:08,909 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:07:36,663 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1210/17840 [1:47:31<28:15:14, 6.12s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:08:13,395 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1210/17840 [1:47:31<28:15:14, 6.12s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:08:13,395 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1210/17840 [1:47:31<28:15:14, 6.12s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:08:13,395 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1210/17840 [1:47:31<28:15:14, 6.12s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:08:13,395 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1211/17840 [1:47:37<28:02:31, 6.07s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:08:19,397 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1211/17840 [1:47:37<28:02:31, 6.07s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:08:19,397 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1211/17840 [1:47:37<28:02:31, 6.07s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:08:19,397 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1211/17840 [1:47:37<28:02:31, 6.07s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:08:19,397 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1212/17840 [1:47:43<27:54:22, 6.04s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:08:25,360 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1212/17840 [1:47:43<27:54:22, 6.04s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:08:25,360 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:08:29,811 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:08:25,360 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:08:29,811 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:08:25,360 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.133, 'learning_rate': 2.9620546318289785e-05, 'epoch': 1.36} +[WARNING|modeling_utils.py:388] 2022-03-10 23:08:29,811 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:08:25,360 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:08:35,800 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:08:25,360 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:08:35,800 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:08:25,360 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.0731, 'learning_rate': 2.9618764845605703e-05, 'epoch': 1.36} +[WARNING|modeling_utils.py:388] 2022-03-10 23:08:40,246 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:08:25,360 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1215/17840 [1:48:01<27:39:01, 5.99s/it]g-point operations will not be computed-10 23:08:25,360 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1215/17840 [1:48:01<27:39:01, 5.99s/it]g-point operations will not be computed-10 23:08:25,360 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.1957, 'learning_rate': 2.9616983372921615e-05, 'epoch': 1.36} + 7%|████▉ | 1215/17840 [1:48:01<27:39:01, 5.99s/it]g-point operations will not be computed-10 23:08:25,360 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:08:47,558 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:08:25,360 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:08:47,558 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:08:25,360 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.9928, 'learning_rate': 2.9615201900237533e-05, 'epoch': 1.36} +[WARNING|modeling_utils.py:388] 2022-03-10 23:08:51,988 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:08:25,360 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1217/17840 [1:48:13<27:15:54, 5.90s/it]g-point operations will not be computed-10 23:08:25,360 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1217/17840 [1:48:13<27:15:54, 5.90s/it]g-point operations will not be computed-10 23:08:25,360 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:08:56,240 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:08:25,360 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:08:56,240 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:08:25,360 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:08:56,240 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:08:25,360 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1218/17840 [1:48:18<26:59:44, 5.85s/it]g-point operations will not be computed-10 23:08:25,360 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:09:01,993 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:08:25,360 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:09:01,993 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:08:25,360 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:09:01,993 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:08:25,360 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1219/17840 [1:48:24<26:52:58, 5.82s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:09:06,346 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1219/17840 [1:48:24<26:52:58, 5.82s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:09:06,346 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:09:10,562 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:09:06,346 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:09:10,562 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:09:06,346 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.9934, 'learning_rate': 2.960807600950119e-05, 'epoch': 1.37} +[WARNING|modeling_utils.py:388] 2022-03-10 23:09:14,809 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:09:06,346 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1221/17840 [1:48:35<26:30:24, 5.74s/it]g-point operations will not be computed-10 23:09:06,346 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|████▉ | 1221/17840 [1:48:35<26:30:24, 5.74s/it]g-point operations will not be computed-10 23:09:06,346 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.0687, 'learning_rate': 2.9606294536817103e-05, 'epoch': 1.37} +[WARNING|modeling_utils.py:388] 2022-03-10 23:09:20,383 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:09:06,346 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1222/17840 [1:48:41<26:12:52, 5.68s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:09:23,191 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1222/17840 [1:48:41<26:12:52, 5.68s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:09:23,191 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.0115, 'learning_rate': 2.9604513064133018e-05, 'epoch': 1.37} +[WARNING|modeling_utils.py:388] 2022-03-10 23:09:27,282 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:09:23,191 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:09:27,282 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:09:23,191 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.8958, 'learning_rate': 2.9602731591448933e-05, 'epoch': 1.37} +[WARNING|modeling_utils.py:388] 2022-03-10 23:09:31,375 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:09:23,191 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:09:31,375 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:09:23,191 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1224/17840 [1:48:52<25:45:40, 5.58s/it]g-point operations will not be computed-10 23:09:23,191 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:09:35,428 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:09:23,191 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:09:35,428 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:09:23,191 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:09:35,428 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:09:23,191 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1225/17840 [1:48:58<26:03:55, 5.65s/it]g-point operations will not be computed-10 23:09:23,191 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:09:41,303 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:09:23,191 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:09:43,841 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:09:23,191 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:09:43,841 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:09:23,191 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.1473, 'learning_rate': 2.9597387173396674e-05, 'epoch': 1.37} +[WARNING|modeling_utils.py:388] 2022-03-10 23:09:47,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:09:23,191 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:09:47,735 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:09:23,191 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1227/17840 [1:49:08<25:02:58, 5.43s/it]g-point operations will not be computed-10 23:09:23,191 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:09:51,574 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:09:23,191 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:09:51,574 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:09:23,191 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:09:51,574 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:09:23,191 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1228/17840 [1:49:13<24:36:11, 5.33s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:09:55,404 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:09:57,868 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:09:55,404 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:09:57,868 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:09:55,404 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1229/17840 [1:49:18<24:08:06, 5.23s/it]g-point operations will not be computed-10 23:09:55,404 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:10:01,531 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:09:55,404 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:10:01,531 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:09:55,404 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:10:03,900 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:09:55,404 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:10:03,900 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:09:55,404 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:10:07,509 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:09:55,404 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:10:07,509 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:09:55,404 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1231/17840 [1:49:28<23:04:30, 5.00s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:10:09,888 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:10:12,153 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:10:09,888 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:10:12,153 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:10:09,888 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1232/17840 [1:49:32<22:30:24, 4.88s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:10:14,398 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:10:16,497 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:10:14,398 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:10:16,497 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:10:14,398 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1233/17840 [1:49:37<21:38:48, 4.69s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:10:18,589 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:10:20,568 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:10:18,589 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:10:20,568 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:10:18,589 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1234/17840 [1:49:41<20:42:06, 4.49s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:10:22,510 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:10:24,286 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:10:22,510 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:10:24,286 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:10:22,510 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1235/17840 [1:49:44<19:30:42, 4.23s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:10:26,088 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1236/17840 [1:49:48<18:20:03, 3.98s/it]g-point operations will not be computed-10 23:10:26,088 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1236/17840 [1:49:48<18:20:03, 3.98s/it]g-point operations will not be computed-10 23:10:26,088 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:10:30,907 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:10:29,391 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:10:30,907 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:10:29,391 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1237/17840 [1:49:51<17:08:19, 3.72s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:10:32,450 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1238/17840 [1:49:54<15:53:52, 3.45s/it]g-point operations will not be computed-10 23:10:32,450 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1238/17840 [1:49:54<15:53:52, 3.45s/it]g-point operations will not be computed-10 23:10:32,450 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + g-point operations will not be computed-10 23:10:35,177 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + g-point operations will not be computed-10 23:10:35,177 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:10:38,767 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:10:37,667 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:10:38,767 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:10:37,667 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:10:40,828 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:10:39,898 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:10:40,828 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:10:39,898 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1242/17840 [1:50:02<10:50:54, 2.35s/it]g-point operations will not be computed-10 23:10:41,793 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1242/17840 [1:50:02<10:50:54, 2.35s/it]g-point operations will not be computed-10 23:10:41,793 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1242/17840 [1:50:02<10:50:54, 2.35s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:10:44,975 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1242/17840 [1:50:02<10:50:54, 2.35s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:10:44,975 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:10:48,396 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:10:44,975 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:10:48,396 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:10:44,975 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1243/17840 [1:50:09<17:32:40, 3.81s/it]g-point operations will not be computed-10 23:10:44,975 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1243/17840 [1:50:09<17:32:40, 3.81s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:10:51,950 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:10:55,205 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:10:51,950 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1244/17840 [1:50:16<21:28:41, 4.66s/it]g-point operations will not be computed-10 23:10:51,950 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1244/17840 [1:50:16<21:28:41, 4.66s/it]g-point operations will not be computed-10 23:10:51,950 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1244/17840 [1:50:16<21:28:41, 4.66s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:10:58,569 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1244/17840 [1:50:16<21:28:41, 4.66s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:10:58,569 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:11:01,807 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:10:58,569 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:11:01,807 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:10:58,569 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1245/17840 [1:50:23<24:09:17, 5.24s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:11:05,115 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1245/17840 [1:50:23<24:09:17, 5.24s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:11:05,115 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:11:08,413 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:11:05,115 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:11:08,413 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:11:05,115 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1246/17840 [1:50:29<26:02:27, 5.65s/it]g-point operations will not be computed-10 23:11:05,115 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:11:13,347 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:11:05,115 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:11:13,347 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:11:05,115 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:11:13,347 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:11:05,115 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1247/17840 [1:50:36<27:16:39, 5.92s/it]g-point operations will not be computed-10 23:11:05,115 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:11:19,905 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:11:05,115 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:11:19,905 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:11:05,115 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1248/17840 [1:50:42<28:08:29, 6.11s/it]g-point operations will not be computed-10 23:11:05,115 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1248/17840 [1:50:42<28:08:29, 6.11s/it]g-point operations will not be computed-10 23:11:05,115 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.2825, 'learning_rate': 2.9558194774346795e-05, 'epoch': 1.4} +[WARNING|modeling_utils.py:388] 2022-03-10 23:11:27,985 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:11:05,115 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1249/17840 [1:50:49<28:36:24, 6.21s/it]g-point operations will not be computed-10 23:11:05,115 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1249/17840 [1:50:49<28:36:24, 6.21s/it]g-point operations will not be computed-10 23:11:05,115 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.1802, 'learning_rate': 2.9556413301662706e-05, 'epoch': 1.4} + 7%|█████ | 1249/17840 [1:50:49<28:36:24, 6.21s/it]g-point operations will not be computed-10 23:11:05,115 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1249/17840 [1:50:49<28:36:24, 6.21s/it]g-point operations will not be computed-10 23:11:05,115 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1249/17840 [1:50:49<28:36:24, 6.21s/it]g-point operations will not be computed-10 23:11:05,115 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1250/17840 [1:50:56<29:29:00, 6.40s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:11:38,131 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1250/17840 [1:50:56<29:29:00, 6.40s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:11:38,131 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1250/17840 [1:50:56<29:29:00, 6.40s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:11:38,131 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1250/17840 [1:50:56<29:29:00, 6.40s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:11:38,131 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1251/17840 [1:51:02<29:33:53, 6.42s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:11:38,131 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:11:46,129 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:11:38,131 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:11:46,129 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:11:38,131 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:11:46,129 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:11:38,131 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████ | 1252/17840 [1:51:08<29:34:52, 6.42s/it]g-point operations will not be computed-10 23:11:38,131 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:11:52,482 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:11:38,131 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:11:52,482 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:11:38,131 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1253/17840 [1:51:15<29:25:29, 6.39s/it]g-point operations will not be computed-10 23:11:38,131 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1253/17840 [1:51:15<29:25:29, 6.39s/it]g-point operations will not be computed-10 23:11:38,131 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:11:58,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:11:38,131 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:11:58,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:11:38,131 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████�� | 1254/17840 [1:51:21<29:08:56, 6.33s/it]g-point operations will not be computed-10 23:11:38,131 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1254/17840 [1:51:21<29:08:56, 6.33s/it]g-point operations will not be computed-10 23:11:38,131 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:12:04,971 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:11:38,131 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:12:04,971 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:11:38,131 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1255/17840 [1:51:27<28:57:38, 6.29s/it]g-point operations will not be computed-10 23:11:38,131 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1255/17840 [1:51:27<28:57:38, 6.29s/it]g-point operations will not be computed-10 23:11:38,131 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:12:11,134 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:11:38,131 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:12:11,134 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:11:38,131 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1256/17840 [1:51:33<28:50:06, 6.26s/it]g-point operations will not be computed-10 23:11:38,131 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1256/17840 [1:51:33<28:50:06, 6.26s/it]g-point operations will not be computed-10 23:11:38,131 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:12:17,352 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:11:38,131 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:12:17,352 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:11:38,131 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1257/17840 [1:51:40<28:49:21, 6.26s/it]g-point operations will not be computed-10 23:11:38,131 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1257/17840 [1:51:40<28:49:21, 6.26s/it]g-point operations will not be computed-10 23:11:38,131 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:12:23,504 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:11:38,131 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:12:23,504 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:11:38,131 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1258/17840 [1:51:46<28:32:02, 6.19s/it]g-point operations will not be computed-10 23:11:38,131 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1258/17840 [1:51:46<28:32:02, 6.19s/it]g-point operations will not be computed-10 23:11:38,131 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:12:29,562 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:11:38,131 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:12:29,562 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:11:38,131 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1259/17840 [1:51:52<28:23:27, 6.16s/it]g-point operations will not be computed-10 23:11:38,131 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1259/17840 [1:51:52<28:23:27, 6.16s/it]g-point operations will not be computed-10 23:11:38,131 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:12:35,650 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:11:38,131 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:12:35,650 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:11:38,131 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1260/17840 [1:51:58<28:16:54, 6.14s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:12:40,239 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1260/17840 [1:51:58<28:16:54, 6.14s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:12:40,239 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.9883, 'learning_rate': 2.9536817102137765e-05, 'epoch': 1.41} + 7%|█████▏ | 1260/17840 [1:51:58<28:16:54, 6.14s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:12:40,239 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1261/17840 [1:52:04<28:14:19, 6.13s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:12:40,239 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1261/17840 [1:52:04<28:14:19, 6.13s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:12:40,239 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:12:47,817 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:12:40,239 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:12:47,817 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:12:40,239 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1262/17840 [1:52:10<28:08:14, 6.11s/it]g-point operations will not be computed-10 23:12:40,239 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1262/17840 [1:52:10<28:08:14, 6.11s/it]g-point operations will not be computed-10 23:12:40,239 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:12:53,867 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:12:40,239 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:12:53,867 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:12:40,239 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:12:53,867 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:12:40,239 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1263/17840 [1:52:16<27:59:12, 6.08s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:12:58,394 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1263/17840 [1:52:16<27:59:12, 6.08s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:12:58,394 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1263/17840 [1:52:16<27:59:12, 6.08s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:12:58,394 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1263/17840 [1:52:16<27:59:12, 6.08s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:12:58,394 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1264/17840 [1:52:22<27:53:40, 6.06s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:13:04,363 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:13:07,283 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:13:04,363 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:13:07,283 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:13:04,363 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1265/17840 [1:52:28<27:37:00, 6.00s/it]g-point operations will not be computed-10 23:13:04,363 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1265/17840 [1:52:28<27:37:00, 6.00s/it]g-point operations will not be computed-10 23:13:04,363 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1265/17840 [1:52:28<27:37:00, 6.00s/it]g-point operations will not be computed-10 23:13:04,363 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1265/17840 [1:52:28<27:37:00, 6.00s/it]g-point operations will not be computed-10 23:13:04,363 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:13:14,516 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:13:04,363 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:13:14,516 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:13:04,363 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:13:18,895 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:13:04,363 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:13:18,895 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:13:04,363 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1267/17840 [1:52:39<27:09:50, 5.90s/it]g-point operations will not be computed-10 23:13:04,363 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:13:23,212 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:13:04,363 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:13:23,212 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:13:04,363 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:13:23,212 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:13:04,363 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1268/17840 [1:52:45<26:53:54, 5.84s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:13:27,489 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1268/17840 [1:52:45<26:53:54, 5.84s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:13:27,489 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:13:31,673 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:13:27,489 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:13:31,673 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:13:27,489 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.9841, 'learning_rate': 2.9520783847981e-05, 'epoch': 1.42} +[WARNING|modeling_utils.py:388] 2022-03-10 23:13:31,673 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:13:27,489 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:13:37,336 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:13:27,489 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:13:37,336 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:13:27,489 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.9508, 'learning_rate': 2.9519002375296913e-05, 'epoch': 1.42} +[WARNING|modeling_utils.py:388] 2022-03-10 23:13:41,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:13:27,489 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:13:41,518 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:13:27,489 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1271/17840 [1:53:02<26:13:23, 5.70s/it]g-point operations will not be computed-10 23:13:27,489 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:13:45,752 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:13:27,489 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:13:45,752 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:13:27,489 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:13:45,752 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:13:27,489 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1272/17840 [1:53:08<25:59:43, 5.65s/it]g-point operations will not be computed-10 23:13:27,489 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:13:51,266 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:13:27,489 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:13:53,963 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:13:27,489 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:13:53,963 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:13:27,489 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.9581, 'learning_rate': 2.9513657957244657e-05, 'epoch': 1.43} +[WARNING|modeling_utils.py:388] 2022-03-10 23:13:58,044 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:13:27,489 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:13:58,044 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:13:27,489 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1274/17840 [1:53:19<25:34:34, 5.56s/it]g-point operations will not be computed-10 23:13:27,489 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:14:02,139 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:13:27,489 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:14:02,139 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:13:27,489 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:14:02,139 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:13:27,489 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1275/17840 [1:53:24<25:51:06, 5.62s/it]g-point operations will not be computed-10 23:13:27,489 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:14:07,911 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:13:27,489 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:14:10,468 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:13:27,489 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:14:10,468 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:13:27,489 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.8824, 'learning_rate': 2.95083135391924e-05, 'epoch': 1.43} +[WARNING|modeling_utils.py:388] 2022-03-10 23:14:14,366 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:13:27,489 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:14:14,366 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:13:27,489 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1277/17840 [1:53:35<24:54:08, 5.41s/it]g-point operations will not be computed-10 23:13:27,489 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:14:18,201 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:13:27,489 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:14:20,600 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:13:27,489 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:14:20,600 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:13:27,489 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.9188, 'learning_rate': 2.950475059382423e-05, 'epoch': 1.43} +[WARNING|modeling_utils.py:388] 2022-03-10 23:14:24,313 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:13:27,489 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:14:24,313 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:13:27,489 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1279/17840 [1:53:45<23:49:42, 5.18s/it]g-point operations will not be computed-10 23:13:27,489 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:14:28,015 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:13:27,489 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:14:30,331 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:13:27,489 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:14:30,331 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:13:27,489 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:14:32,734 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:13:27,489 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:14:32,734 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:13:27,489 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:14:32,734 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:13:27,489 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1281/17840 [1:53:54<22:45:46, 4.95s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:14:36,212 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:14:38,438 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:14:36,212 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:14:38,438 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:14:36,212 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1282/17840 [1:53:59<22:10:15, 4.82s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:14:40,707 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:14:42,912 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:14:40,707 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:14:42,912 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:14:40,707 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▏ | 1283/17840 [1:54:03<21:37:27, 4.70s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:14:45,077 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:14:47,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:14:45,077 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:14:47,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:14:45,077 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1284/17840 [1:54:07<20:51:25, 4.54s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:14:49,154 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:14:51,024 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:14:49,154 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:14:51,024 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:14:49,154 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1285/17840 [1:54:11<19:54:30, 4.33s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:14:52,918 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:14:54,619 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:14:52,918 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:14:54,619 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:14:52,918 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1286/17840 [1:54:15<18:45:24, 4.08s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:14:56,299 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1287/17840 [1:54:18<17:24:12, 3.78s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:14:59,338 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1287/17840 [1:54:18<17:24:12, 3.78s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:14:59,338 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1288/17840 [1:54:21<16:11:29, 3.52s/it]g-point operations will not be computed-10 23:14:59,338 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1288/17840 [1:54:21<16:11:29, 3.52s/it]g-point operations will not be computed-10 23:14:59,338 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:15:03,521 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:15:02,235 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:15:03,521 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:15:02,235 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1289/17840 [1:54:23<15:01:29, 3.27s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:15:04,795 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1289/17840 [1:54:23<15:01:29, 3.27s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:15:04,795 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1290/17840 [1:54:26<13:43:23, 2.99s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:15:07,047 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1290/17840 [1:54:26<13:43:23, 2.99s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:15:07,047 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1291/17840 [1:54:28<12:22:43, 2.69s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:15:08,975 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1291/17840 [1:54:28<12:22:43, 2.69s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:15:08,975 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1292/17840 [1:54:29<10:59:46, 2.39s/it]g-point operations will not be computed-10 23:15:08,975 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1292/17840 [1:54:29<10:59:46, 2.39s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:15:12,010 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:15:15,370 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:15:12,010 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1293/17840 [1:54:36<17:09:34, 3.73s/it]g-point operations will not be computed-10 23:15:12,010 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1293/17840 [1:54:36<17:09:34, 3.73s/it]g-point operations will not be computed-10 23:15:12,010 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1293/17840 [1:54:36<17:09:34, 3.73s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:15:18,758 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:15:22,058 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:15:18,758 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1294/17840 [1:54:43<21:13:31, 4.62s/it]g-point operations will not be computed-10 23:15:18,758 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1294/17840 [1:54:43<21:13:31, 4.62s/it]g-point operations will not be computed-10 23:15:18,758 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1294/17840 [1:54:43<21:13:31, 4.62s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:15:25,427 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1294/17840 [1:54:43<21:13:31, 4.62s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:15:25,427 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:15:28,716 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:15:25,427 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:15:28,716 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:15:25,427 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1295/17840 [1:54:49<23:58:27, 5.22s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:15:32,006 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1295/17840 [1:54:49<23:58:27, 5.22s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:15:32,006 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:15:35,227 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:15:32,006 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1296/17840 [1:54:56<25:48:17, 5.62s/it]g-point operations will not be computed-10 23:15:32,006 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1296/17840 [1:54:56<25:48:17, 5.62s/it]g-point operations will not be computed-10 23:15:32,006 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.2823, 'learning_rate': 2.947268408551069e-05, 'epoch': 1.45} +[WARNING|modeling_utils.py:388] 2022-03-10 23:15:41,845 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:15:32,006 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1297/17840 [1:55:03<27:10:10, 5.91s/it]g-point operations will not be computed-10 23:15:32,006 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1297/17840 [1:55:03<27:10:10, 5.91s/it]g-point operations will not be computed-10 23:15:32,006 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.0709, 'learning_rate': 2.9470902612826604e-05, 'epoch': 1.45} +[WARNING|modeling_utils.py:388] 2022-03-10 23:15:48,400 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:15:32,006 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1298/17840 [1:55:09<28:01:40, 6.10s/it]g-point operations will not be computed-10 23:15:32,006 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1298/17840 [1:55:09<28:01:40, 6.10s/it]g-point operations will not be computed-10 23:15:32,006 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.1961, 'learning_rate': 2.946912114014252e-05, 'epoch': 1.46} + 7%|█████▎ | 1298/17840 [1:55:09<28:01:40, 6.10s/it]g-point operations will not be computed-10 23:15:32,006 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:15:56,462 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:15:32,006 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:15:56,462 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:15:32,006 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.9854, 'learning_rate': 2.9467339667458434e-05, 'epoch': 1.46} +[WARNING|modeling_utils.py:388] 2022-03-10 23:15:56,462 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:15:32,006 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:15:56,462 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:15:32,006 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:15:56,462 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:15:32,006 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1300/17840 [1:55:22<29:20:56, 6.39s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:16:05,000 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1300/17840 [1:55:22<29:20:56, 6.39s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:16:05,000 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1300/17840 [1:55:22<29:20:56, 6.39s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:16:05,000 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1301/17840 [1:55:29<29:25:07, 6.40s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:16:05,000 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1301/17840 [1:55:29<29:25:07, 6.40s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:16:05,000 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.2246, 'learning_rate': 2.9463776722090263e-05, 'epoch': 1.46} +[WARNING|modeling_utils.py:388] 2022-03-10 23:16:14,469 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:16:05,000 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1302/17840 [1:55:35<29:18:40, 6.38s/it]g-point operations will not be computed-10 23:16:05,000 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1302/17840 [1:55:35<29:18:40, 6.38s/it]g-point operations will not be computed-10 23:16:05,000 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.9933, 'learning_rate': 2.9461995249406174e-05, 'epoch': 1.46} +[WARNING|modeling_utils.py:388] 2022-03-10 23:16:20,714 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:16:05,000 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1303/17840 [1:55:41<29:04:51, 6.33s/it]g-point operations will not be computed-10 23:16:05,000 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1303/17840 [1:55:41<29:04:51, 6.33s/it]g-point operations will not be computed-10 23:16:05,000 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.015, 'learning_rate': 2.9460213776722093e-05, 'epoch': 1.46} +[WARNING|modeling_utils.py:388] 2022-03-10 23:16:26,958 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:16:05,000 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1304/17840 [1:55:48<28:57:46, 6.31s/it]g-point operations will not be computed-10 23:16:05,000 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1304/17840 [1:55:48<28:57:46, 6.31s/it]g-point operations will not be computed-10 23:16:05,000 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.013, 'learning_rate': 2.9458432304038004e-05, 'epoch': 1.46} +[WARNING|modeling_utils.py:388] 2022-03-10 23:16:33,110 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:16:05,000 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1305/17840 [1:55:54<28:45:03, 6.26s/it]g-point operations will not be computed-10 23:16:05,000 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1305/17840 [1:55:54<28:45:03, 6.26s/it]g-point operations will not be computed-10 23:16:05,000 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.0291, 'learning_rate': 2.9456650831353922e-05, 'epoch': 1.46} +[WARNING|modeling_utils.py:388] 2022-03-10 23:16:39,348 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:16:05,000 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1306/17840 [1:56:00<28:48:43, 6.27s/it]g-point operations will not be computed-10 23:16:05,000 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1306/17840 [1:56:00<28:48:43, 6.27s/it]g-point operations will not be computed-10 23:16:05,000 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.0074, 'learning_rate': 2.9454869358669834e-05, 'epoch': 1.46} + 7%|█████▎ | 1306/17840 [1:56:00<28:48:43, 6.27s/it]g-point operations will not be computed-10 23:16:05,000 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:16:47,255 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:16:05,000 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:16:47,255 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:16:05,000 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.8531, 'learning_rate': 2.945308788598575e-05, 'epoch': 1.47} +[WARNING|modeling_utils.py:388] 2022-03-10 23:16:47,255 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:16:05,000 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:16:53,410 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:16:05,000 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:16:53,410 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:16:05,000 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.1087, 'learning_rate': 2.9451306413301663e-05, 'epoch': 1.47} +[WARNING|modeling_utils.py:388] 2022-03-10 23:16:53,410 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:16:05,000 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:16:59,485 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:16:05,000 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:16:59,485 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:16:05,000 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.9014, 'learning_rate': 2.9449524940617578e-05, 'epoch': 1.47} +[WARNING|modeling_utils.py:388] 2022-03-10 23:16:59,485 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:16:05,000 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:17:05,512 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:16:05,000 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:17:05,512 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:16:05,000 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:17:08,504 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:16:05,000 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:17:08,504 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:16:05,000 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1311/17840 [1:56:31<27:55:18, 6.08s/it]g-point operations will not be computed-10 23:16:05,000 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1311/17840 [1:56:31<27:55:18, 6.08s/it]g-point operations will not be computed-10 23:16:05,000 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.0712, 'learning_rate': 2.9445961995249407e-05, 'epoch': 1.47} +[WARNING|modeling_utils.py:388] 2022-03-10 23:17:15,991 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:16:05,000 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1312/17840 [1:56:37<27:47:55, 6.05s/it]g-point operations will not be computed-10 23:16:05,000 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1312/17840 [1:56:37<27:47:55, 6.05s/it]g-point operations will not be computed-10 23:16:05,000 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:17:20,444 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:16:05,000 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:17:20,444 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:16:05,000 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:17:20,444 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:16:05,000 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1313/17840 [1:56:43<27:36:16, 6.01s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:17:24,960 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1313/17840 [1:56:43<27:36:16, 6.01s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:17:24,960 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1313/17840 [1:56:43<27:36:16, 6.01s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:17:24,960 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▎ | 1313/17840 [1:56:43<27:36:16, 6.01s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:17:24,960 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▍ | 1314/17840 [1:56:48<27:31:41, 6.00s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:17:24,960 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:17:32,284 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:17:24,960 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:17:32,284 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:17:24,960 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:17:32,284 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:17:24,960 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▍ | 1315/17840 [1:56:54<27:19:34, 5.95s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:17:36,710 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▍ | 1315/17840 [1:56:54<27:19:34, 5.95s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:17:36,710 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:17:40,973 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:17:36,710 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:17:40,973 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:17:36,710 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.8349, 'learning_rate': 2.943705463182898e-05, 'epoch': 1.48} +[WARNING|modeling_utils.py:388] 2022-03-10 23:17:40,973 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:17:36,710 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:17:46,773 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:17:36,710 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:17:46,773 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:17:36,710 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.9725, 'learning_rate': 2.9435273159144892e-05, 'epoch': 1.48} +[WARNING|modeling_utils.py:388] 2022-03-10 23:17:51,085 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:17:36,710 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▍ | 1318/17840 [1:57:12<26:46:13, 5.83s/it]g-point operations will not be computed-10 23:17:36,710 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▍ | 1318/17840 [1:57:12<26:46:13, 5.83s/it]g-point operations will not be computed-10 23:17:36,710 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:17:55,472 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:17:36,710 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:17:55,472 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:17:36,710 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▍ | 1319/17840 [1:57:17<26:42:06, 5.82s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:17:59,769 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▍ | 1319/17840 [1:57:17<26:42:06, 5.82s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:17:59,769 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.0834, 'learning_rate': 2.9431710213776722e-05, 'epoch': 1.48} +[WARNING|modeling_utils.py:388] 2022-03-10 23:18:03,884 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:17:59,769 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:18:03,884 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:17:59,769 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.0072, 'learning_rate': 2.942992874109264e-05, 'epoch': 1.48} +[WARNING|modeling_utils.py:388] 2022-03-10 23:18:03,884 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:17:59,769 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:18:09,510 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:17:59,769 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:18:09,510 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:17:59,769 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.9393, 'learning_rate': 2.942814726840855e-05, 'epoch': 1.48} +[WARNING|modeling_utils.py:388] 2022-03-10 23:18:13,725 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:17:59,769 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▍ | 1322/17840 [1:57:34<25:59:46, 5.67s/it]g-point operations will not be computed-10 23:17:59,769 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▍ | 1322/17840 [1:57:34<25:59:46, 5.67s/it]g-point operations will not be computed-10 23:17:59,769 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:18:17,846 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:17:59,769 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:18:17,846 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:17:59,769 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▍ | 1323/17840 [1:57:40<25:44:29, 5.61s/it]g-point operations will not be computed-10 23:17:59,769 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▍ | 1323/17840 [1:57:40<25:44:29, 5.61s/it]g-point operations will not be computed-10 23:17:59,769 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:18:23,345 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:17:59,769 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:18:26,069 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:17:59,769 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:18:26,069 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:17:59,769 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.9718, 'learning_rate': 2.9422802850356296e-05, 'epoch': 1.48} +[WARNING|modeling_utils.py:388] 2022-03-10 23:18:30,202 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:17:59,769 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▍ | 1325/17840 [1:57:51<26:00:38, 5.67s/it]g-point operations will not be computed-10 23:17:59,769 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▍ | 1325/17840 [1:57:51<26:00:38, 5.67s/it]g-point operations will not be computed-10 23:17:59,769 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.139, 'learning_rate': 2.942102137767221e-05, 'epoch': 1.49} +[WARNING|modeling_utils.py:388] 2022-03-10 23:18:36,006 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:17:59,769 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▍ | 1326/17840 [1:57:56<25:31:32, 5.56s/it]g-point operations will not be computed-10 23:17:59,769 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▍ | 1326/17840 [1:57:56<25:31:32, 5.56s/it]g-point operations will not be computed-10 23:17:59,769 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:18:39,935 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:17:59,769 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:18:42,459 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:17:59,769 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:18:42,459 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:17:59,769 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.0171, 'learning_rate': 2.941745843230404e-05, 'epoch': 1.49} +[WARNING|modeling_utils.py:388] 2022-03-10 23:18:46,268 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:17:59,769 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:18:46,268 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:17:59,769 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▍ | 1328/17840 [1:58:07<24:31:43, 5.35s/it]g-point operations will not be computed-10 23:17:59,769 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:18:50,143 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:17:59,769 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:18:50,143 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:17:59,769 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:18:52,564 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:17:59,769 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:18:52,564 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:17:59,769 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:18:56,272 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:17:59,769 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:18:56,272 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:17:59,769 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▍ | 1330/17840 [1:58:17<23:34:46, 5.14s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:18:58,744 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:19:01,053 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:18:58,744 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:19:01,053 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:18:58,744 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 7%|█████▍ | 1331/17840 [1:58:21<22:59:16, 5.01s/it]g-point operations will not be computed-10 23:18:58,744 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:19:04,502 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:18:58,744 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:19:04,502 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:18:58,744 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:19:06,651 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:18:58,744 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:19:08,823 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:18:58,744 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:19:10,871 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:18:58,744 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:19:10,871 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:18:58,744 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:19:12,897 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:18:58,744 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:19:12,897 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:18:58,744 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:19:14,745 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:18:58,744 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:19:16,615 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:18:58,744 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:19:16,615 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:18:58,744 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:19:18,322 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:18:58,744 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:19:20,038 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:18:58,744 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:19:20,038 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:18:58,744 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:19:23,162 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:18:58,744 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:19:23,162 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:18:58,744 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:19:24,610 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:18:58,744 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:19:27,345 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:18:58,744 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:19:27,345 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:18:58,744 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:19:28,655 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:18:58,744 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:19:28,655 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:18:58,744 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:19:30,961 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:18:58,744 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:19:30,961 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:18:58,744 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:19:32,941 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:18:58,744 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:19:32,941 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:18:58,744 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:19:34,744 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:18:58,744 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:19:34,744 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:18:58,744 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:19:35,451 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:18:58,744 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:19:39,035 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:18:58,744 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:19:39,035 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:18:58,744 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:19:39,035 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:18:58,744 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:19:42,357 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:18:58,744 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:19:45,743 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:18:58,744 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:19:45,743 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:18:58,744 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:19:45,743 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:18:58,744 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:19:49,029 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:18:58,744 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:19:49,029 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:18:58,744 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:19:52,380 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:18:58,744 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:19:52,380 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:18:58,744 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:19:55,675 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:18:58,744 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:19:55,675 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:18:58,744 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:19:59,028 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:18:58,744 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:20:02,290 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:18:58,744 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:20:02,290 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:18:58,744 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.1642, 'learning_rate': 2.9383610451306413e-05, 'epoch': 1.51} +[WARNING|modeling_utils.py:388] 2022-03-10 23:20:05,660 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:18:58,744 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:20:05,660 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:18:58,744 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:20:05,660 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:18:58,744 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1347/17840 [1:59:28<27:16:01, 5.95s/it]g-point operations will not be computed-10 23:18:58,744 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:20:12,344 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:18:58,744 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:20:12,344 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:18:58,744 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:20:12,344 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:18:58,744 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1348/17840 [1:59:35<28:02:43, 6.12s/it]g-point operations will not be computed-10 23:18:58,744 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1348/17840 [1:59:35<28:02:43, 6.12s/it]g-point operations will not be computed-10 23:18:58,744 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:20:20,429 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:18:58,744 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:20:20,429 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:18:58,744 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1349/17840 [1:59:41<28:32:40, 6.23s/it]g-point operations will not be computed-10 23:18:58,744 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1349/17840 [1:59:41<28:32:40, 6.23s/it]g-point operations will not be computed-10 23:18:58,744 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1349/17840 [1:59:41<28:32:40, 6.23s/it]g-point operations will not be computed-10 23:18:58,744 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1349/17840 [1:59:41<28:32:40, 6.23s/it]g-point operations will not be computed-10 23:18:58,744 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1349/17840 [1:59:41<28:32:40, 6.23s/it]g-point operations will not be computed-10 23:18:58,744 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1350/17840 [1:59:48<29:24:30, 6.42s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:20:30,609 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1350/17840 [1:59:48<29:24:30, 6.42s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:20:30,609 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1350/17840 [1:59:48<29:24:30, 6.42s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:20:30,609 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1350/17840 [1:59:48<29:24:30, 6.42s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:20:30,609 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1351/17840 [1:59:55<29:31:02, 6.44s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:20:37,124 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1351/17840 [1:59:55<29:31:02, 6.44s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:20:37,124 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1351/17840 [1:59:55<29:31:02, 6.44s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:20:37,124 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1351/17840 [1:59:55<29:31:02, 6.44s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:20:37,124 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1352/17840 [2:00:01<29:32:01, 6.45s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:20:43,480 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1352/17840 [2:00:01<29:32:01, 6.45s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:20:43,480 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1352/17840 [2:00:01<29:32:01, 6.45s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:20:43,480 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1352/17840 [2:00:01<29:32:01, 6.45s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:20:43,480 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1353/17840 [2:00:07<29:19:32, 6.40s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:20:43,480 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:20:51,337 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:20:43,480 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:20:51,337 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:20:43,480 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:20:51,337 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:20:43,480 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1354/17840 [2:00:14<29:10:48, 6.37s/it]g-point operations will not be computed-10 23:20:43,480 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1354/17840 [2:00:14<29:10:48, 6.37s/it]g-point operations will not be computed-10 23:20:43,480 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:20:59,151 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:20:43,480 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:20:59,151 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:20:43,480 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1355/17840 [2:00:20<29:02:33, 6.34s/it]g-point operations will not be computed-10 23:20:43,480 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1355/17840 [2:00:20<29:02:33, 6.34s/it]g-point operations will not be computed-10 23:20:43,480 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:21:05,452 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:20:43,480 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:21:05,452 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:20:43,480 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1356/17840 [2:00:26<28:51:57, 6.30s/it]g-point operations will not be computed-10 23:20:43,480 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1356/17840 [2:00:26<28:51:57, 6.30s/it]g-point operations will not be computed-10 23:20:43,480 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:21:11,631 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:20:43,480 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:21:11,631 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:20:43,480 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1357/17840 [2:00:32<28:45:13, 6.28s/it]g-point operations will not be computed-10 23:20:43,480 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1357/17840 [2:00:32<28:45:13, 6.28s/it]g-point operations will not be computed-10 23:20:43,480 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:21:17,751 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:20:43,480 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:21:17,751 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:20:43,480 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1358/17840 [2:00:38<28:29:31, 6.22s/it]g-point operations will not be computed-10 23:20:43,480 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1358/17840 [2:00:38<28:29:31, 6.22s/it]g-point operations will not be computed-10 23:20:43,480 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:21:23,861 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:20:43,480 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:21:23,861 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:20:43,480 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1359/17840 [2:00:45<28:19:49, 6.19s/it]g-point operations will not be computed-10 23:20:43,480 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1359/17840 [2:00:45<28:19:49, 6.19s/it]g-point operations will not be computed-10 23:20:43,480 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:21:29,949 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:20:43,480 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:21:29,949 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:20:43,480 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1360/17840 [2:00:51<28:10:01, 6.15s/it]g-point operations will not be computed-10 23:20:43,480 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1360/17840 [2:00:51<28:10:01, 6.15s/it]g-point operations will not be computed-10 23:20:43,480 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:21:35,921 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:20:43,480 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:21:35,921 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:20:43,480 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1361/17840 [2:00:57<27:55:22, 6.10s/it]g-point operations will not be computed-10 23:20:43,480 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:21:40,439 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:20:43,480 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:21:40,439 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:20:43,480 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:21:40,439 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:20:43,480 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1362/17840 [2:01:03<27:47:11, 6.07s/it]g-point operations will not be computed-10 23:20:43,480 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:21:46,424 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:20:43,480 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:21:46,424 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:20:43,480 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:21:46,424 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:20:43,480 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1363/17840 [2:01:09<27:34:09, 6.02s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:21:50,845 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1363/17840 [2:01:09<27:34:09, 6.02s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:21:50,845 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1363/17840 [2:01:09<27:34:09, 6.02s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:21:50,845 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1363/17840 [2:01:09<27:34:09, 6.02s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:21:50,845 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1364/17840 [2:01:14<27:21:16, 5.98s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:21:56,694 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1364/17840 [2:01:14<27:21:16, 5.98s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:21:56,694 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:22:00,963 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:21:56,694 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:22:00,963 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:21:56,694 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.9649, 'learning_rate': 2.934976247030879e-05, 'epoch': 1.53} +[WARNING|modeling_utils.py:388] 2022-03-10 23:22:00,963 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:21:56,694 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:22:06,784 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:21:56,694 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:22:06,784 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:21:56,694 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.0531, 'learning_rate': 2.93479809976247e-05, 'epoch': 1.53} +[WARNING|modeling_utils.py:388] 2022-03-10 23:22:11,058 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:21:56,694 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1367/17840 [2:01:32<26:42:06, 5.84s/it]g-point operations will not be computed-10 23:21:56,694 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1367/17840 [2:01:32<26:42:06, 5.84s/it]g-point operations will not be computed-10 23:21:56,694 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:22:15,415 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:21:56,694 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:22:15,415 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:21:56,694 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:22:15,415 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:21:56,694 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1368/17840 [2:01:37<26:31:40, 5.80s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:22:19,711 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1368/17840 [2:01:37<26:31:40, 5.80s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:22:19,711 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1368/17840 [2:01:37<26:31:40, 5.80s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:22:19,711 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1368/17840 [2:01:37<26:31:40, 5.80s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:22:19,711 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1369/17840 [2:01:43<26:20:01, 5.76s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:22:25,348 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1369/17840 [2:01:43<26:20:01, 5.76s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:22:25,348 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:22:29,483 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:22:25,348 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:22:29,483 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:22:25,348 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.822, 'learning_rate': 2.934085510688836e-05, 'epoch': 1.54} +[WARNING|modeling_utils.py:388] 2022-03-10 23:22:29,483 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:22:25,348 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:22:35,061 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:22:25,348 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:22:35,061 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:22:25,348 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:22:37,849 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:22:25,348 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:22:37,849 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:22:25,348 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1372/17840 [2:02:00<25:40:14, 5.61s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:22:41,948 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1372/17840 [2:02:00<25:40:14, 5.61s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:22:41,948 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.0069, 'learning_rate': 2.933729216152019e-05, 'epoch': 1.54} +[WARNING|modeling_utils.py:388] 2022-03-10 23:22:46,066 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:22:41,948 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:22:46,066 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:22:41,948 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.9051, 'learning_rate': 2.933551068883611e-05, 'epoch': 1.54} +[WARNING|modeling_utils.py:388] 2022-03-10 23:22:50,159 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:22:41,948 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1374/17840 [2:02:11<25:18:17, 5.53s/it]g-point operations will not be computed-10 23:22:41,948 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▌ | 1374/17840 [2:02:11<25:18:17, 5.53s/it]g-point operations will not be computed-10 23:22:41,948 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:22:54,121 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:22:41,948 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:22:54,121 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:22:41,948 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▋ | 1375/17840 [2:02:16<25:25:26, 5.56s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:22:58,523 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▋ | 1375/17840 [2:02:16<25:25:26, 5.56s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:22:58,523 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.006, 'learning_rate': 2.9331947743467934e-05, 'epoch': 1.54} +[WARNING|modeling_utils.py:388] 2022-03-10 23:23:02,318 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:22:58,523 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:23:02,318 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:22:58,523 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.9758, 'learning_rate': 2.933016627078385e-05, 'epoch': 1.54} +[WARNING|modeling_utils.py:388] 2022-03-10 23:23:06,119 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:22:58,523 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▋ | 1377/17840 [2:02:27<24:22:07, 5.33s/it]g-point operations will not be computed-10 23:22:58,523 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▋ | 1377/17840 [2:02:27<24:22:07, 5.33s/it]g-point operations will not be computed-10 23:22:58,523 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:23:09,877 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:22:58,523 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:23:12,337 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:22:58,523 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:23:12,337 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:22:58,523 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.832, 'learning_rate': 2.932660332541568e-05, 'epoch': 1.54} +[WARNING|modeling_utils.py:388] 2022-03-10 23:23:16,022 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:22:58,523 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▋ | 1379/17840 [2:02:36<23:26:10, 5.13s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:23:18,486 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▋ | 1379/17840 [2:02:36<23:26:10, 5.13s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:23:18,486 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:23:20,857 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:23:18,486 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▋ | 1380/17840 [2:02:41<23:00:16, 5.03s/it]g-point operations will not be computed-10 23:23:18,486 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▋ | 1380/17840 [2:02:41<23:00:16, 5.03s/it]g-point operations will not be computed-10 23:23:18,486 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:23:24,388 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:23:18,486 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:23:26,592 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:23:18,486 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:23:26,592 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:23:18,486 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:23:28,887 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:23:18,486 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:23:31,013 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:23:18,486 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:23:31,013 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:23:18,486 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:23:33,155 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:23:18,486 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:23:35,130 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:23:18,486 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:23:35,130 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:23:18,486 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:23:37,095 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:23:18,486 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:23:38,958 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:23:18,486 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:23:38,958 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:23:18,486 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:23:40,859 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:23:18,486 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:23:42,564 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:23:18,486 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:23:42,564 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:23:18,486 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:23:44,305 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:23:18,486 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:23:47,466 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:23:18,486 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:23:47,466 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:23:18,486 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:23:48,876 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:23:18,486 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:23:48,876 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:23:18,486 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:23:51,515 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:23:18,486 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:23:52,747 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:23:18,486 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:23:52,747 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:23:18,486 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:23:54,880 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:23:18,486 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:23:54,880 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:23:18,486 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:23:57,640 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:23:18,486 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:23:57,640 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:23:18,486 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:23:59,267 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:23:18,486 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:23:59,267 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:23:18,486 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.6792, 'learning_rate': 2.9303444180522567e-05, 'epoch': 1.56} +{'loss': 5.2107, 'learning_rate': 2.9301662707838482e-05, 'epoch': 1.56} +[WARNING|modeling_utils.py:388] 2022-03-10 23:24:02,874 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:23:18,486 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:24:02,874 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:23:18,486 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:24:06,244 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:23:18,486 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:24:06,244 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:23:18,486 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:24:09,664 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:23:18,486 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:24:09,664 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:23:18,486 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:24:13,041 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:23:18,486 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:24:13,041 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:23:18,486 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.4006, 'learning_rate': 2.9298099762470308e-05, 'epoch': 1.56} +[WARNING|modeling_utils.py:388] 2022-03-10 23:24:16,450 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:23:18,486 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:24:16,450 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:23:18,486 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:24:19,730 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:23:18,486 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:24:19,730 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:23:18,486 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:24:23,151 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:23:18,486 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:24:23,151 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:23:18,486 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:24:23,151 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:23:18,486 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:24:26,373 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:23:18,486 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:24:29,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:23:18,486 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:24:29,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:23:18,486 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:24:29,719 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:23:18,486 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▋ | 1397/17840 [2:03:52<27:09:34, 5.95s/it]g-point operations will not be computed-10 23:23:18,486 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▋ | 1397/17840 [2:03:52<27:09:34, 5.95s/it]g-point operations will not be computed-10 23:23:18,486 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:24:37,960 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:23:18,486 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:24:37,960 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:23:18,486 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▋ | 1398/17840 [2:03:59<27:55:06, 6.11s/it]g-point operations will not be computed-10 23:23:18,486 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▋ | 1398/17840 [2:03:59<27:55:06, 6.11s/it]g-point operations will not be computed-10 23:23:18,486 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:24:44,481 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:23:18,486 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:24:44,481 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:23:18,486 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▋ | 1399/17840 [2:04:05<28:33:33, 6.25s/it]g-point operations will not be computed-10 23:23:18,486 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▋ | 1399/17840 [2:04:05<28:33:33, 6.25s/it]g-point operations will not be computed-10 23:23:18,486 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▋ | 1399/17840 [2:04:05<28:33:33, 6.25s/it]g-point operations will not be computed-10 23:23:18,486 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▋ | 1399/17840 [2:04:05<28:33:33, 6.25s/it]g-point operations will not be computed-10 23:23:18,486 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▋ | 1399/17840 [2:04:05<28:33:33, 6.25s/it]g-point operations will not be computed-10 23:23:18,486 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▋ | 1400/17840 [2:04:12<29:27:19, 6.45s/it]g-point operations will not be computed-10 23:23:18,486 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:24:56,308 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:23:18,486 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:24:56,308 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:23:18,486 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:24:56,308 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:23:18,486 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▋ | 1401/17840 [2:04:19<29:27:02, 6.45s/it]g-point operations will not be computed-10 23:23:18,486 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:25:02,727 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:23:18,486 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:25:02,727 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:23:18,486 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:25:02,727 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:23:18,486 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▋ | 1402/17840 [2:04:25<29:23:58, 6.44s/it]g-point operations will not be computed-10 23:23:18,486 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▋ | 1402/17840 [2:04:25<29:23:58, 6.44s/it]g-point operations will not be computed-10 23:23:18,486 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:25:10,649 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:23:18,486 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:25:10,649 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:23:18,486 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▋ | 1403/17840 [2:04:31<29:10:54, 6.39s/it]g-point operations will not be computed-10 23:23:18,486 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▋ | 1403/17840 [2:04:31<29:10:54, 6.39s/it]g-point operations will not be computed-10 23:23:18,486 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:25:16,875 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:23:18,486 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:25:16,875 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:23:18,486 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▋ | 1404/17840 [2:04:38<28:59:13, 6.35s/it]g-point operations will not be computed-10 23:23:18,486 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▋ | 1404/17840 [2:04:38<28:59:13, 6.35s/it]g-point operations will not be computed-10 23:23:18,486 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:25:23,043 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:23:18,486 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:25:23,043 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:23:18,486 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▋ | 1405/17840 [2:04:44<28:43:38, 6.29s/it]g-point operations will not be computed-10 23:23:18,486 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▋ | 1405/17840 [2:04:44<28:43:38, 6.29s/it]g-point operations will not be computed-10 23:23:18,486 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:25:29,241 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:23:18,486 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:25:29,241 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:23:18,486 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1406/17840 [2:04:50<28:32:36, 6.25s/it]g-point operations will not be computed-10 23:23:18,486 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1406/17840 [2:04:50<28:32:36, 6.25s/it]g-point operations will not be computed-10 23:23:18,486 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:25:35,325 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:23:18,486 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:25:35,325 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:23:18,486 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1407/17840 [2:04:56<28:20:26, 6.21s/it]g-point operations will not be computed-10 23:23:18,486 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1407/17840 [2:04:56<28:20:26, 6.21s/it]g-point operations will not be computed-10 23:23:18,486 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:25:41,522 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:23:18,486 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:25:41,522 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:23:18,486 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1408/17840 [2:05:02<28:18:10, 6.20s/it]g-point operations will not be computed-10 23:23:18,486 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1408/17840 [2:05:02<28:18:10, 6.20s/it]g-point operations will not be computed-10 23:23:18,486 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:25:47,610 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:23:18,486 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:25:47,610 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:23:18,486 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1409/17840 [2:05:08<28:09:03, 6.17s/it]g-point operations will not be computed-10 23:23:18,486 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1409/17840 [2:05:08<28:09:03, 6.17s/it]g-point operations will not be computed-10 23:23:18,486 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:25:53,722 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:23:18,486 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:25:53,722 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:23:18,486 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1410/17840 [2:05:14<28:02:18, 6.14s/it]g-point operations will not be computed-10 23:23:18,486 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1410/17840 [2:05:14<28:02:18, 6.14s/it]g-point operations will not be computed-10 23:23:18,486 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:25:59,781 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:23:18,486 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:25:59,781 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:23:18,486 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1411/17840 [2:05:20<27:55:50, 6.12s/it]g-point operations will not be computed-10 23:23:18,486 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:26:04,306 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:23:18,486 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:26:04,306 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:23:18,486 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:26:04,306 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:23:18,486 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1412/17840 [2:05:26<27:46:36, 6.09s/it]g-point operations will not be computed-10 23:23:18,486 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:26:10,287 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:23:18,486 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:26:10,287 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:23:18,486 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:26:10,287 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:23:18,486 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1413/17840 [2:05:32<27:34:34, 6.04s/it]g-point operations will not be computed-10 23:23:18,486 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:26:16,260 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:23:18,486 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:26:16,260 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:23:18,486 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:26:16,260 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:23:18,486 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1414/17840 [2:05:38<27:28:03, 6.02s/it]g-point operations will not be computed-10 23:23:18,486 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:26:22,146 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:23:18,486 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:26:22,146 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:23:18,486 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:26:22,146 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:23:18,486 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1415/17840 [2:05:44<27:14:01, 5.97s/it]g-point operations will not be computed-10 23:23:18,486 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:26:27,995 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:23:18,486 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:26:27,995 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:23:18,486 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:26:27,995 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:23:18,486 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1416/17840 [2:05:50<27:03:52, 5.93s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:26:32,391 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1416/17840 [2:05:50<27:03:52, 5.93s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:26:32,391 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:26:36,714 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:26:32,391 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:26:36,714 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:26:32,391 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.8235, 'learning_rate': 2.925712589073634e-05, 'epoch': 1.59} +[WARNING|modeling_utils.py:388] 2022-03-10 23:26:36,714 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:26:32,391 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:26:42,497 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:26:32,391 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:26:42,497 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:26:32,391 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.801, 'learning_rate': 2.925534441805226e-05, 'epoch': 1.59} +[WARNING|modeling_utils.py:388] 2022-03-10 23:26:46,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:26:32,391 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:26:46,899 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:26:32,391 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1419/17840 [2:06:07<26:41:30, 5.85s/it]g-point operations will not be computed-10 23:26:32,391 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1419/17840 [2:06:07<26:41:30, 5.85s/it]g-point operations will not be computed-10 23:26:32,391 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:26:52,576 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:26:32,391 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:26:52,576 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:26:32,391 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1420/17840 [2:06:13<26:23:42, 5.79s/it]g-point operations will not be computed-10 23:26:32,391 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:26:56,774 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:26:32,391 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:26:59,559 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:26:32,391 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:26:59,559 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:26:32,391 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.0244, 'learning_rate': 2.925e-05, 'epoch': 1.59} +[WARNING|modeling_utils.py:388] 2022-03-10 23:27:03,754 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:26:32,391 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1422/17840 [2:06:24<25:53:36, 5.68s/it]g-point operations will not be computed-10 23:26:32,391 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1422/17840 [2:06:24<25:53:36, 5.68s/it]g-point operations will not be computed-10 23:26:32,391 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.0703, 'learning_rate': 2.9248218527315918e-05, 'epoch': 1.59} +[WARNING|modeling_utils.py:388] 2022-03-10 23:27:09,269 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:26:32,391 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:27:09,269 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:26:32,391 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1423/17840 [2:06:30<25:40:28, 5.63s/it]g-point operations will not be computed-10 23:26:32,391 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:27:13,471 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:26:32,391 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:27:13,471 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:26:32,391 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:27:13,471 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:26:32,391 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1424/17840 [2:06:35<25:31:56, 5.60s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:27:17,548 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1424/17840 [2:06:35<25:31:56, 5.60s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:27:17,548 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:27:21,956 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:27:17,548 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:27:21,956 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:27:17,548 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.7618, 'learning_rate': 2.924287410926366e-05, 'epoch': 1.6} +[WARNING|modeling_utils.py:388] 2022-03-10 23:27:26,050 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:27:17,548 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1426/17840 [2:06:47<25:26:36, 5.58s/it]g-point operations will not be computed-10 23:27:17,548 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1426/17840 [2:06:47<25:26:36, 5.58s/it]g-point operations will not be computed-10 23:27:17,548 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:27:29,971 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:27:17,548 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:27:29,971 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:27:17,548 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:27:29,971 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:27:17,548 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1427/17840 [2:06:52<24:52:06, 5.45s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:27:33,859 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:27:36,350 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:27:33,859 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1428/17840 [2:06:57<24:21:06, 5.34s/it]g-point operations will not be computed-10 23:27:33,859 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1428/17840 [2:06:57<24:21:06, 5.34s/it]g-point operations will not be computed-10 23:27:33,859 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:27:40,166 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:27:33,859 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:27:42,644 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:27:33,859 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:27:42,644 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:27:33,859 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.8137, 'learning_rate': 2.9235748218527317e-05, 'epoch': 1.6} +[WARNING|modeling_utils.py:388] 2022-03-10 23:27:46,367 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:27:33,859 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1430/17840 [2:07:07<23:29:14, 5.15s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:27:48,819 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1430/17840 [2:07:07<23:29:14, 5.15s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:27:48,819 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.8495, 'learning_rate': 2.923396674584323e-05, 'epoch': 1.6} +[WARNING|modeling_utils.py:388] 2022-03-10 23:27:52,316 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:27:48,819 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:27:52,316 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:27:48,819 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.9221, 'learning_rate': 2.9232185273159147e-05, 'epoch': 1.6} +[WARNING|modeling_utils.py:388] 2022-03-10 23:27:55,758 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:27:48,819 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:27:55,758 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:27:48,819 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1432/17840 [2:07:16<22:17:06, 4.89s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:27:58,054 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:28:00,187 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:27:58,054 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:28:00,187 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:27:58,054 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1433/17840 [2:07:20<21:32:34, 4.73s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:28:02,300 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:28:04,260 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:28:02,300 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:28:04,260 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:28:02,300 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1434/17840 [2:07:24<20:32:47, 4.51s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:28:06,282 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1435/17840 [2:07:28<19:34:50, 4.30s/it]g-point operations will not be computed-10 23:28:06,282 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1435/17840 [2:07:28<19:34:50, 4.30s/it]g-point operations will not be computed-10 23:28:06,282 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▊ | 1435/17840 [2:07:28<19:34:50, 4.30s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:28:09,963 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1436/17840 [2:07:32<18:21:57, 4.03s/it]g-point operations will not be computed-10 23:28:09,963 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1436/17840 [2:07:32<18:21:57, 4.03s/it]g-point operations will not be computed-10 23:28:09,963 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:28:14,821 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:28:13,314 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1437/17840 [2:07:35<17:06:41, 3.76s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:28:16,291 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1437/17840 [2:07:35<17:06:41, 3.76s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:28:16,291 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1438/17840 [2:07:37<15:39:05, 3.44s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:28:18,920 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1438/17840 [2:07:37<15:39:05, 3.44s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:28:18,920 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1439/17840 [2:07:40<14:14:11, 3.12s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:28:21,256 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1439/17840 [2:07:40<14:14:11, 3.12s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:28:21,256 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1440/17840 [2:07:42<12:51:14, 2.82s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:28:23,306 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1440/17840 [2:07:42<12:51:14, 2.82s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:28:23,306 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1441/17840 [2:07:44<11:34:09, 2.54s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:28:25,134 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1441/17840 [2:07:44<11:34:09, 2.54s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:28:25,134 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1442/17840 [2:07:45<10:20:47, 2.27s/it]g-point operations will not be computed-10 23:28:25,134 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1442/17840 [2:07:45<10:20:47, 2.27s/it]g-point operations will not be computed-10 23:28:25,134 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1442/17840 [2:07:45<10:20:47, 2.27s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:28:28,101 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1442/17840 [2:07:45<10:20:47, 2.27s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:28:28,101 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1442/17840 [2:07:45<10:20:47, 2.27s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:28:28,101 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1443/17840 [2:07:52<16:41:06, 3.66s/it]g-point operations will not be computed-10 23:28:28,101 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1443/17840 [2:07:52<16:41:06, 3.66s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:28:34,922 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1443/17840 [2:07:52<16:41:06, 3.66s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:28:34,922 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1443/17840 [2:07:52<16:41:06, 3.66s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:28:34,922 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:28:38,231 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:28:34,922 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1444/17840 [2:07:59<20:50:30, 4.58s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:28:41,631 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1444/17840 [2:07:59<20:50:30, 4.58s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:28:41,631 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:28:44,885 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:28:41,631 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:28:44,885 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:28:41,631 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1445/17840 [2:08:06<23:39:07, 5.19s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:28:48,214 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1445/17840 [2:08:06<23:39:07, 5.19s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:28:48,214 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:28:51,485 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:28:48,214 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:28:51,485 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:28:48,214 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1446/17840 [2:08:12<25:33:07, 5.61s/it]g-point operations will not be computed-10 23:28:48,214 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1446/17840 [2:08:12<25:33:07, 5.61s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:28:54,831 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:28:58,055 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:28:54,831 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:28:58,055 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:28:54,831 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1447/17840 [2:08:19<26:49:59, 5.89s/it]g-point operations will not be computed-10 23:28:54,831 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1447/17840 [2:08:19<26:49:59, 5.89s/it]g-point operations will not be computed-10 23:28:54,831 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:29:04,527 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:28:54,831 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:29:04,527 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:28:54,831 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1448/17840 [2:08:25<27:36:30, 6.06s/it]g-point operations will not be computed-10 23:28:54,831 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1448/17840 [2:08:25<27:36:30, 6.06s/it]g-point operations will not be computed-10 23:28:54,831 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:29:10,962 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:28:54,831 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:29:10,962 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:28:54,831 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1449/17840 [2:08:32<28:05:45, 6.17s/it]g-point operations will not be computed-10 23:28:54,831 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1449/17840 [2:08:32<28:05:45, 6.17s/it]g-point operations will not be computed-10 23:28:54,831 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:29:17,367 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:28:54,831 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:29:17,367 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:28:54,831 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1450/17840 [2:08:39<28:56:59, 6.36s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:29:21,063 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1450/17840 [2:08:39<28:56:59, 6.36s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:29:21,063 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1450/17840 [2:08:39<28:56:59, 6.36s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:29:21,063 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1450/17840 [2:08:39<28:56:59, 6.36s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:29:21,063 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1451/17840 [2:08:45<29:04:42, 6.39s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:29:27,517 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1451/17840 [2:08:45<29:04:42, 6.39s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:29:27,517 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1451/17840 [2:08:45<29:04:42, 6.39s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:29:27,517 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1451/17840 [2:08:45<29:04:42, 6.39s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:29:27,517 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1452/17840 [2:08:51<29:10:34, 6.41s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:29:27,517 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:29:35,480 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:29:27,517 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:29:35,480 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:29:27,517 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:29:35,480 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:29:27,517 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1453/17840 [2:08:58<29:04:49, 6.39s/it]g-point operations will not be computed-10 23:29:27,517 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:29:41,760 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:29:27,517 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:29:41,760 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:29:27,517 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:29:41,760 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:29:27,517 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1454/17840 [2:09:04<28:54:17, 6.35s/it]g-point operations will not be computed-10 23:29:27,517 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1454/17840 [2:09:04<28:54:17, 6.35s/it]g-point operations will not be computed-10 23:29:27,517 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:29:49,540 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:29:27,517 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:29:49,540 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:29:27,517 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1455/17840 [2:09:10<28:45:24, 6.32s/it]g-point operations will not be computed-10 23:29:27,517 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1455/17840 [2:09:10<28:45:24, 6.32s/it]g-point operations will not be computed-10 23:29:27,517 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:29:55,797 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:29:27,517 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:29:55,797 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:29:27,517 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1456/17840 [2:09:17<28:39:02, 6.30s/it]g-point operations will not be computed-10 23:29:27,517 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1456/17840 [2:09:17<28:39:02, 6.30s/it]g-point operations will not be computed-10 23:29:27,517 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:30:02,001 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:29:27,517 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:30:02,001 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:29:27,517 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1457/17840 [2:09:23<28:31:57, 6.27s/it]g-point operations will not be computed-10 23:29:27,517 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1457/17840 [2:09:23<28:31:57, 6.27s/it]g-point operations will not be computed-10 23:29:27,517 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:30:08,203 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:29:27,517 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1458/17840 [2:09:29<28:25:22, 6.25s/it]g-point operations will not be computed-10 23:29:27,517 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1458/17840 [2:09:29<28:25:22, 6.25s/it]g-point operations will not be computed-10 23:29:27,517 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.8579, 'learning_rate': 2.918408551068884e-05, 'epoch': 1.63} +[WARNING|modeling_utils.py:388] 2022-03-10 23:30:14,364 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:29:27,517 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1459/17840 [2:09:35<28:15:10, 6.21s/it]g-point operations will not be computed-10 23:29:27,517 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1459/17840 [2:09:35<28:15:10, 6.21s/it]g-point operations will not be computed-10 23:29:27,517 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.0062, 'learning_rate': 2.918230403800475e-05, 'epoch': 1.64} +[WARNING|modeling_utils.py:388] 2022-03-10 23:30:20,435 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:29:27,517 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1460/17840 [2:09:41<28:05:27, 6.17s/it]g-point operations will not be computed-10 23:29:27,517 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1460/17840 [2:09:41<28:05:27, 6.17s/it]g-point operations will not be computed-10 23:29:27,517 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.8479, 'learning_rate': 2.9180522565320668e-05, 'epoch': 1.64} +[WARNING|modeling_utils.py:388] 2022-03-10 23:30:26,567 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:29:27,517 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1461/17840 [2:09:47<28:01:00, 6.16s/it]g-point operations will not be computed-10 23:29:27,517 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1461/17840 [2:09:47<28:01:00, 6.16s/it]g-point operations will not be computed-10 23:29:27,517 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.8372, 'learning_rate': 2.917874109263658e-05, 'epoch': 1.64} +[WARNING|modeling_utils.py:388] 2022-03-10 23:30:32,611 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:29:27,517 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:30:32,611 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:29:27,517 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1462/17840 [2:09:53<27:47:26, 6.11s/it]g-point operations will not be computed-10 23:29:27,517 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:30:37,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:29:27,517 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:30:37,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:29:27,517 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:30:37,103 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:29:27,517 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1463/17840 [2:09:59<27:32:28, 6.05s/it]g-point operations will not be computed-10 23:29:27,517 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:30:43,018 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:29:27,517 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:30:43,018 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:29:27,517 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:30:43,018 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:29:27,517 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1464/17840 [2:10:05<27:24:57, 6.03s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:30:47,509 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1464/17840 [2:10:05<27:24:57, 6.03s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:30:47,509 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1464/17840 [2:10:05<27:24:57, 6.03s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:30:47,509 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1464/17840 [2:10:05<27:24:57, 6.03s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:30:47,509 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1465/17840 [2:10:11<27:11:47, 5.98s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:30:53,334 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|█████▉ | 1465/17840 [2:10:11<27:11:47, 5.98s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:30:53,334 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:30:57,596 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:30:53,334 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:30:57,596 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:30:53,334 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.9785, 'learning_rate': 2.9169833729216153e-05, 'epoch': 1.64} +[WARNING|modeling_utils.py:388] 2022-03-10 23:31:01,976 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:30:53,334 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1467/17840 [2:10:23<26:45:10, 5.88s/it]g-point operations will not be computed-10 23:30:53,334 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1467/17840 [2:10:23<26:45:10, 5.88s/it]g-point operations will not be computed-10 23:30:53,334 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.8827, 'learning_rate': 2.9168052256532068e-05, 'epoch': 1.64} +[WARNING|modeling_utils.py:388] 2022-03-10 23:31:07,775 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:30:53,334 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1468/17840 [2:10:28<26:36:59, 5.85s/it]g-point operations will not be computed-10 23:30:53,334 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1468/17840 [2:10:28<26:36:59, 5.85s/it]g-point operations will not be computed-10 23:30:53,334 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:31:12,055 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:30:53,334 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:31:12,055 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:30:53,334 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:31:12,055 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:30:53,334 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1469/17840 [2:10:34<26:22:32, 5.80s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:31:16,341 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1469/17840 [2:10:34<26:22:32, 5.80s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:31:16,341 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1469/17840 [2:10:34<26:22:32, 5.80s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:31:16,341 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1469/17840 [2:10:34<26:22:32, 5.80s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:31:16,341 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1470/17840 [2:10:40<26:11:26, 5.76s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:31:21,968 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1470/17840 [2:10:40<26:11:26, 5.76s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:31:21,968 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:31:26,066 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:31:21,968 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:31:26,066 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:31:21,968 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.7572, 'learning_rate': 2.9160926365795727e-05, 'epoch': 1.65} +[WARNING|modeling_utils.py:388] 2022-03-10 23:31:30,206 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:31:21,968 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1472/17840 [2:10:51<25:35:29, 5.63s/it]g-point operations will not be computed-10 23:31:21,968 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1472/17840 [2:10:51<25:35:29, 5.63s/it]g-point operations will not be computed-10 23:31:21,968 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:31:34,343 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:31:21,968 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:31:34,343 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:31:21,968 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:31:34,343 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:31:21,968 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1473/17840 [2:10:56<25:24:17, 5.59s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:31:38,459 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1473/17840 [2:10:56<25:24:17, 5.59s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:31:38,459 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:31:42,461 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:31:38,459 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:31:42,461 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:31:38,459 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.6764, 'learning_rate': 2.9155581947743468e-05, 'epoch': 1.65} +[WARNING|modeling_utils.py:388] 2022-03-10 23:31:46,481 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:31:38,459 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1475/17840 [2:11:07<25:28:43, 5.60s/it]g-point operations will not be computed-10 23:31:38,459 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1475/17840 [2:11:07<25:28:43, 5.60s/it]g-point operations will not be computed-10 23:31:38,459 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:31:50,891 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:31:38,459 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:31:50,891 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:31:38,459 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:31:50,891 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:31:38,459 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1476/17840 [2:11:13<24:54:16, 5.48s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:31:54,733 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1476/17840 [2:11:13<24:54:16, 5.48s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:31:54,733 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:31:58,382 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:31:54,733 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:31:58,382 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:31:54,733 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:32:00,911 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:31:54,733 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:32:00,911 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:31:54,733 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:32:00,911 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:31:54,733 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1478/17840 [2:11:23<23:45:21, 5.23s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:32:04,664 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:32:07,065 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:32:04,664 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1479/17840 [2:11:27<23:15:16, 5.12s/it]g-point operations will not be computed-10 23:32:04,664 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1479/17840 [2:11:27<23:15:16, 5.12s/it]g-point operations will not be computed-10 23:32:04,664 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:32:10,643 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:32:04,664 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:32:12,980 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:32:04,664 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:32:12,980 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:32:04,664 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 5.8229, 'learning_rate': 2.9144893111638956e-05, 'epoch': 1.66} + 8%|██████ | 1481/17840 [2:11:37<22:10:21, 4.88s/it]g-point operations will not be computed-10 23:32:04,664 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1481/17840 [2:11:37<22:10:21, 4.88s/it]g-point operations will not be computed-10 23:32:04,664 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1481/17840 [2:11:37<22:10:21, 4.88s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:32:18,743 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:32:20,896 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:32:18,743 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:32:20,896 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:32:18,743 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1482/17840 [2:11:41<21:29:57, 4.73s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:32:23,054 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:32:25,123 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:32:23,054 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:32:25,123 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:32:23,054 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1483/17840 [2:11:45<20:45:21, 4.57s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:32:27,211 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:32:29,168 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:32:27,211 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:32:29,168 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:32:27,211 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██���███ | 1484/17840 [2:11:49<19:59:28, 4.40s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:32:31,174 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:32:32,958 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:32:31,174 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:32:32,958 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:32:31,174 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1485/17840 [2:11:53<19:01:05, 4.19s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:32:34,760 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1486/17840 [2:11:56<17:53:59, 3.94s/it]g-point operations will not be computed-10 23:32:34,760 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1486/17840 [2:11:56<17:53:59, 3.94s/it]g-point operations will not be computed-10 23:32:34,760 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:32:39,602 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:32:38,066 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1487/17840 [2:12:00<16:49:44, 3.70s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:32:41,207 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1487/17840 [2:12:00<16:49:44, 3.70s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:32:41,207 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1488/17840 [2:12:02<15:46:37, 3.47s/it]g-point operations will not be computed-10 23:32:41,207 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1488/17840 [2:12:02<15:46:37, 3.47s/it]g-point operations will not be computed-10 23:32:41,207 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1489/17840 [2:12:05<14:19:32, 3.15s/it]g-point operations will not be computed-10 23:32:43,976 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1489/17840 [2:12:05<14:19:32, 3.15s/it]g-point operations will not be computed-10 23:32:43,976 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1490/17840 [2:12:07<12:56:33, 2.85s/it]g-point operations will not be computed-10 23:32:46,315 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1490/17840 [2:12:07<12:56:33, 2.85s/it]g-point operations will not be computed-10 23:32:46,315 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1491/17840 [2:12:09<11:37:57, 2.56s/it]g-point operations will not be computed-10 23:32:48,397 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1491/17840 [2:12:09<11:37:57, 2.56s/it]g-point operations will not be computed-10 23:32:48,397 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1492/17840 [2:12:11<10:23:49, 2.29s/it]g-point operations will not be computed-10 23:32:50,219 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1492/17840 [2:12:11<10:23:49, 2.29s/it]g-point operations will not be computed-10 23:32:50,219 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1492/17840 [2:12:11<10:23:49, 2.29s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:32:53,177 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1492/17840 [2:12:11<10:23:49, 2.29s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:32:53,177 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:32:56,603 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:32:53,177 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:32:56,603 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:32:53,177 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1493/17840 [2:12:17<16:36:41, 3.66s/it]g-point operations will not be computed-10 23:32:53,177 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1493/17840 [2:12:17<16:36:41, 3.66s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:32:59,975 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:33:03,251 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:32:59,975 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1494/17840 [2:12:24<20:40:19, 4.55s/it]g-point operations will not be computed-10 23:32:59,975 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1494/17840 [2:12:24<20:40:19, 4.55s/it]g-point operations will not be computed-10 23:32:59,975 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1494/17840 [2:12:24<20:40:19, 4.55s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:33:06,600 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:33:09,917 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:33:06,600 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1495/17840 [2:12:31<23:35:30, 5.20s/it]g-point operations will not be computed-10 23:33:06,600 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1495/17840 [2:12:31<23:35:30, 5.20s/it]g-point operations will not be computed-10 23:33:06,600 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1495/17840 [2:12:31<23:35:30, 5.20s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:33:13,278 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:33:16,452 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:33:13,278 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1496/17840 [2:12:37<25:23:32, 5.59s/it]g-point operations will not be computed-10 23:33:13,278 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1496/17840 [2:12:37<25:23:32, 5.59s/it]g-point operations will not be computed-10 23:33:13,278 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1496/17840 [2:12:37<25:23:32, 5.59s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:33:19,814 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1496/17840 [2:12:37<25:23:32, 5.59s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:33:19,814 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████ | 1496/17840 [2:12:37<25:23:32, 5.59s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:33:19,814 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████▏ | 1497/17840 [2:12:44<26:37:23, 5.86s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:33:26,291 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████▏ | 1497/17840 [2:12:44<26:37:23, 5.86s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:33:26,291 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +{'loss': 6.2014, 'learning_rate': 2.9114608076009504e-05, 'epoch': 1.68} + 8%|██████▏ | 1497/17840 [2:12:44<26:37:23, 5.86s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:33:26,291 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████▏ | 1497/17840 [2:12:44<26:37:23, 5.86s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:33:26,291 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████▏ | 1498/17840 [2:12:50<27:25:59, 6.04s/it][WARNING|modeling_utils.py:388] 2022-03-10 23:33:26,291 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:33:34,267 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:33:26,291 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:33:34,267 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:33:26,291 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:33:34,267 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:33:26,291 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed + 8%|██████▏ | 1499/17840 [2:12:57<27:55:22, 6.15s/it]g-point operations will not be computed-10 23:33:26,291 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:33:40,707 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:33:26,291 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[WARNING|modeling_utils.py:388] 2022-03-10 23:33:40,707 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed-10 23:33:26,291 >> Could not estimate the number of tokens of the input, floating-point operations will not be computed +[INFO|trainer.py:2366] 2022-03-10 23:33:44,441 >> Num examples = 2642 | 1500/17840 [2:13:04<28:52:45, 6.36s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. +[INFO|trainer.py:2366] 2022-03-10 23:33:44,441 >> Num examples = 2642 | 1500/17840 [2:13:04<28:52:45, 6.36s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. +{'loss': 5.9849, 'learning_rate': 2.9109263657957245e-05, 'epoch': 1.68} +[INFO|trainer.py:2366] 2022-03-10 23:33:44,441 >> Num examples = 2642 | 1500/17840 [2:13:04<28:52:45, 6.36s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 2%|█▎ | 5/331 [00:04<05:15, 1.03it/s][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 2%|█▊ | 7/331 [00:06<05:52, 1.09s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 2%|██ | 8/331 [00:07<05:56, 1.10s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 3%|██▎ | 9/331 [00:09<06:55, 1.29s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 3%|██▋ | 11/331 [00:12<07:40, 1.44s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 4%|██▉ | 12/331 [00:14<07:38, 1.44s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 4%|███▏ | 13/331 [00:16<07:57, 1.50s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 4%|███▍ | 14/331 [00:17<08:02, 1.52s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 5%|███▋ | 15/331 [00:20<09:27, 1.80s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 5%|███▉ | 16/331 [00:21<09:37, 1.83s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 5%|████▍ | 18/331 [00:24<08:14, 1.58s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 6%|████▋ | 19/331 [00:26<08:35, 1.65s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 6%|████▉ | 20/331 [00:27<07:57, 1.53s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 6%|█████▏ | 21/331 [00:29<07:54, 1.53s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 7%|█████▋ | 23/331 [00:33<09:21, 1.82s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 7%|█████▉ | 24/331 [00:36<10:13, 2.00s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 8%|██████▏ | 25/331 [00:38<10:22, 2.03s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 8%|██████▍ | 26/331 [00:39<09:26, 1.86s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 8%|██████▋ | 27/331 [00:41<09:39, 1.91s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 9%|███████▏ | 29/331 [00:45<09:35, 1.90s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 9%|███████▍ | 30/331 [00:47<09:09, 1.82s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 9%|███████▋ | 31/331 [00:48<08:45, 1.75s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 10%|███████▉ | 32/331 [00:50<08:43, 1.75s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 10%|████████▏ | 33/331 [00:52<08:52, 1.79s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 11%|████████▋ | 35/331 [00:55<08:17, 1.68s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 11%|████████▉ | 36/331 [00:57<08:34, 1.74s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 11%|████████▉ | 36/331 [00:57<08:34, 1.74s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 11%|█████████▍ | 38/331 [01:01<09:07, 1.87s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 12%|█████████▋ | 39/331 [01:02<08:27, 1.74s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 12%|██████████▏ | 41/331 [01:05<07:03, 1.46s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 13%|██████████▍ | 42/331 [01:06<07:26, 1.55s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 13%|██████████▋ | 43/331 [01:09<08:17, 1.73s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 13%|██████████▉ | 44/331 [01:11<08:48, 1.84s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 14%|███████████▏ | 45/331 [01:12<08:42, 1.83s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 14%|███████████▋ | 47/331 [01:15<07:11, 1.52s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 15%|███████████▉ | 48/331 [01:16<07:17, 1.55s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 15%|████████████▏ | 49/331 [01:18<07:47, 1.66s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 15%|████████████▍ | 50/331 [01:20<08:14, 1.76s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 15%|████████████▋ | 51/331 [01:23<08:54, 1.91s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 16%|████████████▉ | 52/331 [01:24<08:36, 1.85s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 16%|█████████████▍ | 54/331 [01:27<07:28, 1.62s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 17%|█████████████▋ | 55/331 [01:29<07:56, 1.73s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 17%|█████████████▊ | 56/331 [01:31<07:35, 1.66s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 17%|██████████████ | 57/331 [01:32<07:12, 1.58s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 18%|██████████████▎ | 58/331 [01:34<08:15, 1.81s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 18%|██████████████▌ | 59/331 [01:36<07:52, 1.74s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 18%|██████████████▊ | 60/331 [01:38<07:52, 1.74s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 19%|███████████████▎ | 62/331 [01:41<07:50, 1.75s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 19%|███████████████▊ | 64/331 [01:45<07:57, 1.79s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 20%|████████████████ | 65/331 [01:47<07:30, 1.69s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 20%|████████████████▎ | 66/331 [01:50<09:16, 2.10s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 20%|████████████████▌ | 67/331 [01:53<10:13, 2.33s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 21%|████████████████▊ | 68/331 [01:54<09:26, 2.15s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 21%|█████████████████ | 69/331 [01:56<09:22, 2.15s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 21%|█████████████████▎ | 70/331 [01:59<09:32, 2.20s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 21%|█████████████████▌ | 71/331 [02:01<09:55, 2.29s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 22%|█████████████████▊ | 72/331 [02:03<08:55, 2.07s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 22%|██████████████████ | 73/331 [02:05<08:29, 1.98s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 22%|██████████████████▎ | 74/331 [02:07<08:33, 2.00s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 23%|██████████████████▌ | 75/331 [02:09<09:06, 2.13s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 23%|██████████████████▊ | 76/331 [02:11<08:40, 2.04s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 23%|███████████████████ | 77/331 [02:13<08:04, 1.91s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 24%|███████████████████▌ | 79/331 [02:15<07:00, 1.67s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 24%|███████████████████▊ | 80/331 [02:17<06:31, 1.56s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 24%|████████████████████ | 81/331 [02:19<07:23, 1.77s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 25%|████████████████████▎ | 82/331 [02:20<06:38, 1.60s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 25%|████████████████████▌ | 83/331 [02:23<08:06, 1.96s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 25%|████████████████████▊ | 84/331 [02:25<08:14, 2.00s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 26%|█████████████████████ | 85/331 [02:27<07:41, 1.88s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 26%|█████████████████████▎ | 86/331 [02:29<07:53, 1.93s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 27%|█████████████████████▊ | 88/331 [02:31<06:32, 1.62s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 27%|██████████████████████ | 89/331 [02:33<05:53, 1.46s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 27%|██████████████████████▎ | 90/331 [02:34<05:56, 1.48s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 28%|██████████████████████▊ | 92/331 [02:37<05:48, 1.46s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 28%|███████████████████████ | 93/331 [02:39<06:15, 1.58s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 28%|███████████████████████▎ | 94/331 [02:41<06:19, 1.60s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 29%|███████████████████████▌ | 95/331 [02:42<06:12, 1.58s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 29%|████████████████████████ | 97/331 [02:45<05:46, 1.48s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 30%|████████████████████████▎ | 98/331 [02:47<06:33, 1.69s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 30%|████████████████████████▍ | 100/331 [02:50<05:34, 1.45s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 31%|████████████████████████▋ | 101/331 [02:51<05:18, 1.39s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 31%|████████████████████████▉ | 102/331 [02:53<06:37, 1.74s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 31%|█████████████████████████▏ | 103/331 [02:55<06:20, 1.67s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 31%|█████████████████████████▍ | 104/331 [02:57<06:15, 1.65s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 32%|█████████████████████████▋ | 105/331 [02:58<06:28, 1.72s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 32%|██████████████████████████▏ | 107/331 [03:02<06:05, 1.63s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 33%|██████████████████████████▍ | 108/331 [03:03<06:05, 1.64s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 33%|██████████████████████████▋ | 109/331 [03:05<05:53, 1.59s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 33%|██████████████████████████▉ | 110/331 [03:07<06:27, 1.75s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 34%|███████████████████████████▍ | 112/331 [03:10<05:48, 1.59s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 34%|███████████████████████████▋ | 113/331 [03:11<05:33, 1.53s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 34%|███████████████████████████▉ | 114/331 [03:13<05:29, 1.52s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 35%|████████████████████████████▍ | 116/331 [03:16<05:25, 1.51s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 35%|████████████████████████████▋ | 117/331 [03:17<05:09, 1.45s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 36%|████████████████████████████▉ | 118/331 [03:19<05:11, 1.46s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 36%|█████████████████████████████▎ | 120/331 [03:22<05:18, 1.51s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 37%|█████████████████████████████▌ | 121/331 [03:24<05:45, 1.64s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 37%|█████��███████████████████████▊ | 122/331 [03:25<05:42, 1.64s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 37%|██████████████████████████████ | 123/331 [03:27<05:51, 1.69s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 37%|██████████████████████████████▎ | 124/331 [03:29<05:40, 1.64s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 38%|██████████████████████████████▌ | 125/331 [03:30<05:54, 1.72s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 38%|██████████████████████████████▊ | 126/331 [03:33<06:23, 1.87s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 38%|███████████████████████████████ | 127/331 [03:35<07:04, 2.08s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 39%|███████████████████████████████▎ | 128/331 [03:38<07:28, 2.21s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 39%|███████████████████████████████▌ | 129/331 [03:40<07:30, 2.23s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 39%|███████████████████████████████▊ | 130/331 [03:42<07:24, 2.21s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 40%|████████████████████████████████▎ | 132/331 [03:46<06:34, 1.98s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 40%|████████████████████████████████▌ | 133/331 [03:47<06:08, 1.86s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 40%|████████████████████████████████▊ | 134/331 [03:49<05:57, 1.81s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 41%|█████████████████████████████████ | 135/331 [03:51<05:39, 1.73s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 41%|█████████████████████████████████▎ | 136/331 [03:52<05:32, 1.70s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 41%|█████████████████████████████████▌ | 137/331 [03:55<06:26, 1.99s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 42%|█████████████████████████████████▊ | 138/331 [03:57<06:56, 2.16s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 42%|██████████████████████████████████ | 139/331 [03:59<06:04, 1.90s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 42%|██████████████████████████████████▎ | 140/331 [04:01<06:52, 2.16s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 43%|██████████████████████████████████▌ | 141/331 [04:03<06:00, 1.90s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 43%|██████████████████████████████████▉ | 143/331 [04:06<05:45, 1.84s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 44%|███████████████████████████████████▏ | 144/331 [04:08<05:46, 1.85s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 44%|███████████████████████████████████▍ | 145/331 [04:10<05:40, 1.83s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 44%|███████████████████████████████████▋ | 146/331 [04:12<05:41, 1.84s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 44%|███████████████████████████████████▉ | 147/331 [04:13<05:25, 1.77s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 45%|████████████████████████████████████▍ | 149/331 [04:16<04:46, 1.57s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 45%|████████████████████████████████████▋ | 150/331 [04:18<05:00, 1.66s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 46%|████████████████████████████████████▉ | 151/331 [04:19<04:51, 1.62s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 46%|█████████████████████████████████████▍ | 153/331 [04:22<04:31, 1.52s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 47%|█████████████████████████████████████▋ | 154/331 [04:24<04:39, 1.58s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 47%|█████████████████████████████████████▉ | 155/331 [04:27<05:27, 1.86s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 47%|██████████████████████████████████████▏ | 156/331 [04:29<05:53, 2.02s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 47%|██████████████████████████████████████▍ | 157/331 [04:31<06:03, 2.09s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 48%|██████████████████████████████████████▉ | 159/331 [04:34<05:19, 1.86s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 48%|███████████████████████████████████████▏ | 160/331 [04:36<05:07, 1.80s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 49%|███████████████████████████████████████▍ | 161/331 [04:37<04:43, 1.67s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 49%|███████████████████████████████████████▋ | 162/331 [04:39<04:54, 1.74s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 49%|███████████████████████████████████████▉ | 163/331 [04:42<05:21, 1.91s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 50%|████████████████████████████████████████▏ | 164/331 [04:43<04:42, 1.69s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 50%|████████████████████████████████████████▍ | 165/331 [04:45<04:58, 1.80s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 50%|████████████████████████████████████████▌ | 166/331 [04:47<05:04, 1.84s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 51%|█████████████████████████████████████████ | 168/331 [04:50<04:45, 1.75s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 51%|█████████████████████████████████████████▎ | 169/331 [04:52<04:43, 1.75s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 51%|█████████████████████████████████████████▌ | 170/331 [04:54<04:31, 1.69s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 52%|██████████████████████████████████████████ | 172/331 [04:57<04:06, 1.55s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 52%|██████████████████████████████████████████▎ | 173/331 [04:58<03:59, 1.51s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 53%|██████████████████████████████████████████▊ | 175/331 [05:01<03:49, 1.47s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 53%|███████████████████████████████████████████ | 176/331 [05:02<03:58, 1.54s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 53%|███████████████████████████████████████████▎ | 177/331 [05:04<04:12, 1.64s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 54%|███████████████████████████████████████████▌ | 178/331 [05:07<04:56, 1.94s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 54%|████████████████████████████████████████████ | 180/331 [05:11<04:50, 1.92s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 55%|██████████████████████���█████████████████████▎ | 181/331 [05:13<04:48, 1.92s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 55%|████████████████████████████████████████████▌ | 182/331 [05:14<04:28, 1.81s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 55%|████████████████████████████████████████████▊ | 183/331 [05:16<04:11, 1.70s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 56%|█████████████████████████████████████████████▎ | 185/331 [05:18<03:26, 1.41s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 56%|█████████████████████████████████████████████▌ | 186/331 [05:20<03:45, 1.56s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 56%|█████████████████████████████████████████████▊ | 187/331 [05:22<04:04, 1.70s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 57%|██████████████████████████████████████████████ | 188/331 [05:24<04:02, 1.70s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 57%|██████████████████████████████████████████████▍ | 190/331 [05:27<03:45, 1.60s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 58%|██████████████████████████████████████████████▋ | 191/331 [05:28<03:46, 1.62s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 58%|██████████████████████████████████████████████▉ | 192/331 [05:30<03:51, 1.66s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 58%|███████████████████████████████████████████████▏ | 193/331 [05:32<04:06, 1.79s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 59%|███████████████████████████████████████████████▋ | 195/331 [05:35<03:26, 1.52s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 59%|███████████████████████████████████████████████▉ | 196/331 [05:37<03:38, 1.62s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 60%|████████████████████████████████████████████████▏ | 197/331 [05:38<03:26, 1.54s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 60%|████████████████████████████████████████████████▋ | 199/331 [05:41<03:19, 1.51s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 60%|████████████████████████████████████████████████▉ | 200/331 [05:42<03:15, 1.49s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 61%|█████████████████████████████████████████████████▏ | 201/331 [05:44<03:16, 1.52s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 61%|█████████████████████████████████████████████████▍ | 202/331 [05:46<03:23, 1.58s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 61%|█████████████████████████████████████████████████▋ | 203/331 [05:48<03:37, 1.70s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 62%|█████████████████████████████████████████████████▉ | 204/331 [05:50<03:51, 1.82s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 62%|██████████████████████████████████████████████████▏ | 205/331 [05:52<03:57, 1.88s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 62%|██████████████████████████████████████████████████▍ | 206/331 [05:53<03:47, 1.82s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 63%|██████████████████████████████████████████████████▋ | 207/331 [05:56<04:14, 2.06s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 63%|██████████████████████████████████████████████████▉ | 208/331 [05:58<04:22, 2.13s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 63%|███████████████████████████████████████████████████▏ | 209/331 [06:00<03:59, 1.96s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 63%|███████████████████████████████████████████████████▍ | 210/331 [06:01<03:41, 1.83s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 64%|███████████████████████████████████████████████████▋ | 211/331 [06:04<03:50, 1.92s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 64%|████████████████████████████████████████████████████ | 213/331 [06:07<03:25, 1.74s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 65%|████████████████████████████████████████████████████▎ | 214/331 [06:08<03:15, 1.67s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 65%|████████████████████████████████████████████████████▌ | 215/331 [06:10<03:05, 1.60s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 65%|████████████████████████████████████████████████████▊ | 216/331 [06:12<03:32, 1.85s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 66%|█████████████████████████████████████████████████████ | 217/331 [06:14<03:21, 1.77s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 66%|█████████████████████████████████████████████████████▎ | 218/331 [06:16<03:26, 1.82s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 66%|█████████████████████████████████████████████████████▊ | 220/331 [06:19<03:06, 1.68s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 67%|██████████████████████████████████████████████████████ | 221/331 [06:21<03:04, 1.67s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 67%|██████████████████████████████████████████████████████▎ | 222/331 [06:22<03:01, 1.66s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 67%|██████████████████████████████████████████████████████▌ | 223/331 [06:24<03:10, 1.76s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 68%|██████████████████████████████████████████████████████▊ | 224/331 [06:26<03:16, 1.84s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 68%|█████████████████████████████████████████████��█████████ | 225/331 [06:28<03:09, 1.79s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 68%|███████████████████████████████████████████████████████▎ | 226/331 [06:30<03:27, 1.97s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 69%|███████████████████████████████████████████████████████▌ | 227/331 [06:32<03:16, 1.89s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 69%|████████████████████████████████████████████████████████ | 229/331 [06:35<02:50, 1.68s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 69%|████████████████████████████████████████████████████████▎ | 230/331 [06:36<02:42, 1.61s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 70%|████████████████████████████████████████████████████████▌ | 231/331 [06:38<02:46, 1.67s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 70%|████████████████████████████████████████████████████████▊ | 232/331 [06:40<02:46, 1.69s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 70%|█████████████████████████████████████████████████████████ | 233/331 [06:42<02:57, 1.81s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 71%|█████████████████████████████████████████████████████████▎ | 234/331 [06:44<02:54, 1.80s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 71%|█████████████████████████████████████████████████████████▌ | 235/331 [06:45<02:45, 1.72s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 71%|█████████████████████████████████████████████████████████▊ | 236/331 [06:48<03:19, 2.10s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 72%|█████████████████████████████████████████████████████████▉ | 237/331 [06:51<03:18, 2.11s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 72%|██████████████████████████████████████████████████████████▏ | 238/331 [06:52<03:09, 2.03s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 72%|██████████████████████████████████████████████████████████▍ | 239/331 [06:55<03:14, 2.12s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 73%|██████████████████████████████████████████████████████████▋ | 240/331 [06:57<03:26, 2.27s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 73%|██████████████████████████████████████████████████████████▉ | 241/331 [07:00<03:40, 2.45s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 73%|███████████████████████████████████████████████████████████▏ | 242/331 [07:02<03:32, 2.39s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 73%|███████████████████████████████████████████████████████████▍ | 243/331 [07:04<03:17, 2.24s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 74%|███████████████████████████████████████████████████████████▋ | 244/331 [07:07<03:15, 2.24s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 74%|███████████████████████████████████████████████████████████▉ | 245/331 [07:09<03:13, 2.25s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 74%|████████████████████████████████████████████████████████████▏ | 246/331 [07:12<03:32, 2.50s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 75%|████████████████████████████████████████████████████████████▍ | 247/331 [07:14<03:25, 2.45s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 75%|████████████████████████████████████████████████████████████▋ | 248/331 [07:16<03:09, 2.28s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 76%|█████████████████████████████████████████████████████████████▏ | 250/331 [07:19<02:38, 1.96s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 76%|█████████████████████████████████████████████████████████████▍ | 251/331 [07:21<02:34, 1.94s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 76%|█████████████████████████████████████████████████████████████▋ | 252/331 [07:23<02:21, 1.79s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 76%|█████████████████████████████████████████████████████████████▉ | 253/331 [07:25<02:33, 1.97s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 77%|██████████████████████████████████████████████████████████████▏ | 254/331 [07:27<02:31, 1.96s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 77%|██████████████████████████████████████████████████████████████▍ | 255/331 [07:29<02:35, 2.04s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 77%|██████████████████████████████████████████████████████████████▋ | 256/331 [07:31<02:16, 1.82s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 78%|██████████████████████████████████████████████████████████████▉ | 257/331 [07:33<02:26, 1.98s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 78%|███████████████████████████████████████████████████████████████▏ | 258/331 [07:34<02:07, 1.75s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 78%|███████████████████████████████████████████████████████████████▍ | 259/331 [07:36<02:11, 1.83s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 79%|███████████████████████████████████████████████████████████████▊ | 261/331 [07:39<01:49, 1.57s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 79%|████████████████████████████████████████████████████████████████ | 262/331 [07:41<01:56, 1.68s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 79%|████████████████████████████████████████████████████████████████▎ | 263/331 [07:43<02:09, 1.90s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 80%|████████████████████████████████████████████████████████████████▌ | 264/331 [07:45<02:03, 1.84s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 80%|████████████████████████████████████████████████████████████████▊ | 265/331 [07:46<01:51, 1.70s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 80%|█████████████████████████████████████████████████████████████████ | 266/331 [07:48<01:45, 1.63s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 81%|█████████████████████████████████████████████████████████████████▌ | 268/331 [07:52<01:49, 1.75s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 81%|█████████████████████████████████████████████████████████████████▊ | 269/331 [07:54<01:58, 1.91s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 82%|██████████████████████████████████████████████████████████████████ | 270/331 [07:56<02:00, 1.98s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 82%|██████████████████████████████████████████████████████████████████▎ | 271/331 [07:58<01:58, 1.97s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 82%|██████████████████████████████████████████████████████████████████▌ | 272/331 [08:00<01:55, 1.95s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 82%|██████████████████████████████████████████████████████████████████▊ | 273/331 [08:02<01:54, 1.97s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 83%|███████████████████████████████████████████████████████████████████ | 274/331 [08:05<02:05, 2.20s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 83%|███████████████████████████████████████████████████████████████████▎ | 275/331 [08:07<02:04, 2.23s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 83%|███████████████████████████████████████████████████████████████████▌ | 276/331 [08:09<01:55, 2.11s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 84%|████████████████████████████████████████████████████████████████████ | 278/331 [08:12<01:34, 1.79s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 84%|████████████████████████████████████████████████████████████████████▎ | 279/331 [08:15<01:50, 2.13s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 85%|████████████████████████████████████████████████████████████████████▌ | 280/331 [08:17<01:49, 2.14s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 85%|████████████████████████████████████████████████████████████████████▊ | 281/331 [08:19<01:54, 2.29s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 85%|█████████████████████████████████████████████████████████████████████ | 282/331 [08:21<01:48, 2.21s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 85%|█████████████████████████████████████████████████████████████████████▎ | 283/331 [08:24<01:44, 2.18s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 86%|█████████████████████████████████████████████████████████████████████▍ | 284/331 [08:25<01:37, 2.08s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 86%|█████████████████████████████████████████████████████████████████████▋ | 285/331 [08:28<01:38, 2.14s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 86%|█████████████████████████████████████████████████████████████████████▉ | 286/331 [08:30<01:40, 2.24s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 87%|██████████████████████████████████████████████████████████████████████▍ | 288/331 [08:34<01:32, 2.15s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 87%|██████████████████████████████████████████████████████████████████████▋ | 289/331 [08:36<01:21, 1.94s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 88%|██████████████████████████████████████████████████████████████████████▉ | 290/331 [08:37<01:12, 1.76s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 88%|███████████████████████████████████████████████████████████████████████▏ | 291/331 [08:39<01:10, 1.77s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 89%|███████████████████████████████████████████████████████████████████████▋ | 293/331 [08:42<01:03, 1.68s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 89%|███████████████████████████████████████████████████████████████████████▉ | 294/331 [08:44<01:01, 1.66s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 89%|████████████████████████████████████████████████████████████████████████▏ | 295/331 [08:46<01:01, 1.69s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 89%|████████████████████████████████████████████████████████████████████████▍ | 296/331 [08:47<00:55, 1.60s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 90%|████████████████████████████████████████████████████████████████████████▋ | 297/331 [08:49<01:03, 1.88s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 90%|████████████████████████████████████████████████████████████████████████▉ | 298/331 [08:52<01:11, 2.17s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 90%|█████████████████████████████████████████████████████████████████████████▏ | 299/331 [08:54<01:03, 1.98s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 91%|█████████████████████████████████████████████████████████████████████████▍ | 300/331 [08:55<00:57, 1.86s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 91%|█████████████████████████████████████████████████████████████████████████▋ | 301/331 [08:57<00:53, 1.80s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 92%|██████████████████████████████████████████████████████████████████████████▏ | 303/331 [09:00<00:48, 1.74s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 92%|██████████████████████████████████████████████████████████████████████████▍ | 304/331 [09:03<00:51, 1.90s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 92%|██████████████████████████████████████████████████████████████████████████▋ | 305/331 [09:04<00:48, 1.87s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 92%|██████████████████████████████████████████████████████████████████████████▉ | 306/331 [09:07<00:53, 2.14s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 93%|███████████████████████████████████████████████████████████████████████████▏ | 307/331 [09:09<00:50, 2.10s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 93%|███████████████████████████████████████████████████████████████████████████▎ | 308/331 [09:11<00:48, 2.12s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 93%|███████████████████████████████████████████████████████████████████████████▌ | 309/331 [09:14<00:50, 2.31s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 94%|███████████████████████████████████████████████████████████████████████████▊ | 310/331 [09:16<00:43, 2.09s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 94%|████████████████████████████████████████████████████████████████████████████ | 311/331 [09:18<00:43, 2.18s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 94%|████████████████████████████████████████████████████████████████████████████▎ | 312/331 [09:20<00:37, 1.99s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 95%|████████████████████████████████████████████████████████████████████████████▌ | 313/331 [09:21<00:33, 1.87s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 95%|████████████████████████████████��███████████████████████████████████████████▊ | 314/331 [09:24<00:33, 2.00s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 95%|█████████████████████████████████████████████████████████████████████████████ | 315/331 [09:26<00:31, 1.98s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 95%|█████████████████████████████████████████████████████████████████████████████▎ | 316/331 [09:28<00:29, 1.98s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 96%|█████████████████████████████████████████████████████████████████████████████▌ | 317/331 [09:30<00:28, 2.01s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 96%|██████████████████████████████████████████████████████████████████████████████ | 319/331 [09:32<00:20, 1.70s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 97%|██████████████████████████████████████████████████████████████████████████████▎ | 320/331 [09:34<00:19, 1.75s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 97%|██████████████████████████████████████████████████████████████████████████████▌ | 321/331 [09:36<00:18, 1.82s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 98%|███████████████████████████████████████████████████████████████████████████████ | 323/331 [09:40<00:14, 1.84s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 98%|███████████████████████████████████████████████████████████████████████████████▎ | 324/331 [09:43<00:14, 2.00s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 98%|███████████████████████████████████████████████████████████████████████████████▎ | 324/331 [09:43<00:14, 2.00s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 98%|███████████████████████████████████████████████████████████████████████████████▎ | 324/331 [09:43<00:14, 2.00s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 98%|███████████████████████████████████████████████████████████████████████████████▊ | 326/331 [09:47<00:10, 2.06s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 99%|████████████████████████████████████████████████████████████████████████████████ | 327/331 [09:49<00:08, 2.14s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. + 99%|████████████████████████████████████████████████████████████████████████████████▌| 329/331 [09:53<00:04, 2.04s/it][INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. +[INFO|configuration_utils.py:438] 2022-03-10 23:43:43,511 >> Configuration saved in ./checkpoint-1500/config.json [INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. +[INFO|configuration_utils.py:438] 2022-03-10 23:43:43,511 >> Configuration saved in ./checkpoint-1500/config.json [INFO|trainer.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. +03/10/2022 23:43:43 - INFO - datasets.metric - Removing /home/sanchit_huggingface_co/.cache/huggingface/metrics/wer/default/default_experiment-1-0.arrow +[INFO|feature_extraction_utils.py:324] 2022-03-10 23:43:47,402 >> Configuration saved in ./checkpoint-1500/preprocessor_config.jsoner.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. +[INFO|feature_extraction_utils.py:324] 2022-03-10 23:43:47,402 >> Configuration saved in ./checkpoint-1500/preprocessor_config.jsoner.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. +[INFO|feature_extraction_utils.py:324] 2022-03-10 23:43:47,402 >> Configuration saved in ./checkpoint-1500/preprocessor_config.jsoner.py:560] 2022-03-10 23:33:44,439 >> The following columns in the evaluation set don't have a corresponding argument in `SpeechEncoderDecoderModel.forward` and have been ignored: input_length. If input_length are not expected by `SpeechEncoderDecoderModel.forward`, you can safely ignore this message. +03/10/2022 23:44:01 - WARNING - huggingface_hub.repository - Adding files tracked by Git LFS: ['wandb/run-20220310_212039-1nikmzrh/run-1nikmzrh.wandb']. This may take a bit of time if the files are large.